Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Drop duplicate subject hits from a BLAST tabular (outfmt 6) report.

Usage: ``python script.py -in hits.tsv`` writes ``hits.tsv.filtred``.
"""
import argparse

import pandas as pd

# Column names assigned to the headerless input table, in file order.
header_outfmt6 = [
    'qseqid', 'sseqid', 'pident', 'length', 'mismatch', 'gapopen',
    'qstart', 'qend', 'sstart', 'send', 'evalue', 'bitscore',
]


def filter_duplicates(read_file):
    """Write a copy of *read_file* without duplicated subject hits.

    Rows are considered duplicates when they share the same ``sseqid``,
    ``sstart`` and ``send``; the first occurrence of each is kept.

    Args:
        read_file: Path to a tab-separated table with no header row and the
            twelve columns listed in ``header_outfmt6``.

    Returns:
        The path of the written file, which is ``read_file + '.filtred'``.
    """
    # The delimiter must be a real tab character ('\t'); a bare 't' would
    # split every row on the letter "t" and corrupt the table.
    df = pd.read_csv(read_file, sep='\t', header=None, names=header_outfmt6)
    df_2 = df.drop_duplicates(subset=['sseqid', 'sstart', 'send'])

    out_csv = read_file + '.filtred'
    # NOTE(review): pandas defaults are kept here, so the output gains a
    # header row and a leading index column and is no longer plain
    # outfmt 6 -- confirm whether header=False/index=False is wanted.
    df_2.to_csv(out_csv, sep='\t')
    return out_csv


def main(argv=None):
    """Parse the command line and filter the requested file.

    Args:
        argv: Argument list to parse; ``None`` means ``sys.argv[1:]``.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("-in", "--input", help="blast outfmt 6 formata", required=True)
    args = parser.parse_args(argv)
    filter_duplicates(args.input)


if __name__ == "__main__":
    main()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement