Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Report which names from column 6 of the assembly-details table also occur
# as the second and third whitespace-separated tokens of a PATRIC genome row.
# NOTE(review): both are presumably "Genus species" names -- confirm against
# the headers of the two input files.

PATRIC_PATH = 'PATRIC_genome.txt'
ASSEMBLY_PATH = 'PRJNA348753_AssemblyDetails.txt'

# Zero-based index of the tab-separated field read from each assembly row.
ASSEMBLY_NAME_FIELD = 5


def assembly_species(lines):
    """Return field 6 of every tab-separated row that has that field.

    ``lines`` is any iterable of text lines (an open file works).  Rows with
    fewer than six fields are skipped instead of raising IndexError.  The
    line terminator is removed first so that a name sitting in the last
    column does not carry a trailing newline.
    """
    names = []
    for raw in lines:
        fields = raw.rstrip('\r\n').split('\t')
        if len(fields) > ASSEMBLY_NAME_FIELD:
            names.append(fields[ASSEMBLY_NAME_FIELD])
    return names


def patric_species(lines):
    """Return "<token 2> <token 3>" for every PATRIC row with three tokens.

    Double quotes are dropped and tabs are treated as spaces before the row
    is split on single spaces, so the tokens after the first one come from
    whatever follows the first column.  Rows with fewer than three tokens
    (blank lines, for example) are skipped instead of raising IndexError.
    """
    names = []
    for raw in lines:
        cleaned = raw.rstrip('\r\n').replace('"', '').replace('\t', ' ')
        tokens = cleaned.split(' ')
        if len(tokens) > 2:
            names.append(tokens[1] + ' ' + tokens[2])
    return names


def shared_species(assembly_names, patric_names):
    """Return the distinct assembly names that also appear in patric_names.

    The result keeps the order of first appearance in ``assembly_names``.
    """
    known = set(patric_names)  # O(1) membership instead of a nested scan
    already_reported = set()
    shared = []
    for name in assembly_names:
        if name in known and name not in already_reported:
            already_reported.add(name)
            shared.append(name)
    return shared


def main():
    """Read both input files and print the shared names and their count."""
    # ``with`` closes each file even if parsing raises.
    with open(ASSEMBLY_PATH, 'r') as queen:
        queenlist = assembly_species(queen)
    with open(PATRIC_PATH, 'r') as pat:
        patlist = patric_species(pat)

    newlist = shared_species(queenlist, patlist)
    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    print(newlist)
    print(len(newlist))


if __name__ == '__main__':
    main()
Add Comment
Please, Sign In to add comment