Guest User

Untitled

a guest
Dec 14th, 2018
93
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.75 KB | None | 0 0
  1. codon_table = {
  2. "UUU": "F", "UUC": "F", "UUA": "L", "UUG": "L", "UCU": "S",
  3. "UCC": "S", "UCA": "S", "UCG": "S", "UAU": "Y", "UAC": "Y",
  4. "UAA": "_", "UAG": "_", "UGA": "_", "UGU": "C", "UGC": "C",
  5. "UGG": "W", "CUU": "L", "CUC": "L", "CUA": "L", "CUG": "L",
  6. "CCU": "P", "CCC": "P", "CCA": "P", "CCG": "P", "CAU": "H",
  7. "CAC": "H", "CAA": "Q", "CAG": "Q", "CGU": "R", "CGC": "R",
  8. "CGA": "R", "CGG": "R", "AUU": "I", "AUC": "I", "AUA": "I",
  9. "AUG": "M", "ACU": "T", "ACC": "T", "ACA": "T", "ACG": "T",
  10. "AAU": "N", "AAC": "N", "AAA": "K", "AAG": "K", "AGU": "S",
  11. "AGC": "S", "AGA": "R", "AGG": "R", "GUU": "V", "GUC": "V",
  12. "GUA": "V", "GUG": "V", "GCU": "A", "GCC": "A", "GCA": "A",
  13. "GCG": "A", "GAU": "D", "GAC": "D", "GAA": "E", "GAG": "E",
  14. "GGU": "G", "GGC": "G", "GGA": "G", "GGG": "G"}
  15.  
  16. >seq1
  17. ATGCTGATGATAGGTATGGGTA
  18. GATAGATGAGAGAGATGAGAAT
  19. >seq2
  20. ATGCGATGATAGATG
  21. >seq3
  22. ATGC
  23.  
  24. def dna_to_protein(inputFilename, outputFilename="protein.fasta"):
  25. inputFile = open(inputFilename, "r")
  26. outputFile = open(outputFilename, "w")
  27. for line in inputFile:
  28. line = line.strip()
  29. if line and not line.startswith('>'):
  30. line = line.replace("T","U")
  31. for i in range(0,len(line),3):
  32. codon=line[i:i+3]
  33. if len(codon) == 3:
  34. amino=codon_table[codon]
  35. if amino != "_":
  36. line = line + amino
  37. elif amino == "_":
  38. line = line + amino
  39. return line
  40. print(line, file=outputFile)
  41.  
  42.  
  43. dna_to_protein("dna.fasta", "protein.fasta")
  44.  
  45. >seq1
  46. MLMIGMGR_MREMRX
  47. >seq2
  48. MR__M
  49. >seq3
  50. MX
Add Comment
Please, Sign In to add comment