Advertisement
Not a member of Pastebin yet? Sign up — it unlocks many cool features!
def get_not_overlapping_read():
    """Return a fixture read made of three non-overlapping alignment blocks.

    The result is a nested dict ``{read_name: {(read_start, read_stop): block}}``
    where every ``block`` is a dict with the keys ``ReadId``, ``ReadSize``,
    ``ReadStart``, ``ReadStop``, ``Strand``, ``GeneId``, ``GeneSize``,
    ``GeneStart``, ``GeneStop``, ``AlignIdentity``, ``AlignGap``,
    ``AlignSize``, ``GeneString``, ``ReadString`` and ``AlignString``.

    ``AlignString`` is derived from the gapped ``ReadString``/``GeneString``
    pair ("|" where both columns hold the same character, " " otherwise)
    instead of being hard-coded: a hand-pasted match line loses characters as
    soon as a run of spaces is collapsed, which makes it shorter than
    ``AlignSize`` and shifts every following column.
    """
    gene_id = "ENSMUSG00000000827"
    read_name = "ch361_read8692_template_pass_BYK_CB_ONT_1_FAF04998_A"
    read_size = 1740
    gene_size = 20825
    strand = "+"

    def match_line(read_string, gene_string):
        # One marker per alignment column; gaps ("-") never equal a base, so
        # they are rendered as a blank exactly like mismatches.
        return "".join(
            "|" if read_char == gene_char else " "
            for read_char, gene_char in zip(read_string, gene_string)
        )

    def make_block(read_span, gene_span, identity, gap, size,
                   read_string, gene_string):
        # Build one alignment record; key order mirrors the original fixture.
        read_start, read_stop = read_span
        gene_start, gene_stop = gene_span
        return {
            "ReadId": read_name,
            "ReadSize": read_size,
            "ReadStart": read_start,
            "ReadStop": read_stop,
            "Strand": strand,
            "GeneId": gene_id,
            "GeneSize": gene_size,
            "GeneStart": gene_start,
            "GeneStop": gene_stop,
            "AlignIdentity": identity,
            "AlignGap": gap,
            "AlignSize": size,
            "GeneString": gene_string,
            "ReadString": read_string,
            "AlignString": match_line(read_string, gene_string),
        }

    # Alignment 1
    read_span_1 = (65, 146)
    gene_span_1 = (11041, 11125)
    read_string_1 = "AAACTCTTTCACAGGCTGGACAGAAAACATCAGCTGCCCTGTCCACCATGGGCTCTG-CATCAGCAGGAAGCTTGG-G-TATGAG"
    gene_string_1 = "AAACTCTTTCACAGGCTGGACAGAAAACATCAGCTGCCCTGTCCACCATGGGCTCTGCCATCAGCAGGAAGCTTGGAGACATGAG"

    # Alignment 2
    read_span_2 = (147, 1512)
    gene_span_2 = (17938, 19379)
    read_string_2 = (
        "TCCTAAGGTTGTGGGTGGC--AGAGAATGGCGGCGATAACCTCCCT-CCTCTCCTGGAAGTGGTGACCAGACATTGCCGGATCATGCGCCTTTCT-AGCC"
        "TGT-CT-GCTTGCCAGCCACAGAGTGC--AAGCACACGCTCATCATC---GCTGCAACTCTGCATGACAGAGCCACCAGCCAGAGACGGTGAAGAGCTGT"
        "GGTTTGAAGTGA-TCAT-GCCATGTTCATGCAGATGTGGCTGCC--AGCATGAATT-GAGAACAGTCTTGTACATAAA--TAACACACTAAAGTTCGT-G"
        "GT-AAACGAACCACTGTGCCATCCTTTCAAGGGCCACAGGAAATGGACAGGGTGGCGGGGCACTCAGGCCTGAG--GCACTGAACCAGGAGCCCTGCTCC"
        "CTTTGAAGGAGTCAGCAGAGTGCTGA-GGAAGAA-TGTGAGTATTG-GTGAACAGTATTTCCTT-CTGACCTCCT-CCCTAGCTCAGGAGGAATACACTT"
        "ACCTAGGTAATAT--CATGGTCGCAGTTGTCATACAGACTGAGAGAGAGTTGTCTATTTTCTGAGA-CCT-GA----AAACAT-GTAACTGCTTCATTCT"
        "TACACTAACAACCTGGCTTTGGC-GAAGCAGATTTACTA--TTTTAAATGTGATAGTCTTTTCA------AAATAG----AAAAAGTGA-GCAAGACAGC"
        "TTTAGCCTCATTGTTGAATATTATTTCTTTGAATTCATGCTGAAACTCAAACCTTACATTGCCTTATGC--TGAACATAGTC-TTTTATATATCTAAATA"
        "AATGAAGGTTCTTTAATGGGTTATGATACAATGTAGAA-TTTATTCTGG-CCATCTCATACTCCTGCCAGGCGCAGTTGCTTACA-TTTATTTCTTTAAT"
        "ACTTTCTCCT-GTGTTGCAAACTTGGTTCTCTTAAG--GTGGCATTTT-CAATA----ACCACTCTGACCCACAGGGCTCTTGTGCTGTAGGTTAGGAGA"
        "GCTGAGAGAA-AAA------CCTTTATCTTTAGCACCTGAATGGGATGTGCCCTGCACAGTGTTGC--TACTGACAGTGGAGCAGAATACCAGTCCCATA"
        "GTCTCTTGCCGCATCTGTTTATTACGCTGGAGAATAAATGAACCAGCCTTACAGATC-GGGCGGGGATGTGG-TTTAGTTCAG-CAGAACTCTTTTGTCA"
        "TCTTTTCTCTCCAGGAGCTTCAAAGATTTCTTTCTAAGTTCTTTCCTCCTGCTTCCAGTACGCCACATTCTGCAGCCTCTCAATACC-G----ATTTGTG"
        "TTGAAATCATG--TTGGAGA-AGGG-CAACACTGTGCCTTAATGGCTCTGCTTGGGGCAAAGACTTTATCTGTTTGTACACATCTCTACACTCCTAGGGT"
        "--GGTGG--TTGTTCCATTGGTTCGTTT---GTTAAATATTCAGTATTCCTAGTTTTG"
    )
    gene_string_2 = (
        "T-CTAAGGTTGTGGGTGGCAGAGAGAATGGCAGCGATAACCTCCCTCCCTCTCCTGGAAGTGGTGACCAGACATTGCCGGATCATGCGCCTTTCTAAGCC"
        "TGTCCTAGCTTGCCAGCCACAGAGTACAGAAGCACACGCTCATCATCACAGCTGCAACTCTGCATGACAGAGCCACCAGCCAGAGACAGTGAAGAGCTG-"
        "GTTTTGAAGACAGTCATACCCATGTTCATGCAGATGTGGCTGCCTTGGCATGAATTAGAGAACAGTCTTGTACATAAATGTTTTACACTAAAGTTCGTAG"
        "ATGAAGCAGACCACTGTGCCATCCTTTCAAGGGCCACAGGAAATGGACAGGGTGGCGGGGCACTCAGGCCTGAGGAGCACTGAACCAGGAGCCCTGCTCC"
        "CTTTGAAGGTCTCAGCAGAGTGCTGAGGGAAGAAGTGTGAGTATTGAGTGAACAGTATTTCCTTCCTGACCTCCTCCCCTAGCTCAGGAGGAATACACTT"
        "ACCTAGGTAATATCGCATGGTCGCAGTTGTCATACAGACTGAGAGAGAGTTGTCTATTTTCTGAGACCCTAGAAAGGAAACATAGCAACTGCTTCATTCT"
        "TACACTAACAACCTGGCTTTGGCAGAAGCAGATTTACTATTTTTTAAATGTGATAGTCTTTTCAAAAATTAAATAGGAAAAAAAAGTGAGGCAAGACAGC"
        "TTTAGCCTCATTGTTGAATATTATTTCTTTGAATTCAAGCTGAAACTCAAGCCTTACATTGCCTTATGCTTTGTTTATAGTCTTTTTATATATCTAAATA"
        "AATGAAGGTTCTTTAATGGGTTATGATACAATGTAGAATTTTATTCTGGCCCATCTCATACTCCTGCCAGTACCAGTT-ATTACATTTTATTTCTTTAAT"
        "ACTTTCTCCTGGTGTGCAAAACTTGGTTCTCTTAAGGAGTGGCATTTTCCAATAGCTTTCCACTCTGACCCACAGGGCTCTTGTGCTGTAGGTTAGGAGA"
        "GCTGAGAGAAGAAAAAAAAGCCTTTATCTTTAGCACCTGAATGGGATGTGCCCTGCACAGTGTTGCTTTACTGACAGTGG-GCAGGGCTCTGGT-CCATA"
        "GTCTC-TGCC-TGTCTGTTTATTAC-ATGGAGAATAAATGAACCAGCCTTACAGATCAGGTAGGGGATGTGGTTTTGGTTCAGCCAGAACTCTGCTGTCA"
        "TCTTTTCT---CAGGAGCTTCAAAGATTTCTTTCTAAGTTCTTTCCTCCTGCTTCCAAT-TGCCACATTCTGCAGCCTCTCAATACCAGGGCCCTGTGTG"
        "TTGAGATCATGATTTGGAGAGAGGGCCAGCACTGTGCCTTAATGGCTCTTAGCAGGGCAAAGACTTTATCTGTTTGTACACATCTCTACACTCCTAGGGT"
        "GAGGTGGGATTTGTCCATT--TTAGTTTCTGGTTTGACA--CAGTGTGAGGTGTCTTG"
    )

    # Alignment 3
    read_span_3 = (1513, 1680)
    gene_span_3 = (19411, 19593)
    read_string_3 = "CC--AGAATACTCTACCACACAAAGCAAGGAACAACGAATAACTGGGGAACT---GAAGAGCACACCATTG--GTCTTCTTTT-CAGGGTTAAAAACAATAGCTGTGTGA-GGAACACATTACAGGAGTG--GGT--CTGATATATCTTCCTACAAATATTAGCAGGCAAC--GTCAATAAGG"
    gene_string_3 = "CCTTAGAATACTCTACCACACAAAGCAAGGAACAACGAATAACTGGGGAGCTGAAGAAGAGCACACCATTGGTGTCTTCTTTTCCAGGGTTAAAAACAATAGCTGTGTGAGGGAACACATTACAGGAGTGTAGGTCACTGATATATCTTCCTACAAATATTAGCAGGCAGCTTGTCAATAAAG"

    # Each block is keyed by its (read_start, read_stop) span on the read.
    blocks = {
        read_span_1: make_block(
            read_span_1, gene_span_1, 0.9529411764705882, 3, 85,
            read_string_1, gene_string_1,
        ),
        read_span_2: make_block(
            read_span_2, gene_span_2, 0.8786008230452675, 108, 1458,
            read_string_2, gene_string_2,
        ),
        read_span_3: make_block(
            read_span_3, gene_span_3, 0.9016393442622951, 15, 183,
            read_string_3, gene_string_3,
        ),
    }
    return {read_name: blocks}
Advertisement
Add Comment
Please sign in to add a comment.
Advertisement