Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Compare a DNA sequence against a CSV table of short-tandem-repeat (STR)
# counts and report which people are consistent with the sequence.
#
# Usage: python <script> SEQUENCE.txt DATABASE.csv
#
# The CSV is expected to have a header row whose first column is the person's
# name and whose remaining columns are STR motifs (e.g. AGAT); each following
# row holds a name and, per motif, the longest run recorded for that person.
from sys import argv, exit
import csv
import re


def longest_run(sequence, motif):
    """Return the largest number of back-to-back copies of motif in sequence.

    Runs may start at any offset and the motif may have any length.
    Returns 0 when the motif is empty or never occurs.
    """
    if not motif:
        return 0
    # A lookahead lets a run be measured from every start position, so a
    # longer run that begins inside an earlier, shorter match is not skipped.
    pattern = re.compile("(?=((?:" + re.escape(motif) + ")+))")
    step = len(motif)
    return max(
        (len(found.group(1)) // step for found in pattern.finditer(sequence)),
        default=0,
    )


def _recorded_count(row, column):
    """Return row[column] as an int, or None if it is missing or not a number."""
    try:
        return int(row[column])
    except (IndexError, ValueError):
        return None


def analyse(header, rows, sequence):
    """Measure every STR named in the CSV header against the sequence.

    header   -- the CSV header row; column 0 is the name column and is skipped
    rows     -- the remaining CSV rows (lists of strings)
    sequence -- the DNA text to scan

    Returns a list of (motif, run_length, names) tuples, one per STR column in
    header order, where names lists (in row order) the people whose recorded
    count for that motif equals the run found in the sequence.
    """
    report = []
    for column, motif in enumerate(header[1:], start=1):
        run = longest_run(sequence, motif)
        names = [
            row[0] for row in rows
            if row and _recorded_count(row, column) == run
        ]
        report.append((motif, run, names))
    return report


def main(args):
    """Run the comparison for args = [program, sequence_path, csv_path].

    Prints one line per STR that repeats more than once and one line per
    (STR, person) agreement. Returns the process exit status: 1 when an
    argument is missing, otherwise 0.
    """
    if len(args) < 3:
        print("missing command-line argument")
        return 1

    # newline="" is what the csv module asks for when handing it a file object.
    with open(args[1], "r") as file, open(args[2], "r", newline="") as csvfile:
        # Drop line breaks and stray whitespace so they cannot split a run.
        sequence = "".join(file.read().split())
        reader = csv.reader(csvfile)
        header = next(reader, [])  # an empty CSV yields no STR columns
        rows = [row for row in reader if row]

    for motif, run, names in analyse(header, rows, sequence):
        if run > 1:
            print("span " + motif + " repeats " + str(run) + " times")
        for name in names:
            print("possible match is named " + name)
    return 0


if __name__ == "__main__":
    exit(main(argv))
- #with open(argv[2],"r") as csvfile:
- # csvcontents = csv.reader(csvfile)
- # header = next(csvcontents) # look up what next is doing again
- # print("seeing what the next() function does by assigning it to header")
- # print("printing header")
- # print(header) ## assign header into a list
- # data = [row for row in csvcontents]
- # print("printing data[0]")
- # print(data[0])
- # row could be called anything... how does it know to print a row?
- # is it part of the csv reader() method?
- # print("printing 1 line at a time")
- # i = 0
- # while i < len(data):
- # print(data[i])
- # i += 1
- # print("print(data[15][2]) prints: ")
- # print(int(data[15][2]))
- # print("print(data[15][1]) prints: ")
- # print(int(data[15][1]))
- # print("print(data[15][0]) prints: ")
- # print(str(data[15][0]))
- #File "fcsvdna.py", line 70, in <module>
- # print(int(data[15][0]))
- # ValueError: invalid literal for int() with base 10: 'Neville'
- #print("header[1] prints: ")
- #print(header[1])
- #print("printing everything in the csv file: ")
- #print(data)
Advertisement
Add Comment
Please, Sign In to add comment