Guest User

Untitled

a guest
Feb 19th, 2018
71
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.42 KB | None | 0 0
  1. import pyodbc,nltk,array,re,itertools
  2. cnxn = pyodbc.connect('Driver={MySQL ODBC 5.1 Driver};Server=127.0.0.1;Port=3306;Database=information_schema;User=root; Password=1234;Option=3;')
  3. cursor = cnxn.cursor()
  4. cursor.execute("use collegedatabase ;")
  5. cursor.execute("select * from sampledata ; ")
  6. cnxn.commit()
  7. s=[]
  8. j=[]
  9. x=[]
  10. words = []
  11. w = []
  12. sfq = []
  13. POS=[]
  14. wnl = nltk.WordNetLemmatizer()
  15. p = []
  16. clean= []
  17. l =[]
  18. tupletolist= []
  19. results = []
  20. aux = []
  21. regex = re.compile("w+.")
  22. pp = []
  23. array1=[]
  24.  
  25. f = open("C:\Users\vchauhan\Desktop\tupletolist.txt","w")
  26. for entry in cursor:
  27. s.append(entry.injury_type),j.append(entry.injury_desc)
  28.  
  29. def isAcceptableChar(character):
  30. return character not in "~!@#$%^&*()_+`1234567890-={}|:<>?[];',/."
  31.  
  32.  
  33. from nltk.tokenize import word_tokenize
  34. from nltk.corpus import stopwords
  35. english_stops = set(stopwords.words('english'))
  36. for i in range(0,200):
  37. j.append(filter(isAcceptableChar, j[i]))
  38. w.append([word for word in word_tokenize(j[i].lower()) if word not in english_stops])
  39. for j in range (0,len(w[i])):
  40. results = regex.search(w[i][j])
  41. if results:
  42. str.rstrip(w[i][j],'.')
  43. for a in range(0 , 200):
  44. sfq.append(" ".join(w[a]))
  45.  
  46. from nltk.stem import LancasterStemmer
  47. stemmer = LancasterStemmer()
  48.  
  49. for i in range (0,200):
  50. pp.append(len(w[i]))
  51.  
  52. for a in range (0,200):
  53. p.append(word_tokenize(sfq[a]))
  54. POS.append([wnl.lemmatize(t) for t in p[a]])
  55. x.append(nltk.pos_tag(POS[a]))
  56. clean.append((re.sub('()[]{}'':/-[(",)]','',str(x[a]))))
  57. cursor.execute("update sampledata SET POS = ? where SRNO = ?", (re.sub('()[]{}'':/-[(",)]','',str(x[a]))), a)
  58.  
  59. for i in range (0,len(array1)):
  60. results.append(regex.search(array1[i][0]))
  61. if results[i] is not None:
  62. aux.append(i)
  63.  
  64. f.write(str(w))
  65.  
  66. Traceback (most recent call last):
  67. File "C:UsersvchauhanDesktopregexsolution_try.py", line 37, in <module>
  68. j.append(filter(isAcceptableChar, j[i]))
  69. AttributeError: 'int' object has no attribute 'append'
  70.  
  71. j.append(filter(isAcceptableChar, j[i])) # j is not a list here,it is an int.
  72. w.append([word for word in word_tokenize(j[i].lower()) if word not in english_stops])
  73. for j in range (0,len(w[i])): # here j is an int
  74.  
  75. for j in range (0,len(w[i])):
  76.  
  77. for i in range(0,200):
  78. j.append(filter(isAcceptableChar, j[i]))
  79. w.append([word for word in word_tokenize(j[i].lower()) if word not in english_stops])
  80. for j in range (0,len(w[i])):
Add Comment
Please, Sign In to add comment