Advertisement
suthagar23

Untitled

Aug 19th, 2018
137
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.07 KB | None | 0 0
  1.  
  2. import json
  3. from datetime import datetime
  4. from imp import reload
  5. import tensorflow as tf
  6. import nltk
  7. from nltk.corpus import wordnet
  8. from nltk.corpus import stopwords
  9. from nltk.tokenize import sent_tokenize
  10. from nltk.tokenize import word_tokenize
  11. from nltk.tag import pos_tag
  12. from nltk.stem import WordNetLemmatizer
  13. from nltk.corpus.reader.wordnet import WordNetError
  14. # import multiprocessing as mp
  15. from threading import Thread
  16. import sys
  17. import re
  18. import os
  19.  
  20. file = "/home/suthagar/Desktop/scrapy/CS4642-DailyMirror-Tech/outputs/"
  21.  
  22. all_files = os.listdir(file)
  23. fullData = []
  24. i=0
  25. if len(all_files) > 0:
  26. for inputFileName in all_files:
  27. inputFile = open(file + inputFileName, "r+")
  28. corpusLines = inputFile.readlines()
  29. # print(corpusLines[0])
  30. jsonData = json.loads(corpusLines[0])
  31. fullData.append(jsonData)
  32. # fullData += corpusLines
  33. print(inputFileName)
  34. # i+=1
  35. # if i>2:
  36. # break
  37.  
  38. f = open(file + "output-all.json", "w")
  39. f.write(json.dumps(fullData))
  40. print("completed")
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement