Guest User

Untitled

a guest
Dec 12th, 2018
67
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.90 KB | None | 0 0
  1. from kafka import KafkaConsumer
  2. import re
  3.  
  4.  
  5. # connect to kafka topic
  6. kaf = KafkaConsumer('kafka.consumer.topic',
  7. auto_offset_reset='earliest', bootstrap_servers=[
  8. 'consumer-kafka.hdw.r53.deap.tv'])
  9. outputfile = 'Z:\KafkaConsum\file.csv'
  10.  
  11. outfile = open(outputfile, mode='w', newline='')
  12. i = 0
  13.  
  14. header = True
  15.  
  16. for row in kaf:
  17. a = row.value.decode("utf-8")
  18. if 'Twitter' in a:
  19. data = re.findall(r'w+=s*['"]?[w-]+', a)
  20. headers = []
  21. array = []
  22. for pair in data:
  23. m = re.search(r'(w+)=s*['"]?([w-]+)', pair)
  24. headers.append(m.group(1)) # get header
  25. array.append(m.group(2)) # get value
  26. if header == True:
  27. h = '|'.join(headers)
  28. print(h)
  29. outfile.write(h + 'n')
  30. header = False
  31. r = '|'.join(array)
  32. print(r)
  33. outfile.write(r + 'n')
  34. outfile.close()
Add Comment
Please, Sign In to add comment