Guest User

Untitled

a guest
Jan 17th, 2018
98
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.78 KB | None | 0 0
  1. def ocr_space_file(filename, overlay=True, api_key='myAPI', language='eng'):
  2.  
  3. payload = {'isOverlayRequired': overlay,
  4. 'apikey': api_key,
  5. 'language': language,
  6. }
  7. with open(filename, 'rb') as f:
  8. r = requests.post('https://api.ocr.space/parse/image',
  9. files={filename: f},
  10. data=payload,
  11. )
  12.  
  13. Info = r.content.decode()
  14. obj = json.loads(Info)
  15.  
  16. f = open('Data.txt', 'w')
  17. for i in obj['ParsedResults']:
  18. for j in range(0,len(i["TextOverlay"]['Lines'])):
  19. allInfo = i["TextOverlay"]['Lines'][j]['Words']
  20. for k in allInfo:
  21. text = k['WordText']
  22. coords = [k['Left'],k['Top'],k['Width'],k['Height']]
  23. f1 = ','.join(map(str, coords))
  24. f.write(text+ " "+ f1 + 'n' )
  25. f.close()
  26. return r.content.decode()
  27.  
  28. test_file = ocr_space_file(filename='1my.png', language='eng')
  29.  
  30. imagePaths = [f for f in glob.glob('cropped_images/*.png')]
  31. save_path = 'Labeled_images/'
  32.  
  33. def ocr_all_screenshots():
  34.  
  35. for pic in imagePaths:
  36.  
  37. #src_fname, ext = os.path.splitext(pic) # split filename and extension
  38. # construct output filename, basename to remove input directory
  39. #save_fname = os.path.join(save_path, os.path.basename(src_fname) + '_labeled.png')
  40. os.chdir(save_path)
  41. ocr_space_file(pic)
  42.  
  43. ocr_all_screenshots()
  44.  
  45. def ocr_space_file(filename, overlay=True, api_key='мой API', language='eng'):
  46. ...обработка json
  47. for i in obj['ParsedResults']:
  48. f = open('Data' +str(i) +'.txt', 'w')
  49. ...
  50. f1 = ','.join(map(str, coords))
  51. f.write(f1 + 'n' )
  52. f.close()
  53. return r.content.decode()
Add Comment
Please, Sign In to add comment