Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import json
- import urllib2
- import re
# Markdown -> MediaWiki rewrite rules used by parse_doc().
# Each rule is a compiled regex plus the replacement template passed to
# its .sub().  The regexes deliberately avoid greedy ".*" inside brackets
# and parentheses so that several images/links on one line are converted
# independently instead of being swallowed into a single match.

# ![caption](scheme:...:name)  ->  [[File:name.png|frame|none|none|caption]]
# Group 1 is the caption, group 2 is whatever follows the LAST colon of
# the image target.
img_pattern = r"[[File:\2.png|frame|none|none|\1]]"
img_reg_pattern = re.compile(r"!\[([^\]\n]*)\]\([^)\n]*:([^)\n]*)\)")

# "# Heading" at the start of a line  ->  "== Heading ==".
# Anchored with ^ so a "# " in the middle of a sentence (e.g. "C# is")
# or the tail of a "## " heading is not mistaken for a title.
title_pattern = r"== \1 =="
title_reg_pattern = re.compile(r"^# (.*)", re.MULTILINE)

# "## Heading" at the start of a line  ->  "=== Heading ===".
section_pattern = r"=== \1 ==="
section_reg_pattern = re.compile(r"^## (.*)", re.MULTILINE)

# [text](some/path/page.md)  ->  [[page|text]]
# Group 1 is the link text, group 2 is the file name without directory
# and without the ".md" extension (the dot is matched literally).
link_pattern = r"[[\2|\1]]"
link_reg_pattern = re.compile(r"\[([^\]\n]*)\]\((?:[^)\n]*/)?([^)/\n]*)\.md\)")

# Converted pages, keyed by category and then by source file name.
doc_list = {"items": {}, "blocks": {}}
def parse_doc(contents):
    """Rewrite one Markdown page into wiki markup and return the result.

    The module-level (regex, template) pairs are applied one after another
    to *contents*; afterwards every "@" in the text is replaced by "-".
    """
    # Order is significant and kept as-is: images first, then "## "
    # headings before "# " headings, and ordinary links last.
    rewrites = (
        (img_reg_pattern, img_pattern),
        (section_reg_pattern, section_pattern),
        (title_reg_pattern, title_pattern),
        (link_reg_pattern, link_pattern),
    )
    converted = contents
    for regex, template in rewrites:
        converted = regex.sub(template, converted)
    # NOTE: this touches every "@" in the page, not only those inside the
    # targets produced by the rewrites above.
    return converted.replace("@", "-")
def _fetch(url):
    """Return the raw response body for *url*, always closing the connection."""
    response = urllib2.urlopen(url)
    try:
        return response.read()
    finally:
        # urllib2 responses are not context managers, so close explicitly.
        response.close()


# GitHub contents-API directory that holds the English documentation pages;
# the category sub-directory name is appended to it.
_DOC_BASE_URL = "https://api.github.com/repositories/17380796/contents/src/main/resources/assets/computronics/doc/computronics/en_US/"

# Directory listings (lists of file-entry dicts) for each category.
itemdoc_json = json.loads(_fetch(_DOC_BASE_URL + "item"))
# Previously this requested the "item" listing a second time, so the
# "blocks" section ended up holding item pages.
# NOTE(review): assumes the sibling directory is named "block" - confirm.
blockdoc_json = json.loads(_fetch(_DOC_BASE_URL + "block"))

# Download and convert every listed file, storing the result under its
# category in doc_list, keyed by the file name reported by the API.
for category, listing in (("items", itemdoc_json), ("blocks", blockdoc_json)):
    for entry in listing:
        # Entries lacking a download URL or a name are skipped.
        if entry['download_url'] and entry['name']:
            doc_content = _fetch(entry['download_url'])
            doc_list[category][entry['name']] = parse_doc(doc_content)

# Do whatever you need to do with it here, I'll just print it out
print(doc_list)
Advertisement
Add Comment
Please, Sign In to add comment