Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import requests
def petscan(pos, neg, ns):
    """Run a PetScan category query against English Wiktionary.

    Args:
        pos: Iterable of category-name strings the pages must be in. The
            names are joined with CRLF into the ``categories`` parameter.
            Callers in this file append ``|7`` to a name (presumably a
            per-category depth suffix understood by PetScan -- confirm
            against the PetScan manual).
        neg: Iterable of category-name strings to exclude, joined with CRLF
            into the ``negcats`` parameter. May be empty.
        ns: Integer namespace number; sent as the ``ns[<n>]=1`` parameter.

    Returns:
        The value found at ``["*"][0]["a"]["*"]`` in the decoded JSON
        response. Callers in this file iterate over it and read a
        ``"title"`` key from each element.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.Timeout: If connecting or reading exceeds the timeout.
    """
    params = {
        "language": "en",
        "project": "wiktionary",
        "categories": "\r\n".join(pos),
        "negcats": "\r\n".join(neg),
        "ns[%d]" % ns: 1,
        "format": "json",
        "doit": "Do it!",
    }
    # (connect, read) timeouts in seconds. Without a timeout requests waits
    # indefinitely; the read limit is generous because deep category scans
    # can be slow.
    response = requests.get(
        "https://petscan.wmflabs.org/",
        params=params,
        timeout=(10, 600),
    )
    # Fail with a clear HTTP error instead of an obscure JSON/KeyError when
    # the service returns an error page.
    response.raise_for_status()
    return response.json()["*"][0]["a"]["*"]
def get_langs():
    """Return the language prefixes of the per-language derivation categories.

    Queries namespace 14 for pages in "Terms derived from other languages
    by language" and keeps the part of each returned title that precedes
    the first "_terms_" (the whole title when that marker is absent).
    """
    root_category = "Terms derived from other languages by language"
    langs = []
    for page in petscan([root_category], [], 14):
        # Everything before the first "_terms_" is the language prefix.
        prefix, _, _ = page["title"].partition("_terms_")
        langs.append(prefix)
    return langs
def incorrect_derivations(lang):
    """Return titles in *lang*'s derivation category that are in neither
    its lemma nor its non-lemma category.

    Args:
        lang: Language name as it appears at the start of the category
            names (e.g. the values produced by ``get_langs``).

    Returns:
        A list of the ``"title"`` values from the namespace-0 results.
    """
    required = ["%s terms derived from other languages|7" % lang]
    excluded = [
        "%s lemmas" % lang,
        "%s non-lemma forms" % lang,
    ]
    titles = []
    for page in petscan(required, excluded, 0):
        titles.append(page["title"])
    return titles
# Print a wikitext report: one "==Language==" heading per language that has
# at least one flagged entry, followed by a bulleted list of page links.
for lang in get_langs():
    results = incorrect_derivations(lang)
    if not results:
        # Nothing flagged for this language; emit no heading.
        continue
    print("==%s==" % lang)
    for title in results:
        print("* [[%s]]" % title)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement