Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
"""Count capitalized words in the titles of top /r/soccer submissions.

When run as a script, fetches up to 500 top submissions from the 'soccer'
subreddit via PRAW, tallies every whitespace-separated title word whose first
character is uppercase, and builds a pandas DataFrame of the tallies sorted
by descending count.
"""
from collections import Counter

import pandas as pd
#import matplotlib.pyplot as plt
#import numpy as np
#import matplotlib.font_manager as fm


def count_capitalized_words(titles):
    """Tally words that start with an uppercase character.

    Each title is split on whitespace; a word is counted when its first
    character satisfies ``str.isupper()``. Words are counted verbatim, so
    attached punctuation makes distinct keys (e.g. ``"Madrid"`` and
    ``"Madrid,"``), and words that start with punctuation are skipped.

    Args:
        titles: Iterable of title strings.

    Returns:
        A ``collections.Counter`` mapping each counted word to its number of
        occurrences, keyed in order of first appearance.
    """
    # str.split() with no arguments never yields empty strings, so indexing
    # word[0] is safe.
    return Counter(
        word
        for title in titles
        for word in title.split()
        if word[0].isupper()
    )


if __name__ == "__main__":
    # Imported here rather than at the top so that count_capitalized_words
    # stays importable on machines without PRAW installed.
    import praw

    # NOTE(review): the credential fields are empty placeholders in this
    # paste; they presumably must be filled in before the request succeeds.
    reddit = praw.Reddit(client_id='',
                         client_secret='',
                         password='',
                         user_agent='footballer by /u/kunalc',
                         username='kunalc')

    # Materialize the listing so it can be measured and iterated.
    submissions = list(reddit.subreddit('soccer').top(limit=500))
    print(len(submissions))

    dicta = count_capitalized_words(
        submission.title for submission in submissions
    )

    # Parallel lists of words and their tallies, in first-seen order.
    names = list(dicta)
    counts = list(dicta.values())

    df = pd.DataFrame({'words': names, 'counts': counts})
    # Most frequent words first. Nothing in view consumes df2; it is left in
    # module scope, presumably for interactive inspection.
    df2 = df.sort_values('counts', ascending=False)
Add Comment
Please, Sign In to add comment