Guest User

Untitled

a guest
Jul 21st, 2018
98
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.53 KB | None | 0 0
  from sklearn.datasets import fetch_20newsgroups
  import pandas as pd


  def twenty_newsgroup_to_csv(subset="train", path="20_newsgroup.csv"):
      """Export the 20 Newsgroups dataset to a CSV file.

      Fetches the requested subset with scikit-learn, attaches the
      human-readable newsgroup name to every post, stamps each row with the
      export time and writes the result to ``path``.

      The CSV contains the DataFrame index followed by the columns
      ``text``, ``target`` (integer label), ``title`` (newsgroup name) and
      ``date``.

      Args:
          subset: Value forwarded to ``fetch_20newsgroups(subset=...)``.
              Defaults to ``"train"``, the subset originally hard-coded.
          path: Destination passed to ``DataFrame.to_csv``. Defaults to
              ``"20_newsgroup.csv"`` in the current working directory.

      Returns:
          None. The result is written to ``path``.
      """
      newsgroups = fetch_20newsgroups(subset=subset)

      # Build the frame column-wise so ``target`` keeps its integer dtype.
      # (A transposed list-of-lists would coerce both columns to ``object``.)
      posts = pd.DataFrame(
          {
              "text": newsgroups.data,
              "target": newsgroups.target,
          }
      )

      # Row position i of this frame is the name of label i, so its default
      # integer index can serve directly as the join key.
      titles = pd.DataFrame({"title": newsgroups.target_names})

      out = pd.merge(posts, titles, left_on="target", right_index=True)

      # NOTE(review): whether 'now' resolves to local time or UTC appears to
      # depend on the installed pandas version -- confirm if the timestamp's
      # timezone matters to consumers of the CSV.
      out["date"] = pd.to_datetime("now")
      out.to_csv(path)


  # Script entry point: run the export with the default subset and path.
  twenty_newsgroup_to_csv()
Add Comment
Please, Sign In to add comment