Advertisement
Guest User

Untitled

a guest
Aug 19th, 2019
83
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.23 KB | None | 0 0
  1. import pandas as pd
  2. text =[list(['n[PROV', 'REPORT]nPerson', 'Name:', 'n','John', 'DearnProgram', 'Date:', '1/11/2000', '10:42', 'AMnMR']),
  3. list(['nToday', 'Name:', 'n','James', 'JaynProgram', 'Date:', '3/11/2000', '1:45', 'PMnmissing']),
  4. list(['n[NEWS', 'REPORT]nPerson', 'Name:', 'n','Jane', 'DoenProgram', 'Date:', '3/11/2000', '1:45', 'PMnMR']),
  5. list(['n[PROV', 'REPORT]nPerson', 'Name:', 'n','Amy', 'ArmynProgram', 'Date:', '10/1/2000', '11:45', 'AMnMR'])]
  6.  
  7. # Build the frame: 'Text' gets one list of string tokens per row, next to the 'ID' and 'P_ID' columns.
  8. df = pd.DataFrame({'Text' : text,
  9. 'ID': [1,2,3,4],
  10. 'P_ID': ['A','B','C','D'],
  11.  
  12. })
  13.  
  14. df
  15. ID P_ID Text
  16. 0 1 A [n[PROV, REPORT]nPerson, Name:, n, John, DearnProgram, Date:, 1/11/2000, 10:42, AMnMR]
  17. 1 2 B [nToday, Name:, n, James, JaynProgram, Date:, 3/11/2000, 1:45, PMnmissing]
  18. 2 3 C [n[NEWS, REPORT]nPerson, Name:, n, Jane, DoenProgram, Date:, 3/11/2000, 1:45, PMnMR]
  19. 3 4 D [n[PROV, REPORT]nPerson, Name:, n, Amy, ArmynProgram, Date:, 10/1/2000, 11:45, AMnMR]
  20.  
  21. df['Text'].values
  22.  
  23. array([ list(['n[PROV', 'REPORT]nPerson', 'Name:', 'n', 'John', 'DearnProgram', 'Date:', '1/11/2000', '10:42', 'AMnMR']),
  24. list(['nToday', 'Name:', 'n', 'James', 'JaynProgram', 'Date:', '3/11/2000', '1:45', 'PMnmissing']),
  25. list(['n[NEWS', 'REPORT]nPerson', 'Name:', 'n', 'Jane', 'DoenProgram', 'Date:', '3/11/2000', '1:45', 'PMnMR']),
  26. list(['n[PROV', 'REPORT]nPerson', 'Name:', 'n', 'Amy', 'ArmynProgram', 'Date:', '10/1/2000', '11:45', 'AMnMR'])], dtype=object)
  27.  
  28. df['New_Text'] = df['Text'].replace(r'n', ' n ', regex=True)
  29.  
  30. df['New_Text'].values
  31.  
  32. array([ list(['n', '[PROV', 'REPORT]', 'n' ,'Person', 'Name:', 'n', 'John', 'Dear', 'n', 'Program', 'Date:', '1/11/2000', '10:42', 'AM', 'n', 'MR']),
  33. list(['n', 'Today', 'Name:', 'n', 'James', 'Jay', 'n', 'Program', 'Date:', '3/11/2000', '1:45', 'PM','n', 'missing']),
  34. list(['n', '[NEWS', 'REPORT]','n', 'Person', 'Name:', 'n', 'Jane', 'Doe', 'n', 'Program', 'Date:', '3/11/2000', '1:45', 'PM', 'n', 'MR']),
  35. list(['n', '[PROV', 'REPORT]', 'n', 'Person', 'Name:', 'n', 'Amy', 'Army', 'n', 'Program', 'Date:', '10/1/2000', '11:45', 'AM', 'n', 'MR'])], dtype=object)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement