Advertisement
Guest User

Untitled

a guest
Jun 17th, 2019
63
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.08 KB | None | 0 0
  1. import pandas as pd
  2. import xml.etree.ElementTree as ET
  3.  
  4. xml1 = """<?xml version="1.0" encoding="ISO-8859-1"?>
  5. <pisteAuditProfilingQualif>
  6. ...
  7. <demande>
  8. ...
  9. </demande>
  10. </pisteAuditProfilingQualif>"""
  11.  
  12.  
  13. xml2 = """<?xml version="1.0" encoding="ISO-8859-1"?>
  14. ...
  15. <demande>
  16. ...
  17. <REQ_TITLE_2>Sirrah!</REQ_TITLE_2>
  18. <REQ_NAME_2>George</REQ_NAME_2>
  19. </demande>
  20. </pisteAuditProfilingQualif>"""
  21.  
  22. df = pd.DataFrame({'a':[42, 54],'xml':[xml1, xml2]})
  23.  
  24. dfx = pd.DataFrame()
  25. for x in df.xml:
  26. ex = ET.fromstring(x)
  27. ed = ex.find('demande')
  28. dfx = dfx.append(dict([(e.tag, e.text) for e in ed.iter()]), ignore_index=True)
  29.  
  30. print(df.join(dfx))
  31.  
  32. a xml ... REQ_NAME_2 REQ_TITLE_2
  33. 0 42 <?xml version="1.0" encoding="ISO-8859-1"?>n ... ... NaN NaN
  34. 1 54 <?xml version="1.0" encoding="ISO-8859-1"?>n ... ... George Sirrah!
  35.  
  36. [2 rows x 12 columns]
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement