Guest User

Untitled

a guest
May 23rd, 2018
99
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 3.00 KB | None | 0 0
  <!--
    Re-defines htmlBody with every occurrence of the numeric character
    reference for decimal 27 (the ESC control character) removed.
    NOTE(review): presumably this is stripped because ESC is not a legal
    XML 1.0 character and would upset the later XPath steps; confirm.

    The pattern is bounded on the right:
      * (?!\d) keeps it from eating the front of longer references such as
        &#270; or &#278;, which an unterminated "&#27" would corrupt;
      * ;? also consumes the terminating semicolon when present, so no
        stray ";" is left behind in the text.
    The case-insensitive, multiline and dotall flags were dropped because the
    pattern has no letters, no anchors and no dot, so they had no effect.
  -->
  <var-def name="htmlBody">
    <regexp replace="true">
      <regexp-pattern><![CDATA[&#27(?!\d);?]]></regexp-pattern>
      <regexp-source>
        <var name="htmlBody"/>
      </regexp-source>
      <regexp-result>
        <template></template>
      </regexp-result>
    </regexp>
  </var-def>
  12.  
  <!--
    Defines articleContent as the results of three XPath queries evaluated
    against htmlBody, in this order:
      1. figures whose itemprop is exactly 'associatedMedia image',
      2. figures whose itemprop is exactly 'associatedMedia video'
         (both searched below the 'gs-container' div of the article),
      3. the div whose itemprop is 'articleBody'.
  -->
  <var-def name="articleContent">
    <xpath
        expression="//article/div/div[@class='gs-container']//figure[@itemprop='associatedMedia image']">
      <var name="htmlBody"/>
    </xpath>
    <xpath
        expression="//article/div/div[@class='gs-container']//figure[@itemprop='associatedMedia video']">
      <var name="htmlBody"/>
    </xpath>
    <xpath
        expression="//article//div[@itemprop='articleBody']">
      <var name="htmlBody"/>
    </xpath>
  </var-def>
  24.  
  <!--
    Re-defines articleContent with each <picture> element collapsed into a
    plain <img> whose src is taken from the first <source media=...> that
    carries a srcset attribute.

    Pattern notes:
      * (?:(?!</picture>)[\s\S])* stands in for ".*": it also matches line
        breaks, so pictures formatted over several lines are rewritten, and
        it can never run past the closing tag, so one match cannot swallow
        two separate pictures and the markup between them.
      * Group 1 captures only the first URL of the srcset value. A srcset
        may list several candidates with width or density descriptors
        ("a.jpg 320w, b.jpg 640w"); copying the whole list into src would
        produce an unusable address. Commas inside the URL itself are
        kept; only a separator comma directly after the URL is dropped.
    A picture without any <source media=...> element is left untouched.
  -->
  <var-def name="articleContent">
    <regexp replace="true">
      <regexp-pattern><![CDATA[<picture>(?:(?!</picture>)[\s\S])*?<source media=(?:(?!</picture>)[\s\S])*?srcset="\s*([^"\s]+?),?(?:\s[^"]*)?"(?:(?!</picture>)[\s\S])*</picture>]]></regexp-pattern>
      <regexp-source>
        <var name="articleContent"/>
      </regexp-source>
      <regexp-result>
        <template><![CDATA[<img src="${_1}"/>]]></template>
      </regexp-result>
    </regexp>
  </var-def>
  36.  
  <!--
    Re-defines articleContent with protocol-relative image addresses made
    absolute: every literal  img src="//  becomes  img src="http://
  -->
  <var-def name="articleContent">
    <regexp replace="true">
      <regexp-pattern><![CDATA[img src="//]]></regexp-pattern>
      <regexp-source>
        <var name="articleContent"/>
      </regexp-source>
      <regexp-result>
        <template><![CDATA[img src="http://]]></template>
      </regexp-result>
    </regexp>
  </var-def>
  48.  
  <!--
    Re-defines articleContent with every occurrence of the text "amp-img"
    replaced by "img". The replacement is purely textual, so it applies to
    opening tags, closing tags and any other place the text appears.
  -->
  <var-def name="articleContent">
    <regexp replace="true">
      <regexp-pattern><![CDATA[amp-img]]></regexp-pattern>
      <regexp-source>
        <var name="articleContent"/>
      </regexp-source>
      <regexp-result>
        <template><![CDATA[img]]></template>
      </regexp-result>
    </regexp>
  </var-def>
  60.  
  <!--
    Re-defines articleContent with the numeric character reference for the
    apostrophe (decimal 39, written with its terminating semicolon) replaced
    by a literal apostrophe character.
  -->
  <var-def name="articleContent">
    <regexp replace="true">
      <regexp-pattern><![CDATA[&#39;]]></regexp-pattern>
      <regexp-source>
        <var name="articleContent"/>
      </regexp-source>
      <regexp-result>
        <template><![CDATA[']]></template>
      </regexp-result>
    </regexp>
  </var-def>
  72.  
  <!--
    Re-defines articleContent with every h1, h2 and h3 heading demoted to
    h4. The attributes of the opening tag and the heading content are
    carried over unchanged.

    Capture groups:
      _1  heading level digit; only used by the back-reference \1 so the
          closing tag must be of the same level as the opening tag
      _2  attribute text of the opening tag (may be empty)
      _3  heading content

    Pattern notes:
      * \b after the digit stops tags such as <h12> from matching.
      * [^>]* and [\s\S]*? both match line breaks, so headings whose tag or
        content is spread over several lines are converted too; a plain
        "." would skip them because it excludes line terminators.
  -->
  <var-def name="articleContent">
    <regexp replace="true">
      <regexp-pattern><![CDATA[<h([123])\b([^>]*)>([\s\S]*?)</h\1>]]></regexp-pattern>
      <regexp-source>
        <var name="articleContent"/>
      </regexp-source>
      <regexp-result>
        <template><![CDATA[<h4${_2}>${_3}</h4>]]></template>
      </regexp-result>
    </regexp>
  </var-def>
  84.  
  <!--
    Defines contentBody as the value of articleContent enclosed between a
    literal <root> opening tag and a literal </root> closing tag.
    NOTE(review): presumably the wrapper gives the extracted fragments a
    single parent element before XPath is run on contentBody; confirm.
  -->
  <var-def name="contentBody">
    <![CDATA[<root>]]>
    <var name="articleContent"/>
    <![CDATA[</root>]]>
  </var-def>
  90.  
  <!--
    Defines imageUrl from two XPath queries evaluated against contentBody,
    in this order: the src attribute of every img element, then the poster
    attribute of every video element.
  -->
  <var-def name="imageUrl">
    <xpath expression="//img/@src">
      <var name="contentBody"/>
    </xpath>
    <xpath expression="//video/@poster">
      <var name="contentBody"/>
    </xpath>
  </var-def>
Add Comment
Please, Sign In to add comment