Advertisement
Guest User

Untitled

a guest
Nov 28th, 2012
2,395
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
XML 2.53 KB | None | 0 0
  1. <?xml version="1.0" encoding="utf-8"?><scraper framework="11" date="2012-11-28" name="Data18" content="movies" language="en">
  2.     <CreateSearchUrl dest="3">
             <!-- Builds the search request. The RegExp below reads $$1 and writes to
                  dest 3 a <url> element pointing at http://www.data18.com/search/
                  with query parameters k=\1 and t=2.
                  NOTE(review): presumably $$1 is the search term supplied by the host
                  application and the empty <expression /> captures it whole as \1;
                  confirm against the scraper framework documentation. -->
  3.         <RegExp input="$$1" output="&lt;url&gt;http://www.data18.com/search/?k=\1&amp;t=2&lt;/url&gt;" dest="3">
  4.             <expression />
  5.         </RegExp>
  6.     </CreateSearchUrl>
  7.     <GetSearchResults dest="6">
             <!-- Turns the search page into a <results> document delivered via dest 6.
                  The nested RegExp (dest 4) emits one <entity> per match: <url> is the
                  link target (\1, an http://www.data18.com/<segment>/<digits>/ address)
                  and <title> is the title attribute of the img inside that link (\2).
                  The outer RegExp then reads $$4 and wraps it in an XML declaration
                  plus <results>.
                  NOTE(review): presumably the nested RegExp is evaluated before its
                  parent and repeat="yes" concatenates every match into buffer 4;
                  confirm against the scraper framework documentation. -->
  8.         <RegExp input="$$4" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;utf-8&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="6">
  9.             <RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\2&lt;/title&gt;&lt;url&gt;\1&lt;/url&gt;&lt;/entity&gt;" dest="4">
  10.                 <expression repeat="yes">&lt;a href="(http://www.data18.com/[^/]*/\d+/)"&gt;&lt;img src=[^ ]* class=[^ ]* title="([^"]*)"</expression>
  11.             </RegExp>
  12.             <expression noclean="1" />
  13.         </RegExp>
  14.     </GetSearchResults>
  15.     <GetDetails dest="7">
              <!-- Assembles the <details> document delivered via dest 7. Every nested
                   RegExp reads $$1 and targets dest "5+", contributing one fragment:
                   title, plot, actors, poster thumb, runtime, director, studio, year.
                   The outer RegExp reads $$5 and wraps it in an XML declaration plus
                   <details>.
                   NOTE(review): presumably $$1 is the fetched detail page, "5+" means
                   append to buffer 5, and noclean="1" leaves capture 1 unprocessed;
                   confirm against the scraper framework documentation. -->
  16.         <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;utf-8&quot; standalone=&quot;yes&quot;?&gt;&lt;details&gt;\1&lt;/details&gt;" dest="7">
                  <!-- Title: text content of the h1 element with class "h1big". -->
  17.             <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="5+">
  18.                 <expression noclean="1">&lt;h1 class="h1big"&gt;([^&lt;]*)&lt;/h1&gt;</expression>
  19.             </RegExp>
                  <!-- Plot: everything after the bold "Description:" label up to the
                       first tab, carriage return or newline. -->
  20.             <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="5+">
  21.                 <expression>&lt;b&gt;Description:&lt;/b&gt;([^\t\r\n]*)</expression>
  22.             </RegExp>
                  <!-- Actors: one <actor> per img whose src starts with
                       http://www.data18.com/img/stars; \1 is that image URL (thumb)
                       and \2 is the alt text that follows it (name). -->
  23.             <RegExp input="$$1" output="&lt;actor&gt;&lt;name&gt;\2&lt;/name&gt;&lt;thumb&gt;\1&lt;/thumb&gt;&lt;/actor&gt;" dest="5+">
  24.                 <expression repeat="yes" noclean="1">&lt;img src="(http://www.data18.com/img/stars[^"]*).*?alt="([^"]*)</expression>
  25.             </RegExp>
                  <!-- Poster: src of the img whose alt text is "Enlarge Cover". -->
  26.             <RegExp input="$$1" output="&lt;thumb aspect=&quot;poster&quot;&gt;\1&lt;/thumb&gt;" dest="5+">
  27.                 <expression noclean="1">&lt;img src="([^"]*)" alt="Enlarge Cover"</expression>
  28.             </RegExp>
                  <!-- Runtime: first run of digits after the "Length:" label.
                       NOTE(review): the unit of this number is not visible here. -->
  29.             <RegExp input="$$1" output="&lt;runtime&gt;\1&lt;/runtime&gt;" dest="5+">
  30.                 <expression noclean="1">Length:&lt;/b&gt;[^\d]*(\d+)</expression>
  31.             </RegExp>
                  <!-- Director and studio: text following the first tag that comes
                       after the respective bold label, up to the next "<". -->
  32.             <RegExp input="$$1" output="&lt;director&gt;\1&lt;/director&gt;" dest="5+">
  33.                 <expression noclean="1">Director:&lt;/b&gt;[^&gt;]*&gt;([^&lt;]*)</expression>
  34.             </RegExp>
  35.             <RegExp input="$$1" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="5+">
  36.                 <expression noclean="1">Studio:&lt;/b&gt;[^&gt;]*&gt;([^&lt;]*)</expression>
  37.             </RegExp>
                  <!-- Year: first four consecutive digits after the "Release date:"
                       label. -->
  38.             <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="5+">
  39.                 <expression>Release date:&lt;/b&gt;[^\d]*(\d{4})</expression>
  40.             </RegExp>
  41.             <expression noclean="1" />
  42.         </RegExp>
  43.     </GetDetails>
  44. </scraper>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement