Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Scraper definition "jav" for movie content. Every URL it builds points at
  www.heyzo.com.

  Well-formedness notes for maintainers:
    * The XML declaration above must be the very first bytes of the file. Any
      text outside this document (for example web page residue picked up when
      the file was copied) has to be stripped before the file is loaded.
    * The "output" attributes and the expression bodies carry markup as plain
      text, so the characters <, > and " are written as entities. A parser
      hands the scraper engine the decoded text, i.e. the literal tags.
    * Expression elements are kept on a single line on purpose: whitespace
      inside them would become part of the regular expression.

  Buffer references ($$N) and "dest" numbers are reproduced exactly as
  authored. NOTE(review): $$1 is presumably the fetched page and $$2 the
  request URL; confirm against the scraper framework documentation.
-->
<scraper framework="1.1" date="2014-10-25" name="jav" content="movies" language="en">

  <!-- Captures a four-digit number from buffer 1 and writes a movie page URL
       built from it into buffer 2. -->
  <CreateSearchUrl SearchStringEncoding="utf-8" dest="2">
    <RegExp input="$$1"
            output="&lt;url&gt;http://www.heyzo.com/moviepages/\1/index.html&lt;/url&gt;"
            dest="2">
      <expression clear="yes" noclean="1" encode="1">([0-9]{4})</expression>
    </RegExp>
  </CreateSearchUrl>

  <!-- The nested rules fill buffer 3 with a title element and a url element;
       the outer rule wraps buffer 3 in results/entity and writes buffer 4. -->
  <GetSearchResults clearbuffers="no" dest="4">
    <RegExp input="$$3"
            output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;UTF-8&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;&lt;entity&gt;\1&lt;/entity&gt;&lt;/results&gt;"
            dest="4">
      <!-- Title: text of the HTML title element found in buffer 1. -->
      <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="3">
        <expression>&lt;title\b[^&gt;]*&gt;(.*?)&lt;/title&gt;</expression>
      </RegExp>
      <!-- URL: appends the content of buffer 2 to buffer 3; the empty
           expression captures nothing itself. -->
      <RegExp input="$$1" output="&lt;url&gt;$$2&lt;/url&gt;" dest="3+">
        <expression/>
      </RegExp>
      <expression noclean="1"/>
    </RegExp>
  </GetSearchResults>

  <!-- The nested rules accumulate detail fields in buffer 8 (dest "8+"
       appends); the outer rule wraps buffer 8 in a details element and writes
       buffer 5. -->
  <GetDetails dest="5">
    <RegExp input="$$8" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
      <!-- Title: the part of the h1 heading before the first " -" separator. -->
      <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="8">
        <expression trim="1">&lt;h1&gt;(.*?)\s*-.*?&lt;/h1&gt;</expression>
      </RegExp>
      <!-- Year: first four digits of a YYYY-MM-DD value inside a dataInfo span. -->
      <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="8+">
        <expression>&lt;span class="dataInfo"&gt;\s*?([0-9]{4})-[0-9]{2}-[0-9]{2}</expression>
      </RegExp>
      <!-- Thumbs: five gallery images, 001.jpg to 005.jpg, under the captured
           gallery path. In "\1001.jpg" the back-reference is \1 and "001.jpg"
           is literal text. -->
      <RegExp input="$$1"
              output="&lt;thumb&gt;http://www.heyzo.com\1001.jpg&lt;/thumb&gt;&lt;thumb&gt;http://www.heyzo.com\1002.jpg&lt;/thumb&gt;&lt;thumb&gt;http://www.heyzo.com\1003.jpg&lt;/thumb&gt;&lt;thumb&gt;http://www.heyzo.com\1004.jpg&lt;/thumb&gt;&lt;thumb&gt;http://www.heyzo.com\1005.jpg&lt;/thumb&gt;"
              dest="8+">
        <expression>(/contents/3000/[0-9]{4}/gallery/)</expression>
      </RegExp>
      <!-- Studio: constant value, no capture needed. -->
      <RegExp input="$$1" output="&lt;studio&gt;Heyzo&lt;/studio&gt;" dest="8+">
        <expression/>
      </RegExp>
      <!-- Genres: the nested rule copies the tag keyword list into buffer 3,
           then the outer rule emits one genre element per list item. -->
      <RegExp input="$$3" output="&lt;genre&gt;\1&lt;/genre&gt;" dest="8+">
        <RegExp input="$$1" output="\1" dest="3">
          <expression noclean="1">&lt;div class="tagkeyword"&gt;&lt;span&gt;タグキーワード&lt;/span&gt;&lt;/div&gt;(.*?&lt;/ul&gt;)</expression>
        </RegExp>
        <expression repeat="yes">&lt;li&gt;(.*?)&lt;/li&gt;</expression>
      </RegExp>
      <!-- Actor: capture 1 is the numeric id from the actor list link and is
           used in the profile image URL; capture 2 is the link text. -->
      <RegExp input="$$1"
              output="&lt;actor&gt;&lt;thumb spoof=&quot;http://www.heyzo.com&quot;&gt;http://www.heyzo.com/actorprofile/3000/0\1/profile.jpg&lt;/thumb&gt;&lt;name&gt;\2 &lt;/name&gt;&lt;/actor&gt;"
              dest="8+">
        <expression>&lt;span class="dataInfo"&gt;\s*&lt;a href="/listpages/actor_([0-9]+)_1.html\?sort=pop" title=""&gt;(.*?)&lt;/a&gt;</expression>
      </RegExp>
      <!-- Plot: text of the paragraph with class "memo", up to the next tag. -->
      <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="8+">
        <expression trim="1">&lt;p class="memo"&gt;(.*?)&lt;</expression>
      </RegExp>
      <!-- Fanart: the player thumbnail URL with the "_450" size suffix removed. -->
      <RegExp input="$$1"
              output="&lt;fanart&gt;&lt;thumb&gt;\1.jpg&lt;/thumb&gt;&lt;/fanart&gt;"
              dest="8+">
        <expression>(http://www.heyzo.com/contents/3000/[0-9]+/images/player_thumbnail)_450.jpg</expression>
      </RegExp>
      <!-- Set: link text of the series list link.
           NOTE(review): this rule writes to buffer 9, which nothing in this
           function reads, while every sibling rule appends to buffer 8. Either
           the rule is intentionally disabled or dest should be "8+"; left as
           authored until confirmed. -->
      <RegExp input="$$1" output="&lt;set&gt;\1&lt;/set&gt;" dest="9">
        <expression>&lt;a href="/listpages/series_[0-9]+_1.html"&gt;(.*?)&lt;/a&gt;</expression>
      </RegExp>
      <expression noclean="1"/>
    </RegExp>
  </GetDetails>

</scraper>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement