Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- <?xml version="1.0" encoding="utf-8"?><scraper framework="1,1" date="2011-03-26" name="imdb_olympia_v1.5" content="movies" thumb="imdb.png" language="en">
- <GetSettings dest="3">
- <!--Builds the scraper's settings definition: the four nested expressions assemble setting entries in buffer 5, and the enclosing expression wraps buffer 5 in a settings element written to buffer 3-->
- <RegExp input="$$5" output="<settings>\1</settings>" dest="3">
- <!--akatitles: country whose AKA title should be used; read back as $INFO[akatitles] in ParseIMDBAKATitles. This entry uses dest="5" while the following ones use dest="5+" (presumably overwrite vs. append; confirm against the scraper framework docs)-->
- <RegExp input="$$1" output="<setting label="Title Language From" type="labelenum" values="Keep Original|USA / International|Argentina|Austria|Belgium|Brazil|Bulgaria|Canada|China|Colombia|Chile|Croatia|Czech Republic|Denmark|Finland|France|Germany|Greece|Hong Kong|Hungary|Iceland|India|Israel|Italy|Japan|Mexico|Netherlands|Norway|Pakistan|Poland|Portugal|Romania|Russia|Serbia|Singapore|Slovenia|Spain|Sweden|Switzerland|Thailand|Turkey|Uruguay|Venezuela" id="akatitles" default="Keep Original"></setting>" dest="5">
- <expression />
- </RegExp>
- <!--TrailerQ: trailer quality; GetDetails tests $INFO[TrailerQ] for 480p, 720p and 1080p, so "none" selects no trailer function-->
- <RegExp input="$$1" output="<setting label="HD-Trailers.net Quality" type="labelenum" values="none|480p|720p|1080p" id="TrailerQ" default="480p"></setting>" dest="5+">
- <expression />
- </RegExp>
- <!--tmdbplot: boolean used as conditional="tmdbplot" on the GetTMDBPlot url in GetDetails-->
- <RegExp input="$$1" output="<setting label="Get Plot from TMDb" type="bool" id="tmdbplot" default="false"></setting>" dest="5+">
- <expression />
- </RegExp>
- <!--plotlanguage: language code inserted as $INFO[plotlanguage] into the Movie.getInfo url built by GetTMDBPlot-->
- <RegExp input="$$1" output="<setting label="TMDb Plot Language" type="labelenum" values="da|fi|nl|de|it|es|fr|pl|hu|el|tr|ru|he|ja|pt|zh|cs|sl|hr|ko|en|sv|no" id="plotlanguage" default="en"></setting>" dest="5+">
- <expression />
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </GetSettings>
- <NfoUrl dest="3">
- <!--Recognises an IMDb link inside buffer 1 and emits the akas.imdb.com title url plus the tt-prefixed id into buffer 3-->
- <!--Link form "imdb" + 3 or 4 arbitrary characters + "/Title?" followed by digits-->
- <RegExp input="$$1" output="<url>http://akas.imdb.com/title/tt\1/</url><id>tt\1</id>" dest="3">
- <expression clear="yes" noclean="1">imdb....?/Title\?([0-9]*)</expression>
- </RegExp>
- <!--Link form "imdb" + 3 or 4 arbitrary characters + "/title/tt" followed by digits; written with dest="3+"-->
- <RegExp input="$$1" output="<url>http://akas.imdb.com/title/tt\1/</url><id>tt\1</id>" dest="3+">
- <expression noclean="1">imdb....?/title/tt([0-9]*)</expression>
- </RegExp>
- </NfoUrl>
- <CreateSearchUrl dest="3" SearchStringEncoding="iso-8859-1">
- <!--Builds the akas.imdb.com title search url (s=tt) from buffer 1, followed by the optional suffix held in buffer 4-->
- <RegExp input="$$1" output="<url>http://akas.imdb.com/find?s=tt;q=\1$$4</url>" dest="3">
- <!--When buffer 2 is non-empty it is appended to the query as "%20(value)"; buffer 2 is presumably the release year supplied by the application, TODO confirm-->
- <RegExp input="$$2" output="%20(\1)" dest="4">
- <expression clear="yes">(.+)</expression>
- </RegExp>
- <expression noclean="1"/>
- </RegExp>
- </CreateSearchUrl>
- <GetSearchResults dest="8">
- <!--Turns the fetched search page (buffer 1) into a results document: entity entries are collected in buffer 5 and wrapped in a results element written to buffer 8-->
- <RegExp input="$$5" output="<?xml version="1.0" encoding="iso-8859-1" standalone="yes"?><results>\1</results>" dest="8">
- <!--Buffer 7: title id taken from a /title/ID/(combined|faq|releaseinfo|vote) link; presumably only present when the search landed directly on a title page, TODO confirm-->
- <RegExp input="$$1" output="\1" dest="7">
- <expression clear="yes">/title/([t0-9]*)/(combined|faq|releaseinfo|vote)</expression>
- </RegExp>
- <!--Single entity built from the page's meta title (title and 4-digit year) combined with the id in buffer 7-->
- <RegExp input="$$1" output="<entity><title>\2</title><year>\3</year><url cache="$$7-main.html">http://akas.imdb.com/title/$$7/</url><id>$$7</id></entity>" dest="5">
- <expression clear="yes" noclean="2"><meta name="title" content="(IMDb - )*(?:&#x22;)?([^"]*?)(?:&#x22;)? \([^\(]*?([0-9]{4})\)</expression>
- </RegExp>
- <!--Buffer 4: the page from the first title link onwards, used as input for the repeated match below-->
- <RegExp input="$$1" output="\1" dest="4">
- <expression noclean="1">(><a href="/title.*)</expression>
- </RegExp>
- <!--One entity per title link followed by a parenthesised 4-digit year; each uses the link's id for url, cache name and id-->
- <RegExp input="$$4" output="<entity><title>\2</title><year>\3</year><url cache="\1-main.html">http://akas.imdb.com/title/\1/</url><id>\1</id></entity>" dest="5+">
- <expression repeat="yes" noclean="1,2">><a href="/title/([t0-9]*)/[^>]*>(?:&#x22;)?([^<]*?)(?:&#x22;)?</a> *\([^\(]*?([0-9]{4})</expression>
- </RegExp>
- <expression clear="yes" noclean="1"/>
- </RegExp>
- </GetSearchResults>
- <GetDetails dest="3">
- <!--Parses the IMDb main title page (buffer 1) for the title id in buffer 2. Detail fields and follow-up url entries are collected in buffer 5 and wrapped in a details element written to buffer 3-->
- <RegExp input="$$5" output="<details>\1</details>" dest="3">
- <!--id: buffer 2 passed through an empty expression-->
- <RegExp input="$$2" output="<id>\1</id>" dest="5">
- <expression/>
- </RegExp>
- <!--Buffer 18: title part of the page's meta title, without the optional "IMDb - " prefix, surrounding quote entities and the trailing "(... year)" part-->
- <RegExp input="$$1" output="\2" dest="18">
- <expression><meta name="title" content="(IMDb - )*(?:&#x22;)?([^"]*?)(?:&#x22;)? \([^\(]*?([0-9]{4})\)</expression>
- </RegExp>
- <!--sorttitle and originaltitle both come from buffer 18-->
- <RegExp input="$$18" output="<sorttitle>\1</sorttitle><originaltitle>\1</originaltitle>" dest="5+">
- <expression/>
- </RegExp>
- <!--Buffer 17: every word of the title followed by "-"; buffer 19 receives a copy and is used as the hd-trailers.net path segment below. NOTE(review): as written the value ends with a trailing "-"; confirm the trailer site accepts that-->
- <RegExp input="$$17" output="\1" dest="19">
- <RegExp input="$$18" output="\1-" dest="17">
- <expression repeat="yes" trim="1">([\w]+)</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- <!--Chained request: combined page handled by ParseIMDBAKATitles-->
- <RegExp input="$$2" output="<url cache="$$2-combined.html" function="ParseIMDBAKATitles">http://akas.imdb.com/title/$$2/combined</url>" dest="5+">
- <expression noclean="1" />
- </RegExp>
- <!--year: 4-digit number inside the parentheses of the meta title-->
- <RegExp input="$$1" output="<year>\2</year>" dest="5+">
- <expression><meta name="title" content="([^"]*?) \([^\(]*?([0-9]{4})\)</expression>
- </RegExp>
- <RegExp input="$$1" output="<top250>\1</top250>" dest="5+">
- <expression>Top 250 #([0-9]*)</</expression>
- </RegExp>
- <RegExp input="$$1" output="<mpaa>\1</mpaa>" dest="5+">
- <expression>MPAA</a>\)</h4>\n?<span itemprop="contentRating">([^<]*)</expression>
- </RegExp>
- <RegExp input="$$1" output="<tagline>\1</tagline>" dest="5+">
- <expression><h4[^>]*?>Taglines:</h4>\n?([^<]*)</expression>
- </RegExp>
- <!--runtime: first run of digits after the Runtime heading-->
- <RegExp input="$$1" output="<runtime>\1</runtime>" dest="5+">
- <expression trim="1"><h4[^>]*?>Runtime:</h4>[^0-9]*([0-9]+)</expression>
- </RegExp>
- <!--rating from itemprop="ratingValue"; votes from the digits-and-commas number at the start of a following title attribute-->
- <RegExp input="$$1" output="<rating>\1</rating><votes>\2</votes>" dest="5+">
- <expression>itemprop="ratingValue">([0-9.]+).*?>.*?title="([0-9,]+)\s</expression>
- </RegExp>
- <!--genre: taken from the link target after /genre/, one entry per match-->
- <RegExp input="$$1" output="<genre>\1</genre>" dest="5+">
- <expression repeat="yes"><a href="/genre/([^"]+)</expression>
- </RegExp>
- <!--country: link text of every /country/ link-->
- <RegExp input="$$1" output="<country>\1</country>" dest="5+">
- <expression repeat="yes"><a href="/country/[^>]+>([^<]+)</expression>
- </RegExp>
- <!--studio: link text of a /company/ link; no repeat attribute, so presumably only the first match is used-->
- <RegExp input="$$1" output="<studio>\1</studio>" dest="5+">
- <expression>"/company/[^>]+>([^<]+)</a></expression>
- </RegExp>
- <RegExp input="$$1" output="<plot>\1</plot>" dest="5+">
- <expression trim="1"><h2>Storyline</h2>\n+<p>([^<]+)</expression>
- </RegExp>
- <RegExp input="$$1" output="<outline>\1</outline>" dest="5+">
- <expression trim="1">itemprop="description">([^<]+)<</expression>
- </RegExp>
- <RegExp input="$$1" output="<premiered>\1</premiered>" dest="5+">
- <expression trim="1">itemprop="datePublished" datetime=".{10,}?">([^<]+)<</expression>
- </RegExp>
- <!--Chained requests. The combined page and the main page each use one cache name, shared by the functions that parse the same document-->
- <RegExp input="$$2" output="<url cache="$$2-combined.html" function="ParseIMDBCertification">http://akas.imdb.com/title/$$2/combined</url>" dest="5+">
- <expression noclean="1" />
- </RegExp>
- <RegExp input="$$2" output="<url cache="$$2-main.html" function="ParseIMDBCast">http://akas.imdb.com/title/$$2/</url>" dest="5+">
- <expression noclean="1" />
- </RegExp>
- <RegExp input="$$2" output="<url cache="$$2-main.html" function="ParseIMDBDirectors">http://akas.imdb.com/title/$$2/</url>" dest="5+">
- <expression noclean="1" />
- </RegExp>
- <RegExp input="$$2" output="<url cache="$$2-main.html" function="ParseIMDBWriters">http://akas.imdb.com/title/$$2/</url>" dest="5+">
- <expression noclean="1" />
- </RegExp>
- <!--TMDb artwork: fanart and thumbs both parse the Movie.getImages document and share the cache name tmdb-images-ID.xml, so both entries must request the same url-->
- <RegExp input="$$2" output="<url function="ParseTMDBFanart" cache="tmdb-images-$$2.xml">http://api.themoviedb.org/2.1/Movie.getImages/en/xml/57983e31fb435df4df77afb854740ea9/$$2</url>" dest="5+">
- <expression/>
- </RegExp>
- <!--Previously requested Movie.imdbLookup under the same cache name as the getImages request above; ParseTMDBThumbs matches poster elements, which is the getImages layout (per TMDb API 2.1 docs, verify), so the url now matches what is cached and parsed-->
- <RegExp input="$$2" output="<url function="ParseTMDBThumbs" cache="tmdb-images-$$2.xml">http://api.themoviedb.org/2.1/Movie.getImages/en/xml/57983e31fb435df4df77afb854740ea9/$$2</url>" dest="5+">
- <expression/>
- </RegExp>
- <!--Only emitted when the tmdbplot setting is enabled: imdbLookup result is handled by GetTMDBPlot, which reads the id element from it-->
- <RegExp conditional="tmdbplot" input="$$2" output="<url function="GetTMDBPlot">http://api.themoviedb.org/2.1/Movie.imdbLookup/en/xml/57983e31fb435df4df77afb854740ea9/$$2</url>" dest="5+">
- <expression/>
- </RegExp>
- <!--Trailer lookup: the expression is matched against the TrailerQ setting value, so at most one of the three entries below is emitted. Note that the pattern 480p is not contained in 1080p or 720p-->
- <RegExp input="$INFO[TrailerQ]" output="<url function="Get480pTrailer">http://www.hd-trailers.net/movie/$$19</url>" dest="5+">
- <expression>480p</expression>
- </RegExp>
- <RegExp input="$INFO[TrailerQ]" output="<url function="Get720pTrailer">http://www.hd-trailers.net/movie/$$19</url>" dest="5+">
- <expression>720p</expression>
- </RegExp>
- <RegExp input="$INFO[TrailerQ]" output="<url function="Get1080pTrailer">http://www.hd-trailers.net/movie/$$19</url>" dest="5+">
- <expression>1080p</expression>
- </RegExp>
- <expression noclean="1"/>
- </RegExp>
- </GetDetails>
- <ParseIMDBAKATitles dest="5">
- <!--Chooses the title to display from the combined page (buffer 1) according to the akatitles setting. The chosen title ends up in buffer 2 and is emitted as both sorttitle and title. The order of the expressions matters: later matches overwrite earlier ones (assuming expressions are evaluated in document order)-->
- <RegExp input="$$2" output="<details><sorttitle>\1</sorttitle><title>\1</title></details>" dest="5">
- <!--Starting value for buffer 2: text of the page's h1 heading-->
- <RegExp input="$$1" output="\1" dest="2">
- <expression><h1>([^<]*)</expression>
- </RegExp>
- <!--Buffer 4 is filled from buffer 10, which the nested expressions below compute as the English / international title-->
- <RegExp input="$$10" output="\1" dest="4">
- <!--Buffer 9: original title from the meta title, without quote entities and the "(... year)" part-->
- <RegExp input="$$1" output="\1" dest="9">
- <expression><meta name="title" content="(?:&#x22;)?([^"]*?)(?:&#x22;)? \([^\(]*?([0-9]{4})\)</expression>
- </RegExp>
- <!--Buffer 10 starts as a copy of the original title-->
- <RegExp input="$$9" output="\1" dest="10">
- <expression />
- </RegExp>
- <!--Each pair below looks for a quoted AKA entry with a given marker into buffer 11 and, when buffer 11 is non-empty, copies it to buffer 10. First marker: Hong Kong ... English-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^<]+[<em>]?[^"]+Hong Kong [<em>][^"]+English</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--Canada followed by "(English" or "(imdb"-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^<]+[<em>]?[^"]+((Canada)\s(<em>)?\((English|imdb))</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--UK immediately followed by a line break tag-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^<]+[<em>]?[^"]+(UK(<em>)?<br>)</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--International (English title) followed by a comma or a tag-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^"]+International\s(<em>)?\(English title\)(</em>)?(,|<)( |b)</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--International (English title) followed by "(imdb"-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^"]+International\s(<em>)?\(English title\)(</em>)? (<em>)?\(imdb</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--If a country link with text UK closes its div, buffer 10 is reset to the original title from buffer 9-->
- <RegExp input="$$1" output="\1" dest="12">
- <expression clear="yes"><a href="/country/[^>]+>(UK</a></div>)</expression>
- </RegExp>
- <RegExp input="$$12" output="$$9" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--Same reset to the original title when the country link text is USA-->
- <RegExp input="$$1" output="\1" dest="12">
- <expression clear="yes"><a href="/country/[^>]+>(USA</a></div>)</expression>
- </RegExp>
- <RegExp input="$$12" output="$$9" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--USA AKA entries are checked last and therefore win: USA followed by a line break tag-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^<]+[<em>]?[^"]+(USA(<em>)?<br>)</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--USA followed by "(English" or "(imdb"-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^<]+[<em>]?[^"]+((USA)\s(<em>)?\((English|imdb))</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <!--USA followed by "(new title"-->
- <RegExp input="$$1" output="\1" dest="11">
- <expression clear="yes">>\s*?"([^<]+)"[^<]+[<em>]?[^"]+((USA)\s(<em>)?\((new title))</expression>
- </RegExp>
- <RegExp input="$$11" output="\1" dest="10">
- <expression>(.+)</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- <!--A non-empty buffer 4 (the English / international title) replaces the h1 text in buffer 2-->
- <RegExp input="$$4" output="\1" dest="2">
- <expression>(.+)</expression>
- </RegExp>
- <!--Quoted AKA entry whose trailing text contains the akatitles setting value (the selected country name)-->
- <RegExp input="$$1" output="\1" dest="4">
- <expression>>\s*?"([^<]+)"[^<]+[<em>]?[^"]+$INFO[akatitles]</expression>
- </RegExp>
- <RegExp input="$$4" output="\1" dest="2">
- <expression>(.+)</expression>
- </RegExp>
- <!--If the selected country appears as a country link that closes its div, buffer 4 is set to the original title from buffer 9. Buffer 5 is used as scratch here and is overwritten by the enclosing expression afterwards-->
- <RegExp input="$$1" output="\1" dest="5">
- <expression>><a href="/country/[^>]+>($INFO[akatitles]</a></div>)</expression>
- </RegExp>
- <RegExp input="$$5" output="$$9" dest="4">
- <expression>($INFO[akatitles])</expression>
- </RegExp>
- <!--Setting value "Keep Original" also selects the original title-->
- <RegExp input="$INFO[akatitles]" output="$$9" dest="4">
- <expression>Keep Original</expression>
- </RegExp>
- <!--Final copy of the selected title into buffer 2-->
- <RegExp input="$$4" output="\1" dest="2">
- <expression>(.+)</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </ParseIMDBAKATitles>
- <ParseIMDBCertification dest="5">
- <!--Collects certification entries from the combined page (buffer 1) into buffer 2 and wraps them in a details element written to buffer 5-->
- <RegExp input="$$2" output="<details>\1</details>" dest="5">
- <!--One certification per link whose target contains "certificates="; the link text is used as the value-->
- <RegExp input="$$1" output="<certification>\1</certification>" dest="2+">
- <expression repeat="yes">certificates=[^"]*">([^<]*)</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </ParseIMDBCertification>
- <ParseIMDBCast dest="5">
- <!--Extracts actor entries (thumb, name, role) from the cast table of the main page (buffer 1) and wraps them in a details element written to buffer 5-->
- <RegExp input="$$2" output="<details>\1</details>" dest="5">
- <!--Buffer 6: content of the table with class cast_list-->
- <RegExp input="$$1" output="\1" dest="6">
- <expression noclean="1"><table class="cast_list">(.*?)</table></expression>
- </RegExp>
- <!--Actors with a .jpg image inside a noscript block: name from the alt text, role from the text after the cell whose class ends in "ter". The thumb is rebuilt from the image url prefix, the literal _SX512_SY512_ and the .jpg suffix-->
- <RegExp input="$$6" output="<actor><thumb>\2_SX512_SY512_\3</thumb><name>\1</name><role>\5</role></actor>" dest="7">
- <expression repeat="yes" clear="yes" trim="3,4" noclean="1,2"><noscript><img \n[^a]*alt="([^"]*)"[^"]*"[^"]*"[^s]*src="(?:([^"]*\.)[^"]*(\.jpg))[^>]*.*?ter">[^>]*>\n\s*(<[^>]*>)?([^<\(]*)?</expression>
- </RegExp>
- <!--Actors whose image is a .png with an empty class attribute are added with an empty thumb-->
- <RegExp input="$$6" output="<actor><thumb></thumb><name>\1</name><role>\3</role></actor>" dest="7+">
- <expression repeat="yes" trim="1,2" noclean="1,2"><img \n[^a]*alt="([^"]*)"[^"]*"[^"]*"[^s]*src="(?:[^"]*\.[^"]*\.png)" class="" />*.*?ter">[^>]*>\n\s*(<[^>]*>)?([^<\(]*)?</expression>
- </RegExp>
- <!--Clean-up pass over buffer 7: a thumb is kept only when it starts with http; a thumb consisting of just the size token or nothing becomes empty. Results are appended to buffer 2-->
- <RegExp input="$$7" output="<actor><thumb>\1</thumb>\2</actor>" dest="2+">
- <expression repeat="yes" clear="yes" noclean="1,2,3"><actor><thumb>(?:(http.*?)|_SX[0-9]+_SY[0-9]+_)?</thumb>(.*?)</actor></expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </ParseIMDBCast>
- <ParseIMDBDirectors dest="5">
- <!--Extracts director names from the main page (buffer 1) into buffer 2 and wraps them in a details element written to buffer 5-->
- <RegExp input="$$2" output="<details>\1</details>" dest="5">
- <!--Buffer 6: the section between the "Director" or "Directors" heading and the next "<div class"-->
- <RegExp input="$$1" output="\1" dest="6">
- <expression clear="yes" noclean="1">Director[s]?.*?</h4>(.*?)<div class</expression>
- </RegExp>
- <!--One director per /name link in that section, using the link text-->
- <RegExp input="$$6" output="<director>\1</director>" dest="2+">
- <expression repeat="yes" fixchars="1" clear="yes"><a href="/name[^>]*>([^<]*)<</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </ParseIMDBDirectors>
- <ParseIMDBWriters dest="5">
- <!--Extracts writer names from the main page (buffer 1) into buffer 2 as credits entries and wraps them in a details element written to buffer 5-->
- <RegExp input="$$2" output="<details>\1</details>" dest="5">
- <!--Buffer 6: the section between the "Writer" or "Writers" heading and the next "<div class". Unlike ParseIMDBDirectors, these expressions carry no clear attribute-->
- <RegExp input="$$1" output="\1" dest="6">
- <expression noclean="1">Writer[s]?.*?</h4>(.*?)<div class</expression>
- </RegExp>
- <!--One credits entry per /name link in that section, using the link text-->
- <RegExp input="$$6" output="<credits>\1</credits>" dest="2+">
- <expression repeat="yes" fixchars="1"><a href="/name[^>]*>([^<]*)<</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </ParseIMDBWriters>
- <ParseTMDBFanart dest="5">
- <!--Converts backdrop entries of the TMDb images document (buffer 1) into fanart thumbs. The enclosing expression is (.+), so it only matches when buffer 2 is non-empty-->
- <RegExp input="$$2" output="<details><fanart>\1</fanart></details>" dest="5">
- <!--Step 1, buffer 3: the inner content of every backdrop element, each wrapped in a thumb element-->
- <RegExp input="$$1" output="<thumb>\1</thumb>" dest="3">
- <expression noclean="1" repeat="yes"><backdrop[^>]*>(.*?)</backdrop></expression>
- </RegExp>
- <!--Step 2, buffer 4: the url of the size="poster" image is moved into a preview attribute; the rest of the content is kept-->
- <RegExp input="$$3" output="<thumb preview="\2">\1\3</thumb>" dest="4">
- <expression noclean="1,3" repeat="yes"><thumb>(.*?)url="([^"]*)" size="poster"(.*?)</thumb></expression>
- </RegExp>
- <!--Step 3, buffer 2: the thumb content is reduced to the url of the size="original" image, keeping the attributes from step 2-->
- <RegExp input="$$4" output="<thumb\1>\2</thumb>" dest="2">
- <expression repeat="yes" noclean="1"><thumb([^>]*)>.*?url="([^"]*)" size="original".*?</thumb></expression>
- </RegExp>
- <expression noclean="1">(.+)</expression>
- </RegExp>
- </ParseTMDBFanart>
- <ParseTMDBThumbs dest="5">
- <!--Converts poster entries of the TMDb images document (buffer 1) into thumbs. The enclosing expression is (.+), so it only matches when buffer 2 is non-empty-->
- <RegExp input="$$2" output="<details>\1</details>" dest="5">
- <!--Step 1, buffer 3: the inner content of every poster element, each wrapped in a thumb element-->
- <RegExp input="$$1" output="<thumb>\1</thumb>" dest="3">
- <expression noclean="1" repeat="yes"><poster[^>]*>(.*?)</poster></expression>
- </RegExp>
- <!--Step 2, buffer 4: the url of the size="mid" image is moved into a preview attribute; the rest of the content is kept-->
- <RegExp input="$$3" output="<thumb preview="\2">\1\3</thumb>" dest="4">
- <expression noclean="1,3" repeat="yes"><thumb>(.*?)url="([^"]*)" size="mid"(.*?)</thumb></expression>
- </RegExp>
- <!--Step 3, buffer 2: the thumb content is reduced to the url of the size="original" image, keeping the attributes from step 2-->
- <RegExp input="$$4" output="<thumb\1>\2</thumb>" dest="2">
- <expression repeat="yes" noclean="1"><thumb([^>]*)>.*?url="([^"]*)" size="original".*?</thumb></expression>
- </RegExp>
- <expression noclean="1">(.+)</expression>
- </RegExp>
- </ParseTMDBThumbs>
- <GetTMDBPlot dest="5">
- <!--Reads the id element from the TMDb lookup result (buffer 1) and emits a follow-up Movie.getInfo request in the language given by the plotlanguage setting, handled by ParseTMDBPlot. The cache name contains both the language and the id-->
- <RegExp input="$$1" output="<details><url function="ParseTMDBPlot" cache="tmdb-info-$INFO[plotlanguage]-\1.xml">http://api.themoviedb.org/2.1/Movie.getInfo/$INFO[plotlanguage]/xml/57983e31fb435df4df77afb854740ea9/\1</url></details>" dest="5">
- <expression noclean="1"><id>([^<]*)</id></expression>
- </RegExp>
- </GetTMDBPlot>
- <ParseTMDBPlot dest="5">
- <!--Builds plot and outline from the overview element of the TMDb info document (buffer 1). The enclosing expression is (.+), so it only matches when buffer 2 is non-empty-->
- <RegExp input="$$2" output="<details>\1</details>" dest="5">
- <!--plot: the full overview text-->
- <RegExp input="$$1" output="<plot>\1</plot>" dest="2">
- <expression noclean="1"><overview>([^<]*)</overview></expression>
- </RegExp>
- <!--outline: at least 180 characters of the overview, cut at the first ".", "?" or "!" after that point, with a "." appended by the output; not produced when no such terminator exists-->
- <RegExp input="$$1" output="<outline>\1.</outline>" dest="2+">
- <expression noclean="1"><overview>(.{180,}?)[.?!]</expression>
- </RegExp>
- <expression noclean="1">(.+)</expression>
- </RegExp>
- </ParseTMDBPlot>
- <Get480pTrailer dest="5">
- <!--Fetch 480p trailer link from hdtrailers.net-->
- <!--The numeric sid is taken from the link marked rel="lightbox[res480p" that follows the "Trailer" table cell, and is inserted into a playlist.yahoo.com makeplaylist url emitted as the trailer-->
- <RegExp input="$$1" output="<details><trailer>http://playlist.yahoo.com/makeplaylist.dll?sdm=web&pt=rd&sid=\1</trailer></details>" dest="5">
- <expression noclean="1">">Trailer</span></td>.*?sid=(\d*)" rel="lightbox\[res480p</expression>
- </RegExp>
- </Get480pTrailer>
- <Get720pTrailer dest="5">
- <!--Emits a trailer url from buffer 6. Both nested expressions write buffer 6 in turn, 480p first and 720p second, so a 720p match replaces the 480p one (assuming a non-matching expression without clear leaves the buffer unchanged)-->
- <RegExp input="$$6" output="<details><trailer>\1</trailer></details>" dest="5">
- <!--Fallback to fetch 480p trailer link if 720p is not available-->
- <RegExp input="$$1" output="http://playlist.yahoo.com/makeplaylist.dll?sdm=web&pt=rd&sid=\1" dest="6">
- <expression noclean="1">">Trailer</span></td>.*?sid=(\d*)" rel="lightbox\[res480p</expression>
- </RegExp>
- <!--Fetch 720p trailer link from hdtrailers.net-->
- <RegExp input="$$1" output="http://playlist.yahoo.com/makeplaylist.dll?sdm=web&pt=rd&sid=\1" dest="6">
- <expression noclean="1">">Trailer</span></td>.*?sid=(\d*)" rel="lightbox\[res720p</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </Get720pTrailer>
- <Get1080pTrailer dest="5">
- <!--Emits a trailer url from buffer 6. The nested expressions write buffer 6 in turn, 480p then 720p then 1080p, so the highest quality that matches is the one left in the buffer (assuming a non-matching expression without clear leaves the buffer unchanged)-->
- <RegExp input="$$6" output="<details><trailer>\1</trailer></details>" dest="5">
- <!--Fallback to fetch 480p trailer link if 720p and 1080p are not available-->
- <RegExp input="$$1" output="http://playlist.yahoo.com/makeplaylist.dll?sdm=web&pt=rd&sid=\1" dest="6">
- <expression noclean="1">">Trailer</span></td>.*?sid=(\d*)" rel="lightbox\[res480p</expression>
- </RegExp>
- <!--Fallback to fetch 720p trailer link if 1080p is not available-->
- <RegExp input="$$1" output="http://playlist.yahoo.com/makeplaylist.dll?sdm=web&pt=rd&sid=\1" dest="6">
- <expression noclean="1">">Trailer</span></td>.*?sid=(\d*)" rel="lightbox\[res720p</expression>
- </RegExp>
- <!--Fetch 1080p trailer link from hdtrailers.net-->
- <RegExp input="$$1" output="http://playlist.yahoo.com/makeplaylist.dll?sdm=web&pt=rd&sid=\1" dest="6">
- <expression noclean="1">">Trailer</span></td>.*?sid=(\d*)" rel="lightbox\[res1080p</expression>
- </RegExp>
- <expression noclean="1" />
- </RegExp>
- </Get1080pTrailer>
- </scraper>
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement