diff options
Diffstat (limited to 'system/scrapers/video/filmstarts.xml')
-rw-r--r-- | system/scrapers/video/filmstarts.xml | 159 |
1 files changed, 159 insertions, 0 deletions
<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  Filmstarts.de movie scraper definition.
  Origin: system/scrapers/video/filmstarts.xml (added as a new file, blob 676224405c).

  Reading notes (conventions of the XBMC scraper framework; confirm against the
  framework documentation before relying on them):
    * Each top-level child of the scraper element is a named function whose
      result is taken from the buffer named by its dest attribute.
    * input="$$N" reads buffer N; dest="N" overwrites buffer N; dest="N+" appends.
    * A RegExp with nested RegExp children presumably evaluates the children first.
    * output attributes hold XML fragments, so every markup character inside
      them is entity-escaped here to keep this file well-formed.
-->
<scraper framework="1.1" date="2009-08-15" name="Filmstarts" content="movies" thumb="filmstarts.jpg" language="de">
  <include>common/tmdb.xml</include>

  <!-- Settings: a single boolean "fanart" switch, enabled by default. -->
  <GetSettings dest="3">
    <RegExp input="$$5" output="&lt;settings&gt;\1&lt;/settings&gt;" dest="3">
      <RegExp input="$$1" output="&lt;setting label=&quot;Fanart&quot; type=&quot;bool&quot; id=&quot;fanart&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
        <expression></expression>
      </RegExp>
      <expression noclean="1"></expression>
    </RegExp>
  </GetSettings>

  <!--
    NFO handling: a filmstarts.de review link is used directly; an IMDb link
    (old "Title?123" form or "/title/tt123" form) is redirected to the IMDb
    external reviews page and handed to GetByIMDBId.
  -->
  <NfoUrl dest="3">
    <RegExp input="$$1" output="&lt;url&gt;http://www.filmstarts.de/kritiken/\2.html&lt;/url&gt;" dest="3">
      <expression clear="yes" noclean="1">(filmstarts.de/kritiken/)(.*).html</expression>
    </RegExp>
    <RegExp input="$$1" output="&lt;url function=&quot;GetByIMDBId&quot;&gt;http://www.imdb.com/title/tt\2/externalreviews&lt;/url&gt;" dest="3+">
      <expression>(imdb.com/)Title\?([0-9]+)</expression>
    </RegExp>
    <RegExp input="$$1" output="&lt;url function=&quot;GetByIMDBId&quot;&gt;http://www.imdb.com/title/tt\2/externalreviews&lt;/url&gt;" dest="3+">
      <expression>(imdb.com/title/tt)([0-9]*)</expression>
    </RegExp>
  </NfoUrl>

  <!-- Picks the filmstarts.de review link out of the fetched IMDb external reviews page. -->
  <GetByIMDBId dest="3">
    <RegExp input="$$1" output="&lt;url&gt;http://www.filmstarts.de/kritiken/\1&lt;/url&gt;" dest="3+">
      <expression noclean="1">&lt;a href="http://www.filmstarts.de/kritiken/([^"]*)"</expression>
    </RegExp>
  </GetByIMDBId>

  <!--
    Builds the site search URL around the search string (\1).
    The emitted fragment is itself XML, so each query separator is written as
    an escaped ampersand inside it, including the trailing one.
  -->
  <CreateSearchUrl dest="3" SearchStringEncoding="iso-8859-1">
    <RegExp input="$$1" output="&lt;url&gt;http://www.filmstarts.de/finde.html?t=film&amp;amp;anfrage=\1&amp;amp;x=0&amp;amp;y=0&amp;amp;&lt;/url&gt;" dest="3">
      <expression noclean="1"></expression>
    </RegExp>
  </CreateSearchUrl>

  <!-- Turns every hit of the search page into one entity with a title and a review URL. -->
  <GetSearchResults dest="3">
    <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="3">
      <RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\2&lt;/title&gt;&lt;url&gt;http://www.filmstarts.de/kritiken/\1&lt;/url&gt;&lt;/entity&gt;" dest="5">
        <expression repeat="yes">&lt;li&gt;&lt;a href="/kritiken/([^"]*)"&gt;.*?&lt;span class="t"&gt;([^&lt;]*)&lt;/span&gt;</expression>
      </RegExp>
      <expression noclean="1"></expression>
    </RegExp>
  </GetSearchResults>

  <!-- Extracts the movie details from a review page; every field is appended to buffer 5. -->
  <GetDetails dest="3">
    <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;details&gt;\1&lt;/details&gt;" dest="3">

      <!-- Title: page title text up to the first "<", "|", "^" or "(" -->
      <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="5+">
        <expression trim="1" noclean="1">&lt;title&gt;([^&lt;|^(]*)</expression>
      </RegExp>

      <!-- Original title -->
      <RegExp input="$$1" output="&lt;originaltitle&gt;\1&lt;/originaltitle&gt;" dest="5+">
        <expression>Originaltitel:(.*?)&lt;/div</expression>
      </RegExp>

      <!-- Year -->
      <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="5+">
        <expression trim="1" noclean="1">genre".*weak".*[A-Z]([0-9 ]*) &lt;/div</expression>
      </RegExp>

      <!-- Age rating (FSK), emitted as "ab NN" -->
      <RegExp input="$$1" output="&lt;mpaa&gt;ab \1&lt;/mpaa&gt;" dest="5+">
        <expression>FSK:.*?Ab ([0-9]*)&lt;</expression>
      </RegExp>

      <!-- Director -->
      <RegExp input="$$1" output="&lt;director&gt;\1&lt;/director&gt;" dest="5+">
        <expression trim="1" noclean="1">Regie&lt;/span&gt;.*?class="name"&gt;(.*?)&lt;/span</expression>
      </RegExp>

      <!-- Studio (taken from the "Verleih" row) -->
      <RegExp input="$$1" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="5+">
        <expression trim="1" noclean="1">Verleih:.*?"&gt;(.*?)&lt;/td</expression>
      </RegExp>

      <!-- Runtime -->
      <RegExp input="$$1" output="&lt;runtime&gt;\1&lt;/runtime&gt;" dest="5+">
        <expression trim="1" noclean="1">Laufzeit:&lt;/span&gt;.*?"&gt;([A-Za-z0-9 ]*)&lt;/td</expression>
      </RegExp>

      <!-- User rating: the two numbers of "Wertung: A / B" become rating and votes -->
      <RegExp input="$$1" output="&lt;rating&gt;\1&lt;/rating&gt;&lt;votes&gt;\2&lt;/votes&gt;" dest="5+">
        <expression trim="1" noclean="1">"Wertung: ([0-9]*) / ([0-9]*)"</expression>
      </RegExp>

      <!-- Genre: text of the first link inside the genre block -->
      <RegExp input="$$1" output="&lt;genre&gt;\1&lt;/genre&gt;" dest="5+">
        <expression trim="1" noclean="1">&lt;div class="genre"&gt;&lt;a.*?"&gt;(.*?)&lt;/a</expression>
      </RegExp>

      <!-- Writer (taken from the "Drehbuch" entry; ASCII letters and spaces only) -->
      <RegExp input="$$1" output="&lt;credits&gt;\1&lt;/credits&gt;" dest="5+">
        <expression trim="1" noclean="1">Drehbuch&lt;/span&gt;.*?class="name"&gt;([A-Za-z ]*)&lt;/span</expression>
      </RegExp>

      <!-- Plot: two page layouts are tried, plain text or text following a double line break -->
      <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="5+">
        <expression trim="1">"text critic topBorder"&gt;([^&lt;]*)&lt;/div</expression>
      </RegExp>
      <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="5+">
        <expression trim="1">"text critic topBorder"&gt;.*?&lt;br /&gt;&lt;br /&gt;(.*?)&lt;/div&gt;</expression>
      </RegExp>

      <!-- Actors: the movie slug is read from the "bilder.html" link and reused for castcrew.html -->
      <RegExp input="$$1" output="&lt;url function=&quot;GetActors&quot;&gt;http://www.filmstarts.de/kritiken/\1/castcrew.html&lt;/url&gt;" dest="5+">
        <expression noclean="1">/kritiken/([-.%a-z0-9A-Z]+)/bilder.html</expression>
      </RegExp>

      <!-- Posters: follow-up request for the picture page of the same slug -->
      <RegExp input="$$1" output="&lt;url function=&quot;GetPosters&quot;&gt;http://www.filmstarts.de/kritiken/\1/bilder.html&lt;/url&gt;" dest="5+">
        <expression noclean="1">/kritiken/([-.%a-z0-9A-Z]+)/bilder.html</expression>
      </RegExp>

      <!--
        Fanart (only when the "fanart" setting is on): buffer 7 receives
        "title"+year+||+"original title"; its tokens (split on spaces and
        commas) are joined with "+" into buffer 8, which forms a Google query
        restricted to imdb.com and is passed to GetTMDBFanartByIMDBId.
      -->
      <RegExp conditional="fanart" input="$$8" output="&lt;url function=&quot;GetTMDBFanartByIMDBId&quot;&gt;http://www.google.com/search?q=site:imdb.com\1&lt;/url&gt;" dest="5+">
        <RegExp input="$$1" output="&quot;\1&quot;+\3+||+&quot;\2&quot;" dest="7">
          <expression>&lt;title&gt;([^&lt;|^(]*).*Originaltitel:(.*?)&lt;/div&gt;.*weak".*[A-Z]([0-9 ]*) &lt;/div</expression>
        </RegExp>
        <RegExp input="$$7" output="+\1" dest="8+">
          <expression repeat="yes">([^ ,]+)</expression>
        </RegExp>
        <expression></expression>
      </RegExp>

      <expression noclean="1"></expression>
    </RegExp>
  </GetDetails>

  <!-- Posters: each "mini" thumbnail on the picture page yields an "image" preview and a "wallpaper" full-size URL. -->
  <GetPosters dest="5">
    <RegExp input="$$2" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;details&gt;\1&lt;/details&gt;" dest="5+">
      <RegExp input="$$1" output="&lt;thumb preview=&quot;http://thumbs.filmstarts.de/image/\1&quot;&gt;http://thumbs.filmstarts.de/wallpaper/\1&lt;/thumb&gt;" dest="2">
        <expression repeat="yes">src="http://thumbs.filmstarts.de/mini/([^"]*)"</expression>
      </RegExp>
      <expression noclean="1"></expression>
    </RegExp>
  </GetPosters>

  <!--
    Actors: everything after the "Schauspieler" heading is copied to buffer 7,
    then three patterns are applied to it in turn: actors with a photo and a
    role, actors with the placeholder avatar and a role, and bare names.
  -->
  <GetActors dest="5">
    <RegExp input="$$2" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;details&gt;\1&lt;/details&gt;" dest="5+">
      <RegExp input="$$1" output="\1" dest="7+">
        <expression noclean="1">Schauspieler&lt;/li&gt;(.*)</expression>
      </RegExp>
      <RegExp input="$$7" output="&lt;actor&gt;&lt;name&gt;\1&lt;/name&gt;&lt;thumb&gt;http://thumbs.filmstarts.de/wallpaper/\2&lt;/thumb&gt;&lt;role&gt;\3&lt;/role&gt;&lt;/actor&gt;" dest="2+">
        <expression repeat="yes">img alt="([^"]*)".*?src="http://thumbs.filmstarts.de/nano/([^"]*)".*?role weak.*?"&gt;als ([A-Za-z ]*)&lt;</expression>
      </RegExp>
      <RegExp input="$$7" output="&lt;actor&gt;&lt;name&gt;\1&lt;/name&gt;&lt;role&gt;\2&lt;/role&gt;&lt;/actor&gt;" dest="2+">
        <expression repeat="yes">img alt="([^"]*)".*?src="/designs/default/images/no_avatar_small.gif".*?role weak.*?"&gt;als ([A-Za-z ]*)&lt;</expression>
      </RegExp>
      <RegExp input="$$7" output="&lt;actor&gt;&lt;name&gt;\1&lt;/name&gt;&lt;/actor&gt;" dest="2+">
        <expression repeat="yes">class="name"&gt;([A-Za-z ]*)&lt;/span</expression>
      </RegExp>
      <expression noclean="1"></expression>
    </RegExp>
  </GetActors>
</scraper>