about summary refs log tree commit diff
diff options
context:
space:
mode:
author vdrfan <vdrfan@svn> 2009-12-20 07:11:46 +0000
committer vdrfan <vdrfan@svn> 2009-12-20 07:11:46 +0000
commit f235603c4cccb2bbf2d163764f34f5b0a3b383c5 (patch)
tree f6156f6728d7c7ea57b8330b39f77bf961c732de
parent aa760aa635d36d3c9e27cb823503042400d2674d (diff)
fixed: Ticket #8219 - Daum Movie Scraper Patch (thanks hojel!)
git-svn-id: https://xbmc.svn.sourceforge.net/svnroot/xbmc/trunk@25870 568bbfeb-2a22-0410-94d2-cc84cf5bfa90
-rw-r--r-- system/scrapers/video/daum.xml 58
1 files changed, 34 insertions, 24 deletions
diff --git a/system/scrapers/video/daum.xml b/system/scrapers/video/daum.xml
index f84bed4084..896c748d45 100644
--- a/system/scrapers/video/daum.xml
+++ b/system/scrapers/video/daum.xml
@@ -27,7 +27,7 @@
<GetSearchResults dest="8">
<RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;UTF-8&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="8">
<RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\2(\4,\3) &lt;/title&gt;&lt;url&gt;http://movie.daum.net/moviedetail/moviedetailMain.do?movieId=\1&lt;/url&gt;&lt;/entity&gt;" dest="5">
- <expression repeat="yes">class=&quot;fl srch&quot;&gt;&lt;a href=&quot;http://movie.daum.net/moviedetail/moviedetailMain.do\?movieId=([0-9]*)&quot;[^&gt;]*&gt;(.[^\(]*)\(([0-9]*)\)[^\%]*\%&quot;[^&quot;]*&quot;cb&quot;[^&quot;]*&quot;fs13[^&quot;]*&quot;&gt;(.[^\/]*)\/</expression>
+ <expression repeat="yes">class=&quot;fl srch&quot;&gt;&lt;a href=&quot;http://movie.daum.net/moviedetail/moviedetailMain.do\?movieId=([0-9]+)&quot;[^&gt;]*&gt;([^%]*)&lt;/a&gt;[ ]*\(([0-9]+)\)&lt;/span&gt;[^\(]*&quot;fs13&quot;&gt;([^&quot;]*)&lt;/span</expression>
</RegExp>
<expression noclean="1"/>
</RegExp>
@@ -35,22 +35,38 @@
<GetDetails dest="3">
<RegExp input="$$8" output="&lt;details&gt;\1&lt;/details&gt;" dest="3">
<!-- Titles, year !-->
+ <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;&lt;year&gt;\2&lt;/year&gt;" dest="8">
+ <expression noclean="1">class=&quot;title_kor&quot;[ ]*&gt;([^&lt;]+)&lt;/strong&gt;[^\(]*\(.*?&lt;?([0-9]+).*?title_AKA&quot;[ ]*&gt;[ \n]*&lt;span class=&quot;eng&quot;&gt;[ \n]*&lt;/span</expression>
+ </RegExp>
+ <RegExp input="$$1" output="&lt;title&gt;\1 (\3)&lt;/title&gt;&lt;year&gt;\2&lt;/year&gt;" dest="8">
+ <expression noclean="1">class=&quot;title_kor&quot;[ ]*&gt;([^&lt;]+)&lt;/strong&gt;[^\(]*\(.*?&lt;?([0-9]+).*?title_AKA&quot;[ ]*&gt;[ \n]*&lt;span class=&quot;eng&quot;&gt;[ \n]*([^ \n][^&lt;]*)&lt;/span</expression>
+ </RegExp>
<RegExp input="$$1" output="&lt;title&gt;\1 (\3)&lt;/title&gt;&lt;year&gt;\2&lt;/year&gt;" dest="8">
- <expression noclean="1">class=&quot;title_kor&quot;&gt;&lt;a[^&gt;]*&gt;(.[^&lt;]*)&lt;/a&gt;&lt;/strong&gt;[^&gt;]*&gt;\(&lt;a[^&gt;]*&gt;([0-9]*)&lt;/a&gt;\)[^&quot;]*&quot;title_AKA&quot;[^&quot;]*&quot;eng&quot;&gt;(.[^&lt;]*)&lt;</expression>
+ <expression noclean="1">class=&quot;title_kor&quot;[ ]*&gt;([^&lt;]+)&lt;/strong&gt;[^\(]*\(.*?&lt;?([0-9]+).*?title_AKA&quot;[ ]*&gt;[ \n]*([^ \n].*?)&lt;span class=&quot;eng&quot;&gt;[ \n]*&lt;/span</expression>
+ </RegExp>
+ <RegExp input="$$1" output="&lt;title&gt;\1 (\3,\4)&lt;/title&gt;&lt;year&gt;\2&lt;/year&gt;" dest="8+">
+ <expression noclean="1">class=&quot;title_kor&quot;[ ]*&gt;([^&lt;]+)&lt;/strong&gt;[^\(]*\(.*?&lt;?([0-9]+).*?title_AKA&quot;[ ]*&gt;([^&quot;]+)&quot;eng&quot;&gt;([^&lt;]*)&lt;/span</expression>
</RegExp>
<!-- Director's names !-->
<RegExp input="$$7" output="&lt;director&gt;\1&lt;/director&gt;" dest="8+">
<RegExp input="$$1" output="\1" dest="7">
- <expression noclean="1">&lt;strong&gt;감독&lt;/strong&gt;(.*)&lt;strong&gt;등급&lt;/strong&gt;</expression>
+ <expression noclean="1">&lt;strong&gt;감독&lt;/strong&gt;(.*?)&lt;strong&gt;출연&lt;/strong&gt;</expression>
+ </RegExp>
+ <expression noclean="1" repeat="yes">&lt;a href=[^&gt;]*&gt;([^&lt;]+)&lt;/a&gt;</expression>
+ </RegExp>
+ <!-- Studio !-->
+ <RegExp input="$$7" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="8+">
+ <RegExp input="$$1" output="\1" dest="7">
+ <expression noclean="1">&lt;strong&gt;제작/배급&lt;/strong&gt;(.*?)&lt;strong&gt;감독&lt;/strong&gt;</expression>
</RegExp>
- <expression noclean="1" repeat="yes">&lt;a[^&gt;]*&gt;(.[^&lt;]*)&lt;/a&gt;</expression>
+ <expression noclean="1" repeat="yes">&lt;a href=&quot;[^&gt;]*&gt;([^&lt;]+)&lt;/a&gt;</expression>
</RegExp>
<!-- Actors !-->
- <RegExp input="$$7" output="&lt;actor&gt;&lt;name&gt;\1&lt;/name&gt;&lt;role&gt;\2&lt;/role&gt;&lt;thumb&gt;\3&lt;/thumb&gt;&lt;/actor&gt;" dest="8+">
+ <RegExp input="$$7" output="&lt;actor&gt;&lt;name&gt;\2&lt;/name&gt;&lt;role&gt;\3&lt;/role&gt;&lt;thumb&gt;\1&lt;/thumb&gt;&lt;/actor&gt;" dest="8+">
<RegExp input="$$1" output="\1" dest="7">
- <expression noclean="1">&quot;div_actors&quot;(.*)&quot;netizenGrade&quot;</expression>
+ <expression noclean="1">출연.*?&quot;actors&quot;(.*)&quot;gradeWrap&quot;</expression>
</RegExp>
- <expression noclean="1" repeat="yes">class=&quot;actor&quot; title=&quot;(.[^\|]*)\|\|(.[^&quot;]*)&quot;&gt;&lt;img src=&quot;(.[^&quot;]*)&quot;</expression>
+ <expression noclean="1" repeat="yes">class=&quot;cast_text&quot;&gt;&lt;img id=&quot;[^&quot;]*&quot;src=&quot;(.[^&quot;]*)&quot;[^&gt;]*&gt;[^&gt;]*&gt;(.[^&lt;]*)&lt;/a&gt;[^\(]*\((.[^\)]*)\)</expression>
</RegExp>
<!-- Tag Line !-->
<RegExp input="$$7" output="&lt;tagline&gt;\1&lt;/tagline&gt;" dest="8+">
@@ -60,11 +76,11 @@
<expression>class=&quot;txt&quot;&gt;[^&gt;]*&gt;(.[^&lt;]*)&lt;/b&gt;</expression>
</RegExp>
<!-- Plot !-->
- <RegExp input="$$7" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="8+">
- <expression>class=&quot;txt&quot;&gt;[^&gt;]*&gt;[^&lt;]*&lt;/b&gt;&lt;br&gt;(.[^\t]*)\t</expression>
+ <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="8+">
+ <expression>&lt;div class=&quot;txt&quot;&gt;&lt;table&gt;&lt;tr&gt;&lt;td&gt;[^&gt;]*&gt;[^&gt;]*&gt;&lt;/a&gt;[^\t]*\t(.[^&lt;]*)&lt;</expression>
</RegExp>
- <RegExp input="$$7" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="8+">
- <expression>class=&quot;txt&quot;&gt;\n\t\t(.[^\t]*)\t</expression>
+ <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="8+">
+ <expression>&lt;div class=&quot;txt&quot;&gt;&lt;table&gt;&lt;tr&gt;&lt;td&gt;[^\t]*\t(.[^&lt;]*)&lt;</expression>
</RegExp>
<!-- Single Poster !-->
<RegExp conditional="!EnableThumbs" input="$$1" output="&lt;thumb&gt;\1&lt;/thumb&gt;" dest="8+">
@@ -100,11 +116,8 @@
<expression>&lt;span class=&quot;fs11 fc3&quot;&gt;\(([0-9]*)명 참여\)&lt;/span&gt;</expression>
</RegExp>
<!-- MPAA !-->
- <RegExp input="$$7" output="&lt;mpaa&gt;\1&lt;/mpaa&gt;" dest="8+">
- <RegExp input="$$1" output="\1" dest="7">
- <expression noclean="1">&lt;strong&gt;등급&lt;/strong&gt;&lt;/dt&gt;[^&gt;]*&gt;(.[^&lt;]*)&lt;/dd&gt;</expression>
- </RegExp>
- <expression noclean="1" trim="1">\b(.[^\t]*)\t</expression>
+ <RegExp input="$$1" output="&lt;mpaa&gt;\1&lt;/mpaa&gt;" dest="8+">
+ <expression noclean="1">icon_rating_[0-9]*\.gif&quot; title=&quot;(.[^&quot;]*)&quot;</expression>
</RegExp>
<!-- Poster !-->
<RegExp conditional="EnableThumbs" input="$$1" output="&lt;url function=&quot;GetDaumPoster&quot;&gt;\1&lt;/url&gt;" dest="8+">
@@ -122,7 +135,7 @@
</RegExp>
<!-- FanArts !-->
<RegExp conditional="EnableFanArt" input="$$1" output="&lt;url function=&quot;GetDAUMFanart&quot;&gt;\1&lt;/url&gt;" dest="8+">
- <expression noclean="1">class=&quot;title_kor&quot;&gt;&lt;a href=&quot;(.[^&quot;]*)&quot;</expression>
+ <expression noclean="1">&lt;a class=&quot;tab1&quot; href=&quot;(.[^&quot;]*)&quot;</expression>
</RegExp>
<!-- Writer !-->
<RegExp conditional="EnableWriter" input="$$1" output="&lt;url function=&quot;GetWriter&quot;&gt;\1&lt;/url&gt;" dest="8+">
@@ -134,13 +147,10 @@
<GetDaumPoster dest="8">
<RegExp input="$$9" output="&lt;details&gt;\1&lt;/details&gt;" dest="8">
<RegExp input="$$1" output="\1" dest="7">
- <expression noclean="1">id=&quot;photo&quot;(.*)id=&quot;steal&quot;</expression>
+ <expression noclean="1">id=&quot;photo&quot;(.*)id=&quot;photoViewer&quot;</expression>
</RegExp>
<RegExp input="$$7" output="&lt;thumb preview=&quot;http://\1/C155x225/\2&quot;&gt;http://\1/image/\2&lt;/thumb&gt;" dest="9">
- <expression noclean="1" repeat="yes">&lt;img src=&quot;http://(.[^/]*)/C155x225/(.[^&quot;]*)&quot;</expression>
- </RegExp>
- <RegExp input="$$7" output="&lt;thumb preview=&quot;http://movie.daum-img.net/movie/movie-photo/\1/\2/\3/155_225_\4&quot;&gt;http://movie.daum-img.net/movie/movie-photo/\1/\2/\3/\4&lt;/thumb&gt;" dest="9+">
- <expression noclean="1" repeat="yes">&lt;img src=&quot;http://movie.daum-img.net/movie/movie-photo/([0-9]*)/([0-9]*)/([0-9]*)/[0-9]*_[0-9]*_(.[^&quot;]*)&quot;</expression>
+ <expression noclean="1" repeat="yes">&lt;img src=&quot;http://([^/]+)/C155x225/([^&quot;]+)&quot;</expression>
</RegExp>
<expression noclean="1"/>
</RegExp>
@@ -152,7 +162,7 @@
</GetTMDBId>
<GetTMDBFanart clearbuffers="no" dest="8">
<RegExp input="$$1" output="&lt;thumb preview=&quot;http://themoviedb.org/image/backdrops/\1/\2_poster.\3&quot;&gt;http://themoviedb.org/image/backdrops/\1/\2.\3&lt;/thumb&gt;" dest="10+">
- <expression clear="yes" noclean="1" repeat="yes">&lt;backdrop size=&quot;original&quot;&gt;.*?/([0-9]+)/([^\.]+)\.([^&lt;]*)&lt;/backdrop&gt;</expression>
+ <expression clear="yes" noclean="1" repeat="yes">&lt;backdrop size=&quot;original&quot;&gt;.*?/([0-9]+)/([^\.]+)\.([a-zA-Z]*)[^&lt;]*&lt;/backdrop&gt;</expression>
</RegExp>
</GetTMDBFanart>
<GetDAUMFanart clearbuffers="no" dest="8">
@@ -165,7 +175,7 @@
</GetDAUMFanart>
<GetWriter dest="8">
<RegExp input="$$1" output="\1" dest="7">
- <expression noclean="1">&lt;h5&gt;각본&lt;/h5&gt;(.*)&lt;h5&gt;촬영&lt;/h5&gt;</expression>
+ <expression noclean="1">&lt;h5[ ]*&gt;[ ]*각본&lt;/h5&gt;(.*)&lt;h5[ ]*&gt;촬영&lt;/h5&gt;</expression>
</RegExp>
<RegExp input="$$6" output="&lt;details&gt;\1&lt;/details&gt;" dest="8">
<RegExp input="$$7" output="&lt;credits&gt;\1&lt;/credits&gt;" dest="6">