blob: c11931f92b90d758907835f294a165036b22e206 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
|
<?xml version="1.0" encoding="utf-8"?>
<scraper framework="1.0" date="2010-02-16" name="Rotten Tomatoes" content="movies" thumb="rottentomatoes.png" language="en">
<include>common/tmdb.xml</include>
<include>common/movieposterdb.xml</include>
<!--
  GetSettings: emits the <settings> document describing this scraper's
  user-configurable options (locality, ratetype, classreason, fanart, thumbs).
  Each nested RegExp writes one <setting> element into buffer 5 (the first
  with dest="5", the rest with dest="5+"); the outer RegExp then wraps
  buffer 5 in <settings> and stores it in buffer 3.
  The markup carried inside the output attributes is entity-escaped so that
  this file is well-formed XML; the decoded attribute values are unchanged.
-->
<GetSettings dest="3">
  <RegExp input="$$5" output="&lt;settings&gt;\1&lt;/settings&gt;" dest="3">
    <!-- Site locality; the value is used as the host prefix in every URL built by this scraper. -->
    <RegExp input="$$1" output="&lt;setting label=&quot;Location&quot; type=&quot;labelenum&quot; id=&quot;locality&quot; values=&quot;us|au|uk&quot; default=&quot;au&quot;&gt;&lt;/setting&gt;" dest="5">
      <expression></expression>
    </RegExp>
    <!-- Which score is reported as the rating; read in GetDetails via $INFO[ratetype]. -->
    <RegExp input="$$1" output="&lt;setting label=&quot;Rating Type&quot; type=&quot;labelenum&quot; id=&quot;ratetype&quot; values=&quot;Overall|Top Critics|RT Community&quot; default=&quot;Overall&quot;&gt;&lt;/setting&gt;" dest="5+">
      <expression></expression>
    </RegExp>
    <!-- Toggles the conditional="classreason" / "!classreason" MPAA expressions in GetDetails. -->
    <RegExp input="$$1" output="&lt;setting label=&quot;Retrieve Classification Reason&quot; type=&quot;bool&quot; id=&quot;classreason&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
      <expression></expression>
    </RegExp>
    <!-- Toggles the conditional="fanart" lookup in GetDetails. -->
    <RegExp input="$$1" output="&lt;setting label=&quot;Retrieve Fanart&quot; type=&quot;bool&quot; id=&quot;fanart&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
      <expression></expression>
    </RegExp>
    <!-- Toggles the conditional="thumbs" lookup in GetDetails. -->
    <RegExp input="$$1" output="&lt;setting label=&quot;Retrieve Thumbs&quot; type=&quot;bool&quot; id=&quot;thumbs&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
      <expression></expression>
    </RegExp>
    <expression noclean="1"></expression>
  </RegExp>
</GetSettings>
<!--
  NfoUrl: derives a movie page URL from the input in $$1 (presumably the
  contents of an .nfo file; confirm against the scraper framework).
  Result is built in buffer 3: the first RegExp overwrites it, the two IMDb
  RegExps use dest="3+".
  The <url> markup in the output attributes is entity-escaped so this file is
  well-formed XML. The query separator is written as &amp;amp; so that the
  decoded output still contains the entity &amp;amp; decoded once, i.e. the
  generated <url> fragment itself stays valid XML.
-->
<NfoUrl dest="3">
  <!-- Direct Rotten Tomatoes movie link for the configured locality; emitted as a bare URL. -->
  <RegExp input="$$1" output="\1" dest="3">
    <expression noclean="1">(http://$INFO[locality]\.rottentomatoes\.com/m/[A-Za-z0-9_]*)</expression>
  </RegExp>
  <!-- IMDb link of the form imdb.com/Title?NNNN: redirect through the alias lookup using the numeric id. -->
  <RegExp input="$$1" output="&lt;url&gt;http://$INFO[locality].rottentomatoes.com/alias?type=imdbid&amp;amp;s=\2&lt;/url&gt;" dest="3+">
    <expression>(imdb.com/)Title\?([0-9]+)</expression>
  </RegExp>
  <!-- IMDb link of the form imdb.com/title/ttNNNN: same alias lookup, id taken without the tt prefix. -->
  <RegExp input="$$1" output="&lt;url&gt;http://$INFO[locality].rottentomatoes.com/alias?type=imdbid&amp;amp;s=\2&lt;/url&gt;" dest="3+">
    <expression>(imdb.com/title/tt)([0-9]*)</expression>
  </RegExp>
</NfoUrl>
<!--
  CreateSearchUrl: builds the full-text search URL on the configured
  locality's Rotten Tomatoes host. The empty expression passes the whole of
  $$1 through as \1 (presumably the already-encoded search title; confirm
  against the scraper framework). The result is stored in buffer 3.
-->
<CreateSearchUrl dest="3">
  <RegExp input="$$1" output="http://$INFO[locality].rottentomatoes.com/search/full_search.php?search=\1" dest="3">
    <expression noclean="1"></expression>
  </RegExp>
</CreateSearchUrl>
<!--
  GetSearchResults: turns the search result page in $$1 into a <results>
  document stored in buffer 8.
  The nested RegExp writes one <entity> per matching movie link into buffer 5;
  the outer RegExp wraps buffer 5 in the XML declaration and <results>.
  Markup inside the output attributes and the expression text is
  entity-escaped so this file is well-formed XML; decoded values are unchanged.
-->
<GetSearchResults dest="8">
  <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="8">
    <!-- \1 = movie slug from the /m/ link, \2 = link text (title), \3 = first four-digit number after it (used as the year). -->
    <RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\2 (\3)&lt;/title&gt;&lt;url&gt;http://$INFO[locality].rottentomatoes.com/m/\1&lt;/url&gt;&lt;/entity&gt;" dest="5">
      <expression repeat="yes">&lt;a href="/m/([^"]*)"&gt;([^&lt;]*).*?([0-9]{4})</expression>
    </RegExp>
    <expression noclean="1"></expression>
  </RegExp>
</GetSearchResults>
<!--
  GetDetails: assembles the <details> document for one movie from the page
  in $$1 and stores it in buffer 3.
  Buffers used in this function:
    6      <title> element (also reused as the source of search words)
    7      scratch: isolated page section (director / screenwriter / cast)
    8      accumulated detail elements, wrapped in <details> at the end
    9      <year> element
    10     selected rate type label followed by the ratings section
    4, 12  search terms for the IMDb lookup URLs (thumbs / fanart)
  Markup inside the output attributes and the expression text is
  entity-escaped so this file is well-formed XML; the decoded regular
  expressions and output strings are unchanged.
-->
<GetDetails dest="3">
  <RegExp input="$$8" output="&lt;details&gt;\1&lt;/details&gt;" dest="3">
    <!-- Title: captured into buffer 6 first, then copied into buffer 8 (overwriting it). -->
    <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="6">
      <expression trim="1" noclean="1">&lt;span property="v:name"&gt;([^&lt;]*)&lt;/span&gt; (\([0-9]{4})\)&lt;/h1&gt;</expression>
    </RegExp>
    <RegExp input="$$6" output="\1" dest="8">
      <expression noclean="1"></expression>
    </RegExp>
    <!-- Year: four digits in parentheses at the end of the title heading. -->
    <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="9">
      <expression noclean="1">&lt;h1.class="movie_title clearfix"&gt;[\S\s]*\(([0-9]{4})\)&lt;/h1&gt;[\S\s]*dialog_content clearfix</expression>
    </RegExp>
    <RegExp input="$$9" output="\1" dest="8+">
      <expression noclean="1"></expression>
    </RegExp>
    <!-- Director: the nested RegExp isolates the crew section into buffer 7, then each link text becomes a <director>. -->
    <RegExp input="$$7" output="&lt;director&gt;\1&lt;/director&gt;" dest="8+">
      <RegExp input="$$1" output="\1" dest="7">
        <expression noclean="1">&lt;p class="movie_crew_shortened[\S\s]*Director:([\S\s]*)movie_crew_all</expression>
      </RegExp>
      <expression repeat="yes" noclean="1">&lt;a.href="[^&gt;]*&gt;([A-Za-z ]*)</expression>
    </RegExp>
    <!-- MPAA / Classification: exactly one of the two variants runs, selected by the classreason setting. -->
    <RegExp conditional="!classreason" input="$$1" output="&lt;mpaa&gt;\1&lt;/mpaa&gt;" dest="8+">
      <expression>&lt;div id="movie_stats"&gt;[\S\s]*&lt;span class="content"&gt;([^&lt;]*)[\S\s]*\[See.Full.Rating\]</expression>
    </RegExp>
    <!-- With classreason enabled, \2 appends the text of the hidden movie_rating_reason element. -->
    <RegExp conditional="classreason" input="$$1" output="&lt;mpaa&gt;\1 \2&lt;/mpaa&gt;" dest="8+">
      <expression>&lt;div id="movie_stats"&gt;[\S\s]*&lt;span class="content"&gt;([^&lt;]*)[\S\s]*\[See.Full.Rating\][\S\s]*movie_rating_reason".style="display:.none"&gt;([^&lt;]*)</expression>
    </RegExp>
    <!-- Runtime -->
    <RegExp input="$$1" output="&lt;runtime&gt;\1&lt;/runtime&gt;" dest="8+">
      <expression>property="v:runtime" content="([^"]*)"</expression>
    </RegExp>
    <!-- Studio -->
    <RegExp input="$$1" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="8+">
      <expression>&lt;span class="label"&gt;Studio:&lt;/span&gt;([^&lt;]*)</expression>
    </RegExp>
    <!-- Credits: buffer 7 is overwritten with the screenwriter section (text up to the next colon), then one <credits> per link. -->
    <RegExp input="$$7" output="&lt;credits&gt;\1&lt;/credits&gt;" dest="8+">
      <RegExp input="$$1" output="\1" dest="7">
        <expression noclean="1">class="label"&gt;Screenwriter:&lt;/span&gt;([^:]*)</expression>
      </RegExp>
      <expression noclean="1" repeat="yes">&lt;a.href="[^&gt;]*&gt;([^&lt;]*)</expression>
    </RegExp>
    <!--
      Rating: buffer 10 is the ratetype setting value followed by the page
      section from the title heading to the tomatometer bar. Each of the
      three patterns below starts with one of the ratetype labels; the
      intent appears to be that only the pattern for the selected label matches.
    -->
    <RegExp input="$$1" output="$INFO[ratetype]\1" dest="10">
      <expression noclean="1">(&lt;h1 class="movie_title clearfix"&gt;[\S\s]*&lt;div id="tomatometer_bar"&gt;)</expression>
    </RegExp>
    <RegExp input="$$10" output="&lt;rating max=&quot;100&quot;&gt;\1&lt;/rating&gt;" dest="8+">
      <expression>Overall[\S\s]*&lt;li class="ui-tabs-selected"&gt;&lt;a title="([0-9]{2,3})</expression>
    </RegExp>
    <RegExp input="$$10" output="&lt;rating max=&quot;100&quot;&gt;\1&lt;/rating&gt;" dest="8+">
      <expression>Top Critics[\S\s]*&lt;a title="(\d{1,3})%" href="/m/[^/]*/\?critic=creamcrop"&gt;</expression>
    </RegExp>
    <RegExp input="$$10" output="&lt;rating max=&quot;100&quot;&gt;\1&lt;/rating&gt;" dest="8+">
      <expression>RT Community[\S\s]*&lt;a title="(\d{1,3})%" href="reviews_users.php"&gt;</expression>
    </RegExp>
    <!-- Votes -->
    <RegExp input="$$1" output="&lt;votes&gt;\1&lt;/votes&gt;" dest="8+">
      <expression>&lt;p&gt;Reviews Counted:&lt;span&gt;([^&lt;]*)</expression>
    </RegExp>
    <!-- Genre: no repeat attribute, so only the first genre link is captured. -->
    <RegExp input="$$1" output="&lt;genre&gt;\1&lt;/genre&gt;" dest="8+">
      <expression noclean="1">&lt;span.class="label"&gt;Genre:&lt;/span&gt;.&lt;span class="content"&gt;&lt;a.href="/movie/browser.php\?genre=[0-9]*"&gt;([^&lt;]*)</expression>
    </RegExp>
    <!-- Actors: buffer 7 is overwritten with the cast section; one <actor> per link, role left empty. -->
    <RegExp input="$$7" output="&lt;actor&gt;&lt;name&gt;\1&lt;/name&gt;&lt;role&gt;&lt;/role&gt;&lt;/actor&gt;" dest="8+">
      <RegExp input="$$1" output="\1" dest="7">
        <expression noclean="1">&lt;span class="label"&gt;Starring:([\S\s]*)&lt;p class="movie_cast_all"</expression>
      </RegExp>
      <expression repeat="yes" noclean="1">&lt;a.href="[^&gt;]*&gt;([A-Za-z ]*)</expression>
    </RegExp>
    <!-- Outline: the critics consensus line, up to the first newline or tab. -->
    <RegExp input="$$1" output="&lt;outline&gt;\1&lt;/outline&gt;" dest="8+">
      <expression>&lt;p id="consensus"&gt;&lt;span&gt;Consensus:[^&gt;]*&gt;([^\n\r\t]*)</expression>
    </RegExp>
    <!-- Plot: the full (hidden) synopsis block. -->
    <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="8+">
      <expression>&lt;span id="movie_synopsis_all" style="display: none;"&gt;([\S\s]*)&lt;a href="#" id="movie_synopsis_link</expression>
    </RegExp>
    <!-- Search words: every run of characters in buffer 6 that is neither space nor comma is appended to buffer 12 with a leading +. -->
    <RegExp input="$$6" output="+\1" dest="12+">
      <expression repeat="yes">([^ ,]+)</expression>
    </RegExp>
    <!--
      Thumbs: emits a chained <url> that runs GetTMDBThumbsById (not defined
      in this file; presumably provided by the included common/tmdb.xml) on a
      Google site:imdb.com search built from buffer 12.
      The nested RegExps append a quoted IMDb id found in the page (if any)
      to buffer 4 and then its words to buffer 12. The expression has a single
      group, so \2 in the nested output is always empty.
    -->
    <RegExp conditional="thumbs" input="$$12" output="&lt;url cache=&quot;rottentomatoes_temp.xml&quot; function=&quot;GetTMDBThumbsById&quot;&gt;http://www.google.com/search?q=site:imdb.com\1&lt;/url&gt;" dest="8+">
      <RegExp input="$$1" output="&quot;\1&quot;+\2" dest="4+">
        <expression>www\.imdb\.com/title/(tt[0-9]*)/\s</expression>
      </RegExp>
      <RegExp input="$$4" output="+\1" dest="12+">
        <expression repeat="yes">([^ ,]+)</expression>
      </RegExp>
      <expression></expression>
    </RegExp>
    <!--
      Fanart: same construction as the thumbs lookup, calling
      GetTMDBFanartById. NOTE(review): the nested RegExps append to buffers 4
      and 12 again, so the fanart query may repeat terms already added by the
      thumbs block; left as-is to preserve behaviour.
    -->
    <RegExp conditional="fanart" input="$$12" output="&lt;url cache=&quot;rottentomatoes_temp.xml&quot; function=&quot;GetTMDBFanartById&quot;&gt;http://www.google.com/search?q=site:imdb.com\1&lt;/url&gt;" dest="8+">
      <RegExp input="$$1" output="&quot;\1&quot;+\2" dest="4+">
        <expression>www\.imdb\.com/title/(tt[0-9]*)/\s</expression>
      </RegExp>
      <RegExp input="$$4" output="+\1" dest="12+">
        <expression repeat="yes">([^ ,]+)</expression>
      </RegExp>
      <expression></expression>
    </RegExp>
    <expression noclean="1"></expression>
  </RegExp>
</GetDetails>
</scraper>
|