blob: 973e0e23f23aeb3fd01dcd5bd19663c8aa699d5c (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
|
<?xml version="1.0" encoding="UTF-8"?>
<scraper framework="1.1" date="2009-12-11" name="M1905" content="movies" thumb="M1905.jpg" language="zh">
<GetSettings dest="3">
  <!--
    Builds the scraper's settings document in buffer 3.
    The inner RegExp writes one boolean setting (id "fanart", label
    "Enable Fanart", default true) to dest 5+; the outer RegExp then wraps
    the content of buffer 5 in a <settings> element.
    Markup inside the output attributes is entity-escaped so that this file
    itself remains well-formed XML.
  -->
  <RegExp input="$$5" output="&lt;settings&gt;\1&lt;/settings&gt;" dest="3">
    <RegExp input="$$1" output="&lt;setting label=&quot;Enable Fanart&quot; type=&quot;bool&quot; id=&quot;fanart&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
      <expression/>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetSettings>
<NfoUrl dest="3">
  <!--
    Looks in buffer 1 for a film page address of the form
    http://www.m1905.com/film/<digits>.shtml and, when found, emits it
    wrapped in a <url> element to buffer 3.
    The output markup is entity-escaped to keep this file well-formed.
  -->
  <RegExp input="$$1" output="&lt;url&gt;\1&lt;/url&gt;" dest="3">
    <expression clear="yes" noclean="1">(http://www.m1905.com/film/[0-9]*\.shtml)</expression>
  </RegExp>
</NfoUrl>
<CreateSearchUrl dest="3" SearchStringEncoding="UTF-8">
  <!--
    Builds the film search URL on www.m1905.com from the content of buffer 1
    and emits it as a <url> element to buffer 3.
    The ampersand in the query string is written as &amp;amp; so that, once
    this file has been parsed, the emitted <url> fragment still carries an
    escaped ampersand (presumably that fragment is parsed as XML again by
    the consumer; confirm against the scraper framework).
  -->
  <RegExp input="$$1" output="&lt;url&gt;http://www.m1905.com/search/?type=film&amp;amp;q=\1&lt;/url&gt;" dest="3">
    <expression noclean="1"/>
  </RegExp>
</CreateSearchUrl>
<GetSearchResults dest="8">
  <!--
    Turns the search result page in buffer 1 into a <results> document in
    buffer 8.
    Inner RegExp (repeated): for every result link it captures
      \1 = numeric film id, \2 = title between the Chinese title marks,
      \3 = text of the following "blue14" link,
    and writes one <entity> (title "\2 - \3", film page url, id) to dest 5+.
    Outer RegExp: wraps buffer 5 in an XML prolog and a <results> element.
    The literal dot before "shtml" is escaped, matching the NfoUrl pattern.
    NOTE(review): the emitted prolog declares iso-8859-1 although the
    captured titles are Chinese text; confirm how the consumer uses this
    declaration before changing it.
  -->
  <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="8">
    <RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\2 - \3&lt;/title&gt;&lt;url&gt;http://www.m1905.com/film/\1.shtml&lt;/url&gt;&lt;id&gt;\1&lt;/id&gt;&lt;/entity&gt;" dest="5+">
      <expression repeat="yes" noclean="1">&lt;a href="film/([0-9]*?)\.shtml" target="_blank" class="red14link"&gt;《(.*?)》&lt;/a&gt;.*?class="blue14"&gt;(.*?)&lt;/a&gt;</expression>
    </RegExp>
    <expression clear="yes" noclean="1"/>
  </RegExp>
</GetSearchResults>
<GetDetails dest="3">
  <!--
    Builds the <details> document for one film in buffer 3.
    Buffer 1 is the film page and buffer 2 supplies the film id used in the
    follow-up URLs. Each inner RegExp writes one fragment into buffer 5
    (the first with dest 5, the rest with dest 5+); the outer RegExp wraps
    buffer 5 in <details>.
    All markup in output attributes and expression text is entity-escaped so
    this file stays well-formed XML.
  -->
  <RegExp input="$$5" output="&lt;details&gt;\1&lt;/details&gt;" dest="3">
    <!-- Film id, copied from buffer 2. -->
    <RegExp input="$$2" output="&lt;id&gt;\1&lt;/id&gt;" dest="5">
      <expression/>
    </RegExp>
    <!-- Title: text between the Chinese title marks in the headline span. -->
    <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="5+">
      <expression trim="1" noclean="1">&lt;span style="font-size:25px; color:#505050; font-weight:bold;"&gt;《(.*?)》&lt;/span&gt;</expression>
    </RegExp>
    <!-- Year: leading digits after the release-date label. -->
    <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="5+">
      <expression>上映日期:&lt;span class="blue12font" style="color: #505050"&gt;([0-9]*)</expression>
    </RegExp>
    <!-- Runtime: span text after the running-time label. -->
    <RegExp input="$$1" output="&lt;runtime&gt;\1&lt;/runtime&gt;" dest="5+">
      <expression trim="1">片长:&lt;span class="blue12font" style="color: #505050"&gt;([^&lt;]*)&lt;</expression>
    </RegExp>
    <!-- Follow-up request handled by GetRating. -->
    <RegExp input="$$2" output="&lt;url cache=&quot;$$2-rating.html&quot; function=&quot;GetRating&quot;&gt;http://www.m1905.com/list.php?catid=157&amp;amp;movieid=$$2&amp;amp;mydo=ajax&amp;amp;action_ajax=show&amp;amp;&lt;/url&gt;" dest="5+">
      <expression/>
    </RegExp>
    <!-- Genres: the span text after the type label is staged in buffer 6,
         then split on spaces into one <genre> per token. -->
    <RegExp input="$$1" output="\1" dest="6">
      <expression clear="yes" noclean="1">类型:&lt;span class="blue12font" style="color: #505050"&gt;([^&lt;]*)&lt;</expression>
    </RegExp>
    <RegExp input="$$6" output="&lt;genre&gt;\1&lt;/genre&gt;" dest="5+">
      <expression repeat="yes">([^ ]*) </expression>
    </RegExp>
    <!-- Studio: span text after the distribution-company label. -->
    <RegExp input="$$1" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="5+">
      <expression>发行公司:&lt;span class="blue12font" style="color: #505050"&gt;([^&lt;]*)&lt;</expression>
    </RegExp>
    <!-- Short synopsis from the film page, used for both outline and plot. -->
    <RegExp input="$$1" output="&lt;outline&gt;\1&lt;/outline&gt;&lt;plot&gt;\1&lt;/plot&gt;" dest="5+">
      <expression>剧情简介 &lt;/li&gt;.*?class="hui5012font"&gt;(.*?)\n</expression>
    </RegExp>
    <!-- Follow-up requests handled by GetPlot, GetFullcredits and
         GetM1905Poster. -->
    <RegExp input="$$2" output="&lt;url cache=&quot;$$2-plot.html&quot; function=&quot;GetPlot&quot;&gt;http://www.m1905.com/list.php?catid=105&amp;amp;contentid=$$2&lt;/url&gt;" dest="5+">
      <expression/>
    </RegExp>
    <RegExp input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetFullcredits&quot;&gt;http://www.m1905.com/list.php?catid=109&amp;amp;contentid=$$2&lt;/url&gt;" dest="5+">
      <expression/>
    </RegExp>
    <RegExp input="$$2" output="&lt;url cache=&quot;$$2-posters.html&quot; function=&quot;GetM1905Poster&quot;&gt;http://www.m1905.com/list.php?catid=127&amp;amp;contentid=$$2&lt;/url&gt;" dest="5+">
      <expression/>
    </RegExp>
    <!-- Fanart request, conditional on the "fanart" setting declared in
         GetSettings. -->
    <RegExp conditional="fanart" input="$$2" output="&lt;url cache=&quot;$$2-fanart.html&quot; function=&quot;GetM1905Fanart&quot;&gt;http://www.m1905.com/list.php?catid=119&amp;amp;contentid=$$2&lt;/url&gt;" dest="5+">
      <expression/>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetDetails>
<GetRating clearbuffers="no" dest="5">
  <!--
    Parses the rating response in buffer 1, which is matched as
    "<digits>|<digits>|". The first number is emitted as <votes> and the
    second as <rating>; the pair is staged in buffer 2 and then wrapped in
    <details> in buffer 5.
    The output markup is entity-escaped to keep this file well-formed.
  -->
  <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
    <RegExp input="$$1" output="&lt;rating&gt;\2&lt;/rating&gt;&lt;votes&gt;\1&lt;/votes&gt;" dest="2">
      <expression clear="yes">([0-9]*)\|([0-9]*)\|</expression>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetRating>
<GetPlot dest="5">
  <!--
    Extracts the full plot text from the plot page in buffer 1: the content
    of the div with id "gut_center_center_down" is emitted as <plot> into
    buffer 2, then wrapped in <details> in buffer 5.
    Markup in the output attributes and in the expression is entity-escaped
    to keep this file well-formed.
  -->
  <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
    <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="2">
      <expression clear="yes">&lt;div id="gut_center_center_down" class="hui34343412font"&gt;(.*?)&lt;/div&gt;</expression>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetPlot>
<GetFullcredits dest="5">
  <!--
    Extracts cast and crew from the credits page in buffer 1 and emits them
    inside <details> in buffer 5. Fragments are collected in buffer 2.
    Buffers 6, 8 and 9 stage the actor, director and writer sections.
    Markup in output attributes and expression text is entity-escaped to
    keep this file well-formed.
  -->
  <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
    <!-- Actor section: one <actor> per list item, with empty thumb and
         role. -->
    <RegExp input="$$1" output="\1" dest="6">
      <expression clear="yes" noclean="1">演员 Actor:.*?class="hui5012font"&gt;(.*?)&lt;/div&gt;</expression>
    </RegExp>
    <RegExp input="$$6" output="&lt;actor&gt;&lt;thumb&gt;&lt;/thumb&gt;&lt;name&gt;\1&lt;/name&gt;&lt;role&gt;&lt;/role&gt;&lt;/actor&gt;" dest="2">
      <expression clear="yes" repeat="yes" trim="1">margin-left:10px;"&gt;(.*?)&lt;/li&gt;</expression>
    </RegExp>
    <!-- Director section: repeat is "no", so only the first list item is
         used. -->
    <RegExp input="$$1" output="\1" dest="8">
      <expression clear="yes" noclean="1">导演 Director:(.*?)&lt;/ul&gt;</expression>
    </RegExp>
    <RegExp input="$$8" output="&lt;director&gt;\1&lt;/director&gt;" dest="2+">
      <expression repeat="no" trim="1">&lt;li&gt;([^&lt;]*)&lt;</expression>
    </RegExp>
    <!-- Writer section: repeat is "no", so only the first list item is
         used. -->
    <RegExp input="$$1" output="\1" dest="9">
      <expression clear="yes" noclean="1">编剧 Writer:(.*?)&lt;/ul&gt;</expression>
    </RegExp>
    <RegExp input="$$9" output="&lt;credits&gt;\1&lt;/credits&gt;" dest="2+">
      <expression repeat="no" trim="1">&lt;li&gt;([^&lt;]*)&lt;</expression>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetFullcredits>
<GetM1905Poster dest="5">
  <!--
    Extracts poster images from the poster page in buffer 1.
    The section between the page's "middle content start" and "middle
    content end" markers is staged in buffer 6. Every thumbnail path in it
    is then rewritten by dropping the "thumb_<n>_<n>_" file name prefix and
    emitted as an absolute <thumb> URL into buffer 2, which is finally
    wrapped in <details> in buffer 5.
    The output markup is entity-escaped to keep this file well-formed.
  -->
  <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
    <RegExp input="$$1" output="\1" dest="6">
      <expression clear="yes" noclean="1">--中间内容开始--(.*?)--中间内容结束--</expression>
    </RegExp>
    <RegExp input="$$6" output="&lt;thumb&gt;http://www.m1905.com/\1\2&lt;/thumb&gt;" dest="2">
      <expression repeat="yes" noclean="1">(uploadfile/[0-9]+/[0-9]+/)thumb_[0-9]+_[0-9]+_([0-9]+\.jpg)</expression>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetM1905Poster>
<GetM1905Fanart dest="5">
  <!--
    Extracts still images from the stills page in buffer 1 as fanart.
    For every still link the inner RegExp captures
      \1 = upload directory, \2 = "thumb_<n>_<n>_" prefix, \3 = file name,
    and writes a <thumb> whose preview attribute is the thumbnail path
    (\1\2\3) and whose content is the path without the prefix (\1\3) into
    buffer 11. The outer RegExp wraps buffer 11 in a <fanart> element with
    base url http://www.m1905.com/ inside <details> in buffer 5.
    Markup and nested quotes in the output attributes and the expression are
    entity-escaped to keep this file well-formed.
  -->
  <RegExp input="$$11" output="&lt;details&gt;&lt;fanart url=&quot;http://www.m1905.com/&quot;&gt;\1&lt;/fanart&gt;&lt;/details&gt;" dest="5">
    <RegExp input="$$1" output="&lt;thumb preview=&quot;\1\2\3&quot;&gt;\1\3&lt;/thumb&gt;" dest="11">
      <expression clear="yes" repeat="yes" noclean="1,2,3">&lt;a href="film/photo/still/[^&lt;]*&lt;img src="(uploadfile/[0-9]+/[0-9]+/)(thumb_[0-9]+_[0-9]+_)([0-9]+\.jpg)</expression>
    </RegExp>
    <expression noclean="1"/>
  </RegExp>
</GetM1905Fanart>
</scraper>
|