merged: Linuxport revisions through to r15292.
[xbmc:xbmc-antiquated.git] / system / scrapers / video / imdb.xml
1 <?xml version="1.0" encoding="UTF-8"?>
2 <scraper name="IMDb" content="movies" thumb="imdb.gif">
3         <GetSettings dest="3">
4                 <RegExp input="$$5" output="&lt;settings&gt;\1&lt;/settings&gt;" dest="3">
5                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable Full Cast Credits&quot; type=&quot;bool&quot; id=&quot;fullcredits&quot; default=&quot;false&quot;&gt;&lt;/setting&gt;" dest="5">
6                                 <expression></expression>
7                         </RegExp>
8                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable IMPAwards&quot; type=&quot;bool&quot; id=&quot;impawards&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
9                                 <expression></expression>
10                         </RegExp>
11                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable MoviePosterDB&quot; type=&quot;bool&quot; id=&quot;movieposterdb&quot; default=&quot;false&quot;&gt;&lt;/setting&gt;" dest="5+">
12                                 <expression></expression>
13                         </RegExp>
14                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable Trailer&quot; type=&quot;bool&quot; id=&quot;trailer&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
15                                 <expression></expression>
16                         </RegExp>
17                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable Fanart&quot; type=&quot;bool&quot; id=&quot;fanart&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
18                                 <expression></expression>
19                         </RegExp>
20                         <RegExp input="$$1" output="&lt;setting label=&quot;IMDB Poster &amp;amp; Actor Thumb(s) Size&quot; type=&quot;labelenum&quot; values=&quot;192|256|384|512|1024&quot; id=&quot;imdbscale&quot; default=&quot;512&quot;&gt;&lt;/setting&gt;" dest="5+">
21                                 <expression></expression>
22                         </RegExp>
23                         <RegExp input="$$1" output="&lt;setting type=&quot;sep&quot;&gt;&lt;/setting&gt;" dest="5+">
24                                 <expression></expression>
25                         </RegExp>
26                         <RegExp input="$$1" output="&lt;setting label=&quot;Input Alternative IMDb Source&quot; type=&quot;text&quot; id=&quot;url&quot; default=&quot;akas.imdb.com&quot;&gt;&lt;/setting&gt;" dest="5+">
27                                 <expression></expression>
28                         </RegExp>
29                         <expression noclean="1"></expression>
30                 </RegExp>
31         </GetSettings>
32         <NfoUrl dest="3">
33     <RegExp input="$$1" output="&lt;url&gt;http://www.\1/title/tt\2/&lt;/url&gt;&lt;id&gt;tt\2&lt;/id&gt;"  dest="3">
34                         <expression clear="yes" noclean="1">(imdb.com/)Title\?([0-9]*)</expression>
35                 </RegExp>
36     <RegExp input="$$1" output="&lt;url&gt;http://www.\1\2/&lt;/url&gt;&lt;id&gt;tt\2&lt;/id&gt;"  dest="3+">
37                         <expression clear="yes" noclean="1">(imdb.com/title/tt)([0-9]*)</expression>
38                 </RegExp>
39         </NfoUrl>
40         <CreateSearchUrl dest="3">
41                 <RegExp input="$$1" output="&lt;url&gt;http://$INFO[url]/find?s=tt;q=\1&lt;/url&gt;" dest="3">
42                         <expression noclean="1"></expression>
43                 </RegExp>
44         </CreateSearchUrl>
45         <GetSearchResults dest="8">
46                 <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="8">
47                         <RegExp input="$$1" output="\1" dest="7">
48                                 <expression clear="yes">/title/([t0-9]*)/faq</expression>
49                         </RegExp>
50                         <RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\1 (\2)&lt;/title&gt;&lt;url&gt;http://$INFO[url]/title/$$7/&lt;/url&gt;&lt;id&gt;$$7&lt;/id&gt;&lt;/entity&gt;" dest="5">
51                                 <expression clear="yes" noclean="1">&lt;meta name=&quot;title&quot; content=&quot;([^&quot;]*) \(([0-9]*)\)</expression>
52                         </RegExp>
53                         <RegExp input="$$1" output="\1" dest="4">
54                                 <expression noclean="1">(&gt;&lt;a href=&quot;/title.*)</expression>
55                         </RegExp>
56                         <RegExp input="$$4" output="&lt;entity&gt;&lt;title&gt;\2 (\3)&lt;/title&gt;&lt;url&gt;http://$INFO[url]/title/\1/&lt;/url&gt;&lt;id&gt;\1&lt;/id&gt;&lt;/entity&gt;" dest="5+">
57                                 <expression repeat="yes" noclean="1,2">&gt;&lt;a href=&quot;/title/([t0-9]*)/[^&gt;]*&gt;([^&lt;]*)&lt;/a&gt; *\(([0-9]*)</expression>
58                         </RegExp>
59                         <expression clear="yes" noclean="1"></expression>
60                 </RegExp>
61         </GetSearchResults>
62         <GetDetails clearbuffers="no" dest="3">
63                 <RegExp input="$$5" output="&lt;details&gt;\1&lt;/details&gt;" dest="3">
64                         <RegExp input="$$2" output="&lt;id&gt;\1&lt;/id&gt;" dest="5">
65                                 <expression></expression>
66                         </RegExp>
67                         <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="5+">
68                                 <expression trim="1" noclean="1">&lt;title&gt;([^&lt;|^(]*)</expression>
69                         </RegExp>
70                         <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="5+">
71                                 <expression>a href=&quot;/Sections/Years/([0-9]*)</expression>
72                         </RegExp>
73                         <RegExp input="$$1" output="&lt;top250&gt;\1&lt;/top250&gt;" dest="5+">
74                                 <expression>Top 250: #([0-9]*)&lt;/a&gt;</expression>
75                         </RegExp>
76                         <RegExp input="$$1" output="&lt;mpaa&gt;\1&lt;/mpaa&gt;" dest="5+">
77                                 <expression>MPAA&lt;/a&gt;:&lt;/h5&gt;(.[^&lt;]*)</expression>
78                         </RegExp>
79                         <RegExp input="$$1" output="&lt;certification&gt;\1 \3&lt;/certification&gt;" dest="5+">
80                                 <expression repeat="yes">&lt;a href=&quot;/List\?certificates=[^&quot;]*&quot;&gt;([^&lt;]*)&lt;/a&gt;[^&lt;]*(&lt;i&gt;([^&lt;]*)&lt;/i&gt;)?</expression>
81                         </RegExp>
82                         <RegExp input="$$1" output="&lt;tagline&gt;\1&lt;/tagline&gt;" dest="5+">
83                                 <expression>&lt;h5&gt;Tagline:&lt;/h5&gt;([^&lt;]*)</expression>
84                         </RegExp>
85                         <RegExp input="$$1" output="&lt;runtime&gt;\1&lt;/runtime&gt;" dest="5+">
86                                 <expression trim="1">&lt;h5&gt;Runtime:&lt;/h5&gt;[^0-9]*([^&lt;]*)</expression>
87                         </RegExp>
88                         <RegExp input="$$1" output="&lt;rating&gt;\1&lt;/rating&gt;&lt;votes&gt;\2&lt;/votes&gt;" dest="5+">
89                                 <expression>&lt;b&gt;User Rating:&lt;/b&gt;[^&lt;]*&lt;b&gt;([0-9.]+)/10&lt;/b&gt;[^&lt;]*&lt;small&gt;\(&lt;a href=&quot;ratings&quot;&gt;([0-9,]+) votes&lt;/a&gt;\)&lt;/small&gt;</expression>
90                         </RegExp>
91                         <RegExp input="$$1" output="&lt;genre&gt;\1&lt;/genre&gt;" dest="5+">
92                                 <expression repeat="yes">&quot;/Sections/Genres/[^/]*/&quot;&gt;([^&lt;]*)&lt;/a&gt;</expression>
93                         </RegExp>
94                         <RegExp input="$$1" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="5+">
95                                 <expression repeat="yes">&quot;/company/[^/]*/&quot;&gt;([^&lt;]*)&lt;/a&gt;</expression>
96                         </RegExp>
97                         <RegExp input="$$1" output="&lt;outline&gt;\1&lt;/outline&gt;&lt;plot&gt;\1&lt;/plot&gt;" dest="5+">
98                                 <expression>Plot:&lt;/h5&gt;\W([^[&lt;||]*) </expression>
99                         </RegExp>
100                         <RegExp input="$$2" output="&lt;url function=&quot;GetMoviePlot&quot;&gt;$$3plotsummary&lt;/url&gt;" dest="5+">
101                                 <expression></expression>
102                         </RegExp>
103                         <RegExp conditional="!fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-credits.html&quot; function=&quot;GetMovieCast&quot;&gt;$$3&lt;/url&gt;" dest="5+">
104                                 <expression></expression>
105                         </RegExp>
106                         <RegExp conditional="!fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-credits.html&quot; function=&quot;GetMovieDirectors&quot;&gt;$$3&lt;/url&gt;" dest="5+">
107                                 <expression></expression>
108                         </RegExp>
109                         <RegExp conditional="!fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-credits.html&quot; function=&quot;GetMovieWriters&quot;&gt;$$3&lt;/url&gt;" dest="5+">
110                                 <expression></expression>
111                         </RegExp>
112                         <RegExp conditional="fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetMovieCast&quot;&gt;$$3fullcredits&lt;/url&gt;" dest="5+">
113                                 <expression></expression>
114                         </RegExp>
115                         <RegExp conditional="fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetMovieDirectors&quot;&gt;$$3fullcredits&lt;/url&gt;" dest="5+">
116                                 <expression></expression>
117                         </RegExp>
118                         <RegExp conditional="fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetMovieWriters&quot;&gt;$$3fullcredits&lt;/url&gt;" dest="5+">
119                                 <expression></expression>
120                         </RegExp>
121                         <RegExp conditional="impawards" input="$$2" output="&lt;url cache=&quot;$$2-posters.html&quot; function=&quot;GetIMPALink&quot;&gt;$$3posters&lt;/url&gt;" dest="5+">
122                                 <expression></expression>
123                         </RegExp>
124                         <RegExp conditional="movieposterdb" input="$$1" output="&lt;url function=&quot;GetMoviePosterDBLink&quot;&gt;http://www.movieposterdb.com/browse/search?title=\1&lt;/url&gt;" dest="5+">
125                                 <expression>/title/tt([t0-9]*)/faq</expression>
126                         </RegExp>
127                         <RegExp conditional="trailer" input="$$1" output="&lt;url function=&quot;GetTrailer&quot;&gt;http://$INFO[url]\1&lt;/url&gt;" dest="5+">
128                                 <expression>&lt;a href=&quot;([^&quot;]*(trailers-screenplay|videos-)[^&quot;]*)&quot;</expression>
129                         </RegExp>
130                         <RegExp input="$$2" output="&lt;url cache=&quot;$$2-posters.html&quot; function=&quot;GetIMDBPoster&quot;&gt;$$3posters&lt;/url&gt;" dest="5+">
131                                 <expression></expression>
132                         </RegExp>
133                         <RegExp conditional="fanart" input="$$2" output="&lt;url function=&quot;GetFanart&quot;&gt;http://www.moviebackdrops.com/tab_movie.php5?id=$$2&lt;/url&gt;" dest="5+">
134                                 <expression></expression>
135                         </RegExp>
136                         <expression noclean="1"></expression>
137                 </RegExp>
138         </GetDetails>
139         <GetMoviePlot clearbuffers="no" dest="5">
140                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
141                         <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="2">
142                                 <expression clear="yes">&lt;p class="plotpar"&gt;\n([^\n]*)</expression>
143                         </RegExp>
144                         <expression noclean="1"></expression>
145                 </RegExp>
146         </GetMoviePlot>
147         <GetMovieCast clearbuffers="no" dest="5">
148                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
149                         <RegExp input="$$1" output="\1" dest="6">
150                                 <expression clear="yes" noclean="1">&lt;table class=&quot;cast&quot;&gt;(.*?)&lt;/table&gt;</expression>
151                         </RegExp>
152                         <RegExp input="$$6" output="&lt;actor&gt;&lt;thumb&gt;\1_SX$INFO[imdbscale]_SY$INFO[imdbscale]_\2&lt;/thumb&gt;&lt;name&gt;\3&lt;/name&gt;&lt;role&gt;\4&lt;/role&gt;&lt;/actor&gt;" dest="7">
153                                 <expression clear="yes" repeat="yes" noclean="1,2" trim="3,4">&lt;img src=&quot;(?:([^&quot;]*\.)[^&quot;]*(\.jpg))?[^&gt;]*[^&quot;]*&quot;nm&quot;&gt;&lt;a href=&quot;[^&quot;]*&quot;&gt;([^&lt;]*)&lt;[^&quot;]*&quot;ddd&quot;&gt; ... [^&quot;]*&quot;char&quot;&gt;(.*?)&lt;/td&gt;</expression>
154                         </RegExp>
155                         <RegExp input="$$7" output="&lt;actor&gt;&lt;thumb&gt;\1&lt;/thumb&gt;\2&lt;/actor&gt;" dest="2+">
156                                 <expression clear="yes" repeat="yes" noclean="1,2,3">&lt;actor&gt;&lt;thumb&gt;(?:(http.*?)|_SX[0-9]+_SY[0-9]+_)&lt;/thumb&gt;(.*?)&lt;/actor&gt;</expression>
157                         </RegExp>
158                         <expression noclean="1"></expression>
159                 </RegExp>
160         </GetMovieCast>
161         <GetMovieDirectors clearbuffers="no" dest="5">
162                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
163                         <RegExp conditional="!fullcredits" input="$$1" output="\1" dest="6">
164                                 <expression clear="yes" noclean="1">Director.*?&lt;/h5&gt;(.*?)&lt;/div&gt;</expression>
165                         </RegExp>
166                         <RegExp conditional="fullcredits" input="$$1" output="\1" dest="6">
167                                 <expression clear="yes" noclean="1">Directed by(.*?)name=&quot;</expression>
168                         </RegExp>
169                         <RegExp input="$$6" output="&lt;director&gt;\1&lt;/director&gt;" dest="2+">
170                                 <expression clear="yes" repeat="yes">&lt;a href=&quot;/name/[^&gt;]*&gt;([^&lt;]*)&lt;</expression>
171                         </RegExp>
172                         <expression noclean="1"></expression>
173                 </RegExp>
174         </GetMovieDirectors>
175         <GetMovieWriters clearbuffers="no" dest="5">
176                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
177                         <RegExp conditional="!fullcredits" input="$$1" output="\1" dest="6">
178                                 <expression clear="yes" noclean="1">Writers.*?:&lt;/h5&gt;(.*?)&lt;/div&gt;</expression>
179                         </RegExp>
180                         <RegExp conditional="fullcredits" input="$$1" output="\1" dest="6">
181                                 <expression clear="yes" noclean="1">Writing credits(.*?)name=&quot;</expression>
182                         </RegExp>
183                         <RegExp input="$$6" output="&lt;credits&gt;\1&lt;/credits&gt;" dest="2+">
184                                 <expression clear="yes" repeat="yes">&lt;a href=&quot;/name/[^&gt;]*&gt;([^&lt;]*)&lt;</expression>
185                         </RegExp>
186                         <expression noclean="1"></expression>
187                 </RegExp>
188         </GetMovieWriters>
189         <GetIMPALink clearbuffers="no" dest="5">
190                 <RegExp input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetIMPAPosters&quot;&gt;http://\1impawards.com/\2&lt;/url&gt;&lt;/details&gt;" dest="5">
191                         <expression clear="yes" noclean="1,2">http://([^&quot;]*)impawards.com/([^&quot;]*)&quot;&gt;</expression>
192                 </RegExp>
193         </GetIMPALink>
194         <GetIMPAPosters clearbuffers="no" dest="5">
195                 <RegExp input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetIMPAPosters&quot;&gt;http://www.impawards.com/\1&lt;/url&gt;&lt;/details&gt;" dest="5">
196                         <expression clear="yes">&lt;meta http-equiv=&quot;REFRESH&quot; content=&quot;0;URL=[^/]*/([^&quot;]*)&quot;&gt;</expression>
197                 </RegExp>
198                 <RegExp input="$$1" output="\1" dest="4">
199                         <expression clear="yes" noclean="1">value=&quot;/([^&quot;]*)/[^&quot;]*\.html&quot;&gt;</expression>
200                 </RegExp>
201                 <RegExp input="$$1" output="&lt;thumb&gt;http://www.impawards.com/$$4/posters/\1&lt;/thumb&gt;" dest="8+">
202                         <expression clear="yes" noclean="1">&lt;img SRC=&quot;posters/([^&quot;]*)&quot;</expression>
203                 </RegExp>
204                 <RegExp input="$$1" output="&lt;thumb&gt;http://www.impawards.com/$$4/posters/\1&lt;/thumb&gt;" dest="9+">
205                         <expression clear="yes" repeat="yes" noclean="1">thumbs/imp_([^&gt;]*ver[^&gt;]*.jpg)&gt;</expression>
206                 </RegExp>
207         </GetIMPAPosters>
208         <GetMoviePosterDBLink dest="6" clearbuffers="no">\r
209                 <RegExp input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetMoviePosterDB&quot;&gt;\1&lt;/url&gt;&lt;/details&gt;" dest="6">\r
210                         <expression>(http://www.movieposterdb.com/movie/[^&quot;]*)&quot;</expression>
211                 </RegExp>
212         </GetMoviePosterDBLink>\r
213         <GetMoviePosterDB clearbuffers="no" dest="12">
214                 <RegExp input="$$1" output="&lt;thumb&gt;\1o_\2&lt;/thumb&gt;" dest="10+">
215                         <expression clear="yes" repeat="yes" noclean="1,2">&quot;poster&quot;.*?src=&quot;(.*?)[a-z]_(.*?)&quot;</expression>
216                 </RegExp>
217         </GetMoviePosterDB>
218         <GetTrailer clearbuffers="no" dest="5">
219                 <RegExp conditional="trailer" input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetTrailerLink&quot;&gt;http://$INFO[url]\1player\2&lt;/url&gt;&lt;/details&gt;" dest="5">
220                         <expression noclean="1">videoSrc = &apos;[^&apos;]*(/video/[^/]*/[^/]*/)[^\?]*(\?bitrate=[0-9]*)?</expression>
221                 </RegExp>
222         </GetTrailer>
223         <GetTrailerLink clearbuffers="no" dest="5">
224                 <RegExp conditional="trailer" input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
225                         <RegExp conditional="trailer" input="$$1" output="&lt;trailer urlencoded=&quot;yes&quot;&gt;\1&lt;/trailer&gt;" dest="2">
226                                 <expression noclean="1">&quot;file&quot;[^&quot;]*&quot;([^&quot;]*)</expression>
227                         </RegExp>
228                         <expression noclean="1"></expression>
229                 </RegExp>
230         </GetTrailerLink>
231         <GetIMDBPoster dest="5">
232                 <RegExp input="$$8$$9$$10$$11" output="&lt;details&gt;&lt;thumbs&gt;\1&lt;/thumbs&gt;&lt;/details&gt;" dest="5">
233                         <RegExp input="$$1" output="\1_SX$INFO[imdbscale]_SY$INFO[imdbscale]_\2" dest="6">
234                                 <expression noclean="1,2">&lt;a name=&quot;poster&quot;.*?src=&quot;(.*?)_S.*?(.jpg)&quot;.*?&lt;/a&gt;</expression>
235                         </RegExp>
236                         <RegExp input="$$6" output="&lt;thumb&gt;\1&lt;/thumb&gt;" dest="11">
237                                 <expression clear="yes" noclean="1">(.*?_SX[0-9]+_SY[0-9]+_.jpg)</expression>
238                         </RegExp>
239                         <expression noclean="1"></expression>
240                 </RegExp>
241         </GetIMDBPoster>
242         <GetFanart dest="5">
243                 <RegExp input="$$2" output="&lt;details&gt;&lt;fanart url=&quot;http://www.moviebackdrops.com/&quot;>\1&lt;/fanart&gt;&lt;/details&gt;" dest="5">
244                         <RegExp input="$$1" output="&lt;thumb&gt;\1&lt;/thumb&gt;" dest="2">
245                                 <expression repeat="yes">a href=&quot;(/backdrops/[^&quot;]+)&quot;</expression>
246                         </RegExp>
247                         <expression noclean="1">(.+)</expression>
248                 </RegExp>
249         </GetFanart>
250 </scraper>