Merged from linuxport rev21200:21590. Updated.
[xbmc:xbmc-antiquated.git] / XBMC / system / scrapers / video / imdb.xml
1 <?xml version="1.0" encoding="UTF-8"?>
2 <scraper framework="1.0" date="2009-07-02" name="IMDb" content="movies" thumb="imdb.png" language="en">
3         <GetSettings dest="3">
                  <!-- Declares the scraper's user settings. Each nested rule contributes one escaped <setting> element to buffer 5 (first dest="5", then dest="5+", assumed to be the framework's append form); the outer rule wraps buffer 5 in <settings>...</settings> and stores the result in buffer 3, the dest of this function. -->
4                 <RegExp input="$$5" output="&lt;settings&gt;\1&lt;/settings&gt;" dest="3">
                          <!-- Boolean switches. Their ids (fullcredits, impawards, movieposterdb, trailer, fanart) are the names tested by conditional="..." attributes elsewhere in this file. -->
5                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable Full Cast Credits&quot; type=&quot;bool&quot; id=&quot;fullcredits&quot; default=&quot;false&quot;&gt;&lt;/setting&gt;" dest="5">
6                                 <expression></expression>
7                         </RegExp>
8                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable IMPAwards&quot; type=&quot;bool&quot; id=&quot;impawards&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
9                                 <expression></expression>
10                         </RegExp>
11                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable MoviePosterDB&quot; type=&quot;bool&quot; id=&quot;movieposterdb&quot; default=&quot;false&quot;&gt;&lt;/setting&gt;" dest="5+">
12                                 <expression></expression>
13                         </RegExp>
14                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable Trailer&quot; type=&quot;bool&quot; id=&quot;trailer&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
15                                 <expression></expression>
16                         </RegExp>
17                         <RegExp input="$$1" output="&lt;setting label=&quot;Enable Fanart&quot; type=&quot;bool&quot; id=&quot;fanart&quot; default=&quot;true&quot;&gt;&lt;/setting&gt;" dest="5+">
18                                 <expression></expression>
19                         </RegExp>
                           <!-- Image size choice, read elsewhere in this file as $INFO[imdbscale]. The ampersand in the label is written as &amp;amp; because the output attribute carries escaped XML: after this file is parsed it must still read &amp; inside the generated <setting> element. -->
20                         <RegExp input="$$1" output="&lt;setting label=&quot;IMDB Poster &amp;amp; Actor Thumb(s) Size&quot; type=&quot;labelenum&quot; values=&quot;192|256|384|512|1024&quot; id=&quot;imdbscale&quot; default=&quot;512&quot;&gt;&lt;/setting&gt;" dest="5+">
21                                 <expression></expression>
22                         </RegExp>
                           <!-- Entry of type "sep" with no label or id (presumably a visual separator; confirm against the settings documentation). -->
23                         <RegExp input="$$1" output="&lt;setting type=&quot;sep&quot;&gt;&lt;/setting&gt;" dest="5+">
24                                 <expression></expression>
25                         </RegExp>
                           <!-- Host name used to build IMDb URLs, read elsewhere in this file as $INFO[url]; the default is akas.imdb.com. -->
26                         <RegExp input="$$1" output="&lt;setting label=&quot;Input Alternative IMDb Source&quot; type=&quot;text&quot; id=&quot;url&quot; default=&quot;akas.imdb.com&quot;&gt;&lt;/setting&gt;" dest="5+">
27                                 <expression></expression>
28                         </RegExp>
29                         <expression noclean="1"></expression>
30                 </RegExp>
31         </GetSettings>
32         <NfoUrl dest="3">
                   <!-- Looks for an IMDb link in the NFO text ($$1) and emits <url>...</url><id>tt...</id> into buffer 3, the dest of this function. -->
                   <!-- Legacy link form imdb.com/Title?NNNNNNN. Group 1 already ends with "/", so the output template appends "title/..." directly; writing "/title/..." here would yield "imdb.com//title/...". -->
33                 <RegExp input="$$1" output="&lt;url&gt;http://www.\1title/tt\2/&lt;/url&gt;&lt;id&gt;tt\2&lt;/id&gt;"  dest="3">
34                         <expression clear="yes" noclean="1">(imdb.com/)Title\?([0-9]*)</expression>
35                 </RegExp>
                   <!-- Current link form imdb.com/title/ttNNNNNNN. Group 1 ends with "tt", so \1\2 rebuilds the full path and "tt\2" the id. -->
                   <!-- NOTE(review): this rule appends to buffer 3 (dest="3+") but also sets clear="yes". If the engine empties the destination when clear is set, the result of the legacy rule above is discarded; confirm against the scraper parser before relying on the legacy form. -->
36                 <RegExp input="$$1" output="&lt;url&gt;http://www.\1\2/&lt;/url&gt;&lt;id&gt;tt\2&lt;/id&gt;"  dest="3+">
37                         <expression clear="yes" noclean="1">(imdb.com/title/tt)([0-9]*)</expression>
38                 </RegExp>
39         </NfoUrl>
40         <CreateSearchUrl dest="3">
                   <!-- Builds the title search URL on the configured host: http://$INFO[url]/find?s=tt;q= followed by the match on $$1 and the contents of buffer 4. The result goes to buffer 3, the dest of this function. -->
41                 <RegExp input="$$1" output="&lt;url&gt;http://$INFO[url]/find?s=tt;q=\1$$4&lt;/url&gt;" dest="3">
                           <!-- When $$2 is non-empty (pattern (.+)), buffer 4 becomes "%20(" + $$2 + ")", i.e. an encoded space and the value in parentheses. Presumably $$2 is the release year; confirm against the caller. -->
42                         <RegExp input="$$2" output="%20(\1)" dest="4">
43                                 <expression clear="yes">(.+)</expression>
44                         </RegExp>
45                         <expression noclean="1"></expression>
46                 </RegExp>
47         </CreateSearchUrl>
48         <GetSearchResults dest="8">
                   <!-- Turns the fetched search page ($$1) into a <results> document made of <entity> elements (title, year, url, id). Entities are collected in buffer 5; the outer rule prepends an XML declaration (encoding iso-8859-1), wraps buffer 5 in <results> and stores it in buffer 8, the dest of this function. -->
49                 <RegExp input="$$5" output="&lt;?xml version=&quot;1.0&quot; encoding=&quot;iso-8859-1&quot; standalone=&quot;yes&quot;?&gt;&lt;results&gt;\1&lt;/results&gt;" dest="8">
                           <!-- Captures the id from a "/title/<id>/faq" link into buffer 7. Presumably this link only exists when the search landed directly on a title page; confirm. -->
50                         <RegExp input="$$1" output="\1" dest="7">
51                                 <expression clear="yes">/title/([t0-9]*)/faq</expression>
52                         </RegExp>
                           <!-- Single-result case: title and year come from <meta name="title" content="Title (Year)">, url and id from buffer 7. -->
53                         <RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\1&lt;/title&gt;&lt;year&gt;\2&lt;/year&gt;&lt;url&gt;http://$INFO[url]/title/$$7/&lt;/url&gt;&lt;id&gt;$$7&lt;/id&gt;&lt;/entity&gt;" dest="5">
54                                 <expression clear="yes" noclean="1">&lt;meta name=&quot;title&quot; content=&quot;([^&quot;]*) \(([0-9]*)\)</expression>
55                         </RegExp>
                           <!-- Copies the page from the first occurrence of ><a href="/title onward into buffer 4 so that the list rule below scans only that part. -->
56                         <RegExp input="$$1" output="\1" dest="4">
57                                 <expression noclean="1">(&gt;&lt;a href=&quot;/title.*)</expression>
58                         </RegExp>
                           <!-- List case: for every link of the form <a href="/title/<id>/...">Title</a> (Year in buffer 4, adds one entity to buffer 5 (dest="5+"). -->
59                         <RegExp input="$$4" output="&lt;entity&gt;&lt;title&gt;\2&lt;/title&gt;&lt;year&gt;\3&lt;/year&gt;&lt;url&gt;http://$INFO[url]/title/\1/&lt;/url&gt;&lt;id&gt;\1&lt;/id&gt;&lt;/entity&gt;" dest="5+">
60                                 <expression repeat="yes" noclean="1,2">&gt;&lt;a href=&quot;/title/([t0-9]*)/[^&gt;]*&gt;([^&lt;]*)&lt;/a&gt; *\(([0-9]*)</expression>
61                         </RegExp>
62                         <expression clear="yes" noclean="1"></expression>
63                 </RegExp>
64         </GetSearchResults>
65         <GetDetails clearbuffers="no" dest="3">
                   <!-- Builds the <details> document for one title. The nested rules collect child elements in buffer 5 (dest="5", then dest="5+"); the outer rule wraps buffer 5 in <details> and stores it in buffer 3, the dest of this function. Besides plain fields it emits <url function="..."> entries that name other functions of this file. -->
                   <!-- $$1 is matched against page markup below; $$2 is emitted as the <id> and used in cache file names; $$3 is used as the URL prefix for plotsummary, fullcredits and posters. Presumably these are the title page, the IMDb id and the title page URL; confirm against the caller. -->
66                 <RegExp input="$$5" output="&lt;details&gt;\1&lt;/details&gt;" dest="3">
67                         <RegExp input="$$2" output="&lt;id&gt;\1&lt;/id&gt;" dest="5">
68                                 <expression></expression>
69                         </RegExp>
                           <!-- Title: text after <title> up to the first excluded character. NOTE(review): inside the character class, "|" and the second "^" are literal characters, so the capture also stops at "|" or "^" and not only at "<" or "("; confirm whether that is intended. -->
70                         <RegExp input="$$1" output="&lt;title&gt;\1&lt;/title&gt;" dest="5+">
71                                 <expression trim="1" noclean="1">&lt;title&gt;([^&lt;|^(]*)</expression>
72                         </RegExp>
                           <!-- Year from the /Sections/Years/<year> link. -->
73                         <RegExp input="$$1" output="&lt;year&gt;\1&lt;/year&gt;" dest="5+">
74                                 <expression>a href=&quot;/Sections/Years/([0-9]*)</expression>
75                         </RegExp>
                           <!-- Rank from the "Top 250: #N" link text. -->
76                         <RegExp input="$$1" output="&lt;top250&gt;\1&lt;/top250&gt;" dest="5+">
77                                 <expression>Top 250: #([0-9]*)&lt;/a&gt;</expression>
78                         </RegExp>
                           <!-- MPAA text following the MPAA heading: one arbitrary character, then everything up to the next "<". -->
79                         <RegExp input="$$1" output="&lt;mpaa&gt;\1&lt;/mpaa&gt;" dest="5+">
80                                 <expression>MPAA&lt;/a&gt;:&lt;/h5&gt;(.[^&lt;]*)</expression>
81                         </RegExp>
                           <!-- One <certification> per /List?certificates= link: the link text (\1) followed by the optional <i>...</i> annotation (\3). -->
82                         <RegExp input="$$1" output="&lt;certification&gt;\1 \3&lt;/certification&gt;" dest="5+">
83                                 <expression repeat="yes">&lt;a href=&quot;/List\?certificates=[^&quot;]*&quot;&gt;([^&lt;]*)&lt;/a&gt;[^&lt;]*(&lt;i&gt;([^&lt;]*)&lt;/i&gt;)?</expression>
84                         </RegExp>
85                         <RegExp input="$$1" output="&lt;tagline&gt;\1&lt;/tagline&gt;" dest="5+">
86                                 <expression>&lt;h5&gt;Tagline:&lt;/h5&gt;([^&lt;]*)</expression>
87                         </RegExp>
                           <!-- Runtime: skips non-digits after the heading, then captures up to the next "<". -->
88                         <RegExp input="$$1" output="&lt;runtime&gt;\1&lt;/runtime&gt;" dest="5+">
89                                 <expression trim="1">&lt;h5&gt;Runtime:&lt;/h5&gt;[^0-9]*([^&lt;]*)</expression>
90                         </RegExp>
                           <!-- Rating (N.N out of 10) and vote count taken from the same markup fragment. -->
91                         <RegExp input="$$1" output="&lt;rating&gt;\1&lt;/rating&gt;&lt;votes&gt;\2&lt;/votes&gt;" dest="5+">
92                                 <expression>&lt;b&gt;([0-9.]+)/10&lt;/b&gt;[^&lt;]*&lt;a href=&quot;ratings&quot; class=&quot;tn15more&quot;&gt;([0-9,]+) votes&lt;/a&gt;</expression>
93                         </RegExp>
                           <!-- One <genre> per /Sections/Genres/ link and one <studio> per /company/ link. -->
94                         <RegExp input="$$1" output="&lt;genre&gt;\1&lt;/genre&gt;" dest="5+">
95                                 <expression repeat="yes">&quot;/Sections/Genres/[^/]*/&quot;&gt;([^&lt;]*)&lt;/a&gt;</expression>
96                         </RegExp>
97                         <RegExp input="$$1" output="&lt;studio&gt;\1&lt;/studio&gt;" dest="5+">
98                                 <expression repeat="yes">&quot;/company/[^/]*/&quot;&gt;([^&lt;]*)&lt;/a&gt;</expression>
99                         </RegExp>
                            <!-- The short plot text from the title page fills both <outline> and <plot>. -->
100                         <RegExp input="$$1" output="&lt;outline&gt;\1&lt;/outline&gt;&lt;plot&gt;\1&lt;/plot&gt;" dest="5+">
101                                 <expression>Plot:&lt;/h5&gt;(.*?)&lt;a class=&quot;tn15more</expression>
102                         </RegExp>
                            <!-- Queues $$3plotsummary for GetMoviePlot, which emits its own <plot>. -->
103                         <RegExp input="$$2" output="&lt;url function=&quot;GetMoviePlot&quot;&gt;$$3plotsummary&lt;/url&gt;" dest="5+">
104                                 <expression></expression>
105                         </RegExp>
                            <!-- Credits, short form (setting fullcredits off): cast, directors and writers are all read from $$3 itself. The three entries share the cache name $$2-credits.html, presumably so the page is fetched only once; confirm. -->
106                         <RegExp conditional="!fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-credits.html&quot; function=&quot;GetMovieCast&quot;&gt;$$3&lt;/url&gt;" dest="5+">
107                                 <expression></expression>
108                         </RegExp>
109                         <RegExp conditional="!fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-credits.html&quot; function=&quot;GetMovieDirectors&quot;&gt;$$3&lt;/url&gt;" dest="5+">
110                                 <expression></expression>
111                         </RegExp>
112                         <RegExp conditional="!fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-credits.html&quot; function=&quot;GetMovieWriters&quot;&gt;$$3&lt;/url&gt;" dest="5+">
113                                 <expression></expression>
114                         </RegExp>
                            <!-- Credits, full form (setting fullcredits on): the same three functions are pointed at $$3fullcredits, with the shared cache name $$2-fullcredits.html. -->
115                         <RegExp conditional="fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetMovieCast&quot;&gt;$$3fullcredits&lt;/url&gt;" dest="5+">
116                                 <expression></expression>
117                         </RegExp>
118                         <RegExp conditional="fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetMovieDirectors&quot;&gt;$$3fullcredits&lt;/url&gt;" dest="5+">
119                                 <expression></expression>
120                         </RegExp>
121                         <RegExp conditional="fullcredits" input="$$2" output="&lt;url cache=&quot;$$2-fullcredits.html&quot; function=&quot;GetMovieWriters&quot;&gt;$$3fullcredits&lt;/url&gt;" dest="5+">
122                                 <expression></expression>
123                         </RegExp>
                            <!-- Poster sources. GetIMPALink (setting impawards) and GetIMDBPoster both read $$3posters under the cache name $$2-posters.html. -->
124                         <RegExp conditional="impawards" input="$$2" output="&lt;url cache=&quot;$$2-posters.html&quot; function=&quot;GetIMPALink&quot;&gt;$$3posters&lt;/url&gt;" dest="5+">
125                                 <expression></expression>
126                         </RegExp>
                            <!-- MoviePosterDB search (setting movieposterdb): the search term is the part of the id after "tt", taken from the "/title/tt<id>/faq" link. -->
127                         <RegExp conditional="movieposterdb" input="$$1" output="&lt;url function=&quot;GetMoviePosterDBLink&quot;&gt;http://www.movieposterdb.com/browse/search?title=\1&lt;/url&gt;" dest="5+">
128                                 <expression>/title/tt([t0-9]*)/faq</expression>
129                         </RegExp>
                            <!-- Trailer (setting trailer): the first /vi<digits>/" reference on the page selects the player URL passed to GetTrailer. -->
130                         <RegExp conditional="trailer" input="$$1" output="&lt;url function=&quot;GetTrailer&quot;&gt;http://$INFO[url]/video/imdb/vi\1/player&lt;/url&gt;" dest="5+">
131                                 <expression>/vi([0-9]*)/&quot;</expression>
132                         </RegExp>
                            <!-- GetIMDBPoster is queued unconditionally, after the optional poster sources above. -->
133                         <RegExp input="$$2" output="&lt;url cache=&quot;$$2-posters.html&quot; function=&quot;GetIMDBPoster&quot;&gt;$$3posters&lt;/url&gt;" dest="5+">
134                                 <expression></expression>
135                         </RegExp>
                            <!-- Fanart (setting fanart): themoviedb.org lookup by $$2. The query separator is written as &amp;amp; because the output attribute carries escaped XML: it must still read &amp; inside the generated <url> element. -->
136                         <RegExp conditional="fanart" input="$$2" output="&lt;url function=&quot;GetTMDBId&quot;&gt;http://api.themoviedb.org/2.0/Movie.imdbLookup?imdb_id=$$2&amp;amp;api_key=57983e31fb435df4df77afb854740ea9&lt;/url&gt;" dest="5+">
137                                 <expression></expression>
138                         </RegExp>
139                         <expression noclean="1"></expression>
140                 </RegExp>
141         </GetDetails>
142         <GetMoviePlot clearbuffers="no" dest="5">
                    <!-- Extracts a plot from the fetched page ($$1): the nested rule stores <plot>...</plot> in buffer 2 and the outer rule wraps buffer 2 in <details>, written to buffer 5, the dest of this function. -->
143                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
                            <!-- Captures the text on the line that follows the first <p class="plotpar"> tag, up to the next line break. -->
144                         <RegExp input="$$1" output="&lt;plot&gt;\1&lt;/plot&gt;" dest="2">
145                                 <expression clear="yes">&lt;p class="plotpar"&gt;\n([^\n]*)</expression>
146                         </RegExp>
147                         <expression noclean="1"></expression>
148                 </RegExp>
149         </GetMoviePlot>
150         <GetMovieCast clearbuffers="no" dest="5">
                    <!-- Extracts the cast list from the fetched page ($$1) in three steps (buffers 6, 7, 2); the outer rule wraps buffer 2 in <details>, written to buffer 5, the dest of this function. -->
151                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
                            <!-- Step 1: copy the inside of <table class="cast">...</table> into buffer 6. -->
152                         <RegExp input="$$1" output="\1" dest="6">
153                                 <expression clear="yes" noclean="1">&lt;table class=&quot;cast&quot;&gt;(.*?)&lt;/table&gt;</expression>
154                         </RegExp>
                            <!-- Step 2: one <actor> per cast row into buffer 7. The image URL is optional; when present it is split into a prefix ending in "." (\1) and ".jpg" (\2), and _SX<size>_SY<size>_ built from $INFO[imdbscale] is inserted between them. \3 is the name, \4 the role. -->
155                         <RegExp input="$$6" output="&lt;actor&gt;&lt;thumb&gt;\1_SX$INFO[imdbscale]_SY$INFO[imdbscale]_\2&lt;/thumb&gt;&lt;name&gt;\3&lt;/name&gt;&lt;role&gt;\4&lt;/role&gt;&lt;/actor&gt;" dest="7">
156                                 <expression clear="yes" repeat="yes" noclean="1,2" trim="3,4">&lt;img src=&quot;(?:([^&quot;]*\.)[^&quot;]*(\.jpg))?[^&gt;]*[^&quot;]*&quot;nm&quot;&gt;&lt;a href=&quot;[^&quot;]*[^&gt;]*&gt;([^&lt;]*)&lt;[^&quot;]*&quot;ddd&quot;&gt; ... [^&quot;]*&quot;char&quot;&gt;(.*?)&lt;/td&gt;</expression>
157                         </RegExp>
                            <!-- Step 3: rewrite buffer 7 into buffer 2. A thumb that starts with http is kept (\1); a thumb consisting only of the bare _SXn_SYn_ marker, left by step 2 for rows without an image, is not captured, so that actor gets an empty <thumb>. The noclean list names group 3 although the pattern has only two capturing groups. -->
158                         <RegExp input="$$7" output="&lt;actor&gt;&lt;thumb&gt;\1&lt;/thumb&gt;\2&lt;/actor&gt;" dest="2+">
159                                 <expression clear="yes" repeat="yes" noclean="1,2,3">&lt;actor&gt;&lt;thumb&gt;(?:(http.*?)|_SX[0-9]+_SY[0-9]+_)&lt;/thumb&gt;(.*?)&lt;/actor&gt;</expression>
160                         </RegExp>
161                         <expression noclean="1"></expression>
162                 </RegExp>
163         </GetMovieCast>
164         <GetMovieDirectors clearbuffers="no" dest="5">
                    <!-- Extracts director names from the fetched page ($$1): the directors section is isolated in buffer 6, each /name/ link in it becomes a <director> in buffer 2, and the outer rule wraps buffer 2 in <details>, written to buffer 5, the dest of this function. -->
165                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
                            <!-- Section markup differs by source page: with fullcredits off, the block from >Director...</h5> to the closing </div>; with fullcredits on, the text from "Directed by" to the next name=" attribute. Only one of the two rules applies, depending on the setting. -->
166                         <RegExp conditional="!fullcredits" input="$$1" output="\1" dest="6">
167                                 <expression clear="yes" noclean="1">&gt;Director.*?&lt;/h5&gt;(.*?)&lt;/div&gt;</expression>
168                         </RegExp>
169                         <RegExp conditional="fullcredits" input="$$1" output="\1" dest="6">
170                                 <expression clear="yes" noclean="1">Directed by(.*?)name=&quot;</expression>
171                         </RegExp>
                            <!-- One <director> per <a href="/name/...">Name< link found in buffer 6. -->
172                         <RegExp input="$$6" output="&lt;director&gt;\1&lt;/director&gt;" dest="2+">
173                                 <expression clear="yes" repeat="yes">&lt;a href=&quot;/name/[^&gt;]*&gt;([^&lt;]*)&lt;</expression>
174                         </RegExp>
175                         <expression noclean="1"></expression>
176                 </RegExp>
177         </GetMovieDirectors>
178         <GetMovieWriters clearbuffers="no" dest="5">
                    <!-- Extracts writer names from the fetched page ($$1): the writers section is isolated in buffer 6, each /name/ link in it becomes a <credits> element in buffer 2, and the outer rule wraps buffer 2 in <details>, written to buffer 5, the dest of this function. -->
179                 <RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
                            <!-- Section markup differs by source page: with fullcredits off, the block from >Writer...:</h5> to the closing </div>; with fullcredits on, the text from "Writing credits" to the next name=" attribute. -->
180                         <RegExp conditional="!fullcredits" input="$$1" output="\1" dest="6">
181                                 <expression clear="yes" noclean="1">&gt;Writer.*?:&lt;/h5&gt;(.*?)&lt;/div&gt;</expression>
182                         </RegExp>
183                         <RegExp conditional="fullcredits" input="$$1" output="\1" dest="6">
184                                 <expression clear="yes" noclean="1">Writing credits(.*?)name=&quot;</expression>
185                         </RegExp>
                            <!-- One <credits> per <a href="/name/...">Name< link found in buffer 6. -->
186                         <RegExp input="$$6" output="&lt;credits&gt;\1&lt;/credits&gt;" dest="2+">
187                                 <expression clear="yes" repeat="yes">&lt;a href=&quot;/name/[^&gt;]*&gt;([^&lt;]*)&lt;</expression>
188                         </RegExp>
189                         <expression noclean="1"></expression>
190                 </RegExp>
191         </GetMovieWriters>
192         <GetIMPALink clearbuffers="no" dest="5">
                    <!-- Finds an impawards.com link in the fetched page ($$1) and re-emits it, host prefix (\1) and path (\2) unchanged, as a <url> entry that names GetIMPAPosters. The result is written to buffer 5, the dest of this function. -->
193                 <RegExp input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetIMPAPosters&quot;&gt;http://\1impawards.com/\2&lt;/url&gt;&lt;/details&gt;" dest="5">
194                         <expression clear="yes" noclean="1,2">http://([^&quot;]*)impawards.com/([^&quot;]*)&quot;&gt;</expression>
195                 </RegExp>
196         </GetIMPALink>
197         <GetIMPAPosters clearbuffers="no" dest="5">
                    <!-- Reads an impawards.com page ($$1). The dest of this function is buffer 5, which only the redirect rule writes; poster thumbs go to buffers 8 and 9, which GetIMDBPoster in this file takes as part of its input. -->
                    <!-- Redirect page: a meta REFRESH target is re-queued for this same function on www.impawards.com; the part of the target before its first "/" is dropped. -->
198                 <RegExp input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetIMPAPosters&quot;&gt;http://www.impawards.com/\1&lt;/url&gt;&lt;/details&gt;" dest="5">
199                         <expression clear="yes">&lt;meta http-equiv=&quot;REFRESH&quot; content=&quot;0;URL=[^/]*/([^&quot;]*)&quot;&gt;</expression>
200                 </RegExp>
                    <!-- Directory part of a value="/<dir>/<page>.html"> attribute, stored in buffer 4 and used as the path prefix for both thumb rules below. -->
201                 <RegExp input="$$1" output="\1" dest="4">
202                         <expression clear="yes" noclean="1">value=&quot;/([^&quot;]*)/[^&quot;]*\.html&quot;&gt;</expression>
203                 </RegExp>
                    <!-- Main poster: the file name from <img src="posters/<file>" (attribute name matched as SRC or src), emitted as a <thumb> into buffer 8. -->
204                 <RegExp input="$$1" output="&lt;thumb&gt;http://www.impawards.com/$$4/posters/\2&lt;/thumb&gt;" dest="8+">
205                         <expression clear="yes" noclean="1">&lt;img (SRC|src)=&quot;posters/([^&quot;]*)&quot;</expression>
206                 </RegExp>
                    <!-- Alternate versions: every thumbs/imp_<name containing "ver">.jpg reference is mapped to the file of the same name under posters/ and emitted as a <thumb> into buffer 9. -->
207                 <RegExp input="$$1" output="&lt;thumb&gt;http://www.impawards.com/$$4/posters/\1&lt;/thumb&gt;" dest="9+">
208                         <expression clear="yes" repeat="yes" noclean="1">thumbs/imp_([^&gt;]*ver[^&gt;]*.jpg)&gt;</expression>
209                 </RegExp>
210         </GetIMPAPosters>
211         <GetMoviePosterDBLink dest="6" clearbuffers="no">
                    <!-- Takes the first http://www.movieposterdb.com/movie/... link (up to the closing quote) from the fetched search page ($$1) and emits it as a <url> entry that names GetMoviePosterDB. The result is written to buffer 6, the dest of this function. -->
212                 <RegExp input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetMoviePosterDB&quot;&gt;\1&lt;/url&gt;&lt;/details&gt;" dest="6">
213                         <expression>(http://www.movieposterdb.com/movie/[^&quot;]*)&quot;</expression>
214                 </RegExp>
215         </GetMoviePosterDBLink>
216         <GetMoviePosterDB clearbuffers="no" dest="12">
                    <!-- Collects poster thumbs from a MoviePosterDB page ($$1) into buffer 10, which GetIMDBPoster in this file takes as part of its input. No rule here writes buffer 12, the dest of this function. -->
                    <!-- For each "poster" image, the single lower-case letter before the "_" in the src file name is replaced by "l" (presumably selecting the large variant; confirm against the site's naming). -->
217                 <RegExp input="$$1" output="&lt;thumb&gt;\1l_\2&lt;/thumb&gt;" dest="10+">
218                         <expression clear="yes" repeat="yes" noclean="1,2">&quot;poster&quot;.*?src=&quot;(.*?)[a-z]_(.*?)&quot;</expression>
219                 </RegExp>
220         </GetMoviePosterDB>
221         <GetTrailer clearbuffers="no" dest="5">
                    <!-- Builds a <trailer urlencoded="yes"> entry from the fetched player page ($$1), only when the trailer setting is on. The value is assembled in buffer 2 and wrapped in <details>, written to buffer 5, the dest of this function. -->
222                 <RegExp conditional="trailer" input="$$2" output="&lt;details&gt;&lt;trailer urlencoded=&quot;yes&quot;&gt;\1&lt;/trailer&gt;&lt;/details&gt;" dest="5">
                            <!-- Buffer 2 first receives the quoted value that follows "file". Neither nested rule sets clear, so buffer 2 is not reset here when a pattern does not match. -->
223                         <RegExp input="$$1" output="\1" dest="2">
224                                 <expression noclean="1">&quot;file&quot;[^&quot;]*&quot;([^&quot;]*)</expression>
225                         </RegExp>
                            <!-- Buffer 2 is then rewritten as its previous content, a "/", and the quoted value that follows "id". -->
226                         <RegExp input="$$1" output="$$2/\1" dest="2">
227                                 <expression noclean="1">&quot;id&quot;[^&quot;]*&quot;([^&quot;]*)</expression>
228                         </RegExp>
229                         <expression noclean="1"></expression>
230                 </RegExp>
231         </GetTrailer>
232         <GetIMDBPoster dest="5">
                    <!-- Emits the final <thumbs> list. The outer rule takes the concatenation of buffers 8, 9, 10 and 11 as input: 8 and 9 are written by GetIMPAPosters, 10 by GetMoviePosterDB, and 11 by the nested rules here. It wraps them in <details><thumbs> and writes buffer 5, the dest of this function. Unlike the other poster functions, this one does not set clearbuffers="no". -->
233                 <RegExp input="$$8$$9$$10$$11" output="&lt;details&gt;&lt;thumbs&gt;\1&lt;/thumbs&gt;&lt;/details&gt;" dest="5">
                            <!-- From the <a name="poster"> block of the fetched page ($$1): keeps the image URL up to the first "_S" (\1) and the ".jpg" ending (\2), and puts _SX<size>_SY<size>_ built from $INFO[imdbscale] between them; stored in buffer 6. -->
234                         <RegExp input="$$1" output="\1_SX$INFO[imdbscale]_SY$INFO[imdbscale]_\2" dest="6">
235                                 <expression noclean="1,2">&lt;a name=&quot;poster&quot;.*?src=&quot;(.*?)_S.*?(.jpg)&quot;.*?&lt;/a&gt;</expression>
236                         </RegExp>
                            <!-- Buffer 6 becomes a <thumb> in buffer 11 only if it contains the rescaled _SXn_SYn_ file name form produced by the rule above. -->
237                         <RegExp input="$$6" output="&lt;thumb&gt;\1&lt;/thumb&gt;" dest="11">
238                                 <expression clear="yes" noclean="1">(.*?_SX[0-9]+_SY[0-9]+_.jpg)</expression>
239                         </RegExp>
240                         <expression noclean="1"></expression>
241                 </RegExp>
242         </GetIMDBPoster>
243         <GetTMDBId dest="5">
                    <!-- When the fanart setting is on, takes the first numeric <id>...</id> from the fetched lookup response ($$1) and emits a Movie.getInfo request for that id as a <url> entry that names GetTMDBFanart. The result is written to buffer 5, the dest of this function. -->
                    <!-- The query separator is written as &amp;amp; because the output attribute carries escaped XML: it must still read &amp; inside the generated <url> element. -->
244                 <RegExp conditional="fanart" input="$$1" output="&lt;details&gt;&lt;url function=&quot;GetTMDBFanart&quot;&gt;http://api.themoviedb.org/2.0/Movie.getInfo?id=\1&amp;amp;api_key=57983e31fb435df4df77afb854740ea9&lt;/url&gt;&lt;/details&gt;" dest="5">
245                         <expression>&lt;id&gt;([0-9]*)&lt;/id&gt;</expression>
246                 </RegExp>
247         </GetTMDBId>
248         <GetTMDBFanart dest="5">
                    <!-- Builds a <fanart url="http://themoviedb.org/image/backdrops"> element whose <thumb> children hold paths relative to that url. Thumbs are collected in buffer 2; the outer rule requires buffer 2 to be non-empty (pattern (.+)) before writing buffer 5, the dest of this function. -->
249                 <RegExp input="$$2" output="&lt;details&gt;&lt;fanart url=&quot;http://themoviedb.org/image/backdrops&quot;&gt;\1&lt;/fanart&gt;&lt;/details&gt;" dest="5">
                            <!-- For every <backdrop size="original"> entry in the fetched response ($$1): \1 is the numeric directory, \2 the file name without extension, \3 the extension. The preview attribute points at <name>_poster.<ext> in the same directory. -->
250                         <RegExp input="$$1" output="&lt;thumb preview=&quot;/\1/\2_poster.\3&quot;&gt;/\1/\2.\3&lt;/thumb&gt;" dest="2">
251                                 <expression repeat="yes">&lt;backdrop size=&quot;original&quot;&gt;.*?/([0-9]+)/([^\.]+)\.([^&lt;]*)&lt;/backdrop&gt;</expression>
252                         </RegExp>
253                         <expression noclean="1">(.+)</expression>
254                 </RegExp>
255         </GetTMDBFanart>
256         </scraper>