Index: imdb.xml =================================================================== --- imdb.xml (revision 30958) +++ imdb.xml (working copy) @@ -1,5 +1,5 @@ - - + + common/imdb.xml common/tmdb.xml common/movieposterdb.xml @@ -35,15 +35,15 @@ - - (imdb.com)/Title\?([0-9]*) + + (imdb.com)/Title\?([0-9]*) - + (imdb.com/title/tt)([0-9]*) - - + + (.+) @@ -55,13 +55,13 @@ og:url" content=".+?/title/([t0-9]*)/ - + <meta name="title" content="([^"]*) \([^\)0-9]*([0-9]+)\) (><a href="/title.*) - + ><a href="/title/([t0-9]*)/[^>]*>([^<]*)</a> *\(([0-9]*) @@ -76,44 +76,35 @@ <h1 class="header" itemprop="name">([^<]*) - a href="/year/([0-9]*) + a href="/year/([0-9]*) Top 250 #([0-9]*)</a> - MPAA</a>\)</h4>\n([^<]*) + MPAA</a>\)</h4>\n?<span itemprop="contentRating">([^<]*) - <a href="/search/title\?certificates=[^"]*">([^<]*)</a>[^<]*(<i>([^<]*)</i>)? + <a href="/search/title\?certificates=[^"]*">([^<]*)</a>[^<]*(<i>([^<]*)</i>)? - >Taglines:</h4>([^<]*) + <h4[^>]*?>Taglines:</h4>\n?([^<]*) - >Runtime:</h4>[^0-9]*([,0-9]+) min + <h4[^>]*?>Runtime:</h4>[^0-9]*([0-9]+) - - "star-bar-user-rate"><b>([0-9.]+).*?>.*?title="([0-9,]+)\s + + <span itemprop="ratingValue">([0-9.]+).*?>.*?title="([0-9,]+)\s - - >([0-9,]+) votes</a> - "/genre/[^/]*">([^<]*)</a> "/company/[^/]*/">([^<]*)</a> - - - reviews</a></span>(.*?)(?:<a href="plotsummary">|</p>) + + <p>\n<p itemprop="description">([^<]+)</p> - - ([^\n]+) - - - @@ -144,17 +135,17 @@ /title/tt([t0-9]*)/faq - - /vi([0-9]*)/ + + /vi([0-9]*)/ - - - - <h1>([^<]*) - - ([a-zA-Z0-9]+) - - + + + + <h1>([^<]*) + + ([a-zA-Z0-9]+) + + Index: common/imdb.xml =================================================================== --- common/imdb.xml (revision 30958) +++ common/imdb.xml (working copy) @@ -23,47 +23,41 @@ - - Writers?\:(.*?)</div> + + Writer[s]?.*?</h4>(.*?)<div class - - Writing credits(.*?)name=" - - /name/[^>"]*">([^<]*)< + <a href="/name[^>]*>([^<]*)< - - <table class="cast_list">(.*?)</table> + + <table class="cast_list">(.*?)</table> - - <table class="cast">(.*?)</table> + + <noscript><img \n[^a]*alt="([^"]*)"[^"]*"[^"]*"[^s]*src="(?:([^"]*\.)[^"]*(\.jpg))[^>]*.*?ter">[^>]*>\n\s*(<[^>]*>)?([^<\(]*)? - - <img src="(?:([^"]*\.)[^"]*(\.jpg))?[^>]*[^"]*"nm"><a href="[^"]*[^>]*>([^<]*)<[^"]*"ddd">([^<]<)?[^"]*"char">(.*?)</td> + + <img \n[^a]*alt="([^"]*)"[^"]*"[^"]*"[^s]*src="(?:[^"]*\.[^"]*\.png)" class="" />*.*?ter">[^>]*>\n\s*(<[^>]*>)?([^<\(]*)? - <actor><thumb>(?:(http.*?)|_SX[0-9]+_SY[0-9]+_)</thumb>(.*?)</actor> + <actor><thumb>(?:(http.*?)|_SX[0-9]+_SY[0-9]+_)?</thumb>(.*?)</actor> - + - - Directors?\:(.*?)</div> + + Director[s]?.*?</h4>(.*?)<div class - - Directed by(.*?)</table> - - /name/[^>"]*">([^<]*)< + <a href="/name[^>]*>([^<]*)< - +