From: Mikael Frykholm Date: Fri, 1 Feb 2013 07:52:46 +0000 (+0100) Subject: Some refactoring for finding videoid. Added better title detection. X-Git-Url: https://git.frykholm.com/svtplaydump.git/commitdiff_plain/a750237037e1bb3920eab83b594a39758efe662e Some refactoring for finding videoid. Added better title detection. --- diff --git a/svtplaydump.py b/svtplaydump.py index 0718c30..066ed41 100755 --- a/svtplaydump.py +++ b/svtplaydump.py @@ -41,16 +41,12 @@ import sys def main(argv=None): if argv is None: argv=sys.argv + page = urllib2.urlopen(argv[1]).read() + soup = BeautifulSoup(page,convertEntities=BeautifulSoup.HTML_ENTITIES) + videoid = re.findall("svt_article_id=(.*)[&]*",page)[0] + flashvars = json.loads(urllib2.urlopen("http://www.svt.se/wd?widgetId=248134&sectionId=1024&articleId=%s&position=0&format=json&type=embed&contextSectionId=1024"%videoid).read()) try: - videoid = re.findall("/video/(.*)[/]*",argv[1])[0] - soup = BeautifulSoup(urllib2.urlopen("http://www.svtplay.se/video/%s/?type=embed"%videoid).read()) - flashvars = json.loads(soup.find("param", {"name":"flashvars",'value':True})['value'][5:]) - except(IndexError): - page = urllib2.urlopen(argv[1]).read() - videoid = re.findall("svt_article_id=(.*)[&]*",page)[0] - flashvars = json.loads(urllib2.urlopen("http://www.svt.se/wd?widgetId=248134&sectionId=1024&articleId=%s&position=0&format=json&type=embed&contextSectionId=1024"%videoid).read()) - try: - title = flashvars['statistics']['title'] + title = soup.find('meta',{'property':'og:title'}).attrMap['content'] except: title = "unnamed" if 'dynamicStreams' in flashvars: