From ed465c527fa47649c08c4eb4314b92203d101ac7 Mon Sep 17 00:00:00 2001 From: j <0x006A@0x2620.org> Date: Sun, 15 Mar 2015 02:38:38 +0530 Subject: [PATCH] better title --- ox/web/ubu.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/ox/web/ubu.py b/ox/web/ubu.py index da90bad..32094e9 100644 --- a/ox/web/ubu.py +++ b/ox/web/ubu.py @@ -39,6 +39,12 @@ def get_data(url): if 'title' in m: m['title'] = re.sub('(.*?) \(\d{4}\)$', '\\1', m['title']) + if not 'title' in m: + match = re.compile(".*?&(.*?)").findall(data) + if match: + m['title'] = match[0].strip() + if ' - ' in m['title']: + m['title'] = m['title'].split(' - ', 1)[-1] match = re.compile("flashvars','file=(.*?.flv)'").findall(data) if match: m['flv'] = match[0]