def get_ids():
    """Collect the unique movie ids listed on filmsdivision.org.

    Requests the site's title search once for each letter ``A``-``Z`` and
    gathers every ``movId`` value linked from the returned pages.

    Returns:
        list: the distinct ``movId`` strings found, in sorted order.
    """
    # Compiled once, outside the loop. A raw string keeps the backslash
    # escapes as regex escapes rather than (invalid) string escapes, and the
    # dot in "view_video.php" is escaped so it only matches a literal dot.
    link_re = re.compile(r'view_video\.php\?movId=(.*?)[\'"]', re.DOTALL)
    ids = set()
    # string.ascii_uppercase instead of string.letters[26:]: the latter is
    # locale-dependent on Python 2 and no longer exists on Python 3.
    for letter in string.ascii_uppercase:
        url = "http://www.filmsdivision.org/search.php?title=%s" % letter
        # NOTE(review): assumes read_url returns text that a str pattern can
        # search -- confirm the return type when running under Python 3.
        data = ox.cache.read_url(url)
        ids.update(link_re.findall(data))
    # Sorted so repeated runs return the ids in a stable order.
    return sorted(ids)