From 121a2c9ac3ae82b2d1b81372a1338c8e4785da49 Mon Sep 17 00:00:00 2001 From: j Date: Sat, 15 Nov 2014 01:05:33 +0000 Subject: [PATCH] ignore osx resource forks --- oml/media/epub.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/oml/media/epub.py b/oml/media/epub.py index e60bd83..fa4361a 100644 --- a/oml/media/epub.py +++ b/oml/media/epub.py @@ -85,11 +85,13 @@ def info(epub): return data def extract_text(path): - data = b'' + data = '' z = zipfile.ZipFile(path) for f in z.filelist: + if '/._' in f.filename or f.filename.startswith('._'): + continue if f.filename.endswith('html'): - data += z.read(f.filename) + data += z.read(f.filename).decode() return data def extract_isbn(data):