From 846686c2de0bce3e22d369183326bfec302c0b3d Mon Sep 17 00:00:00 2001 From: Jamie Osborne Date: Tue, 26 Dec 2017 23:23:11 +0000 Subject: [PATCH 1/2] Case insensitive replacement of synopsis tags - Some pages have tags using capital letters: https://www.audible.com/pd/B002V8N9VG --- Contents/Code/__init__.py | 14 +++----------- 1 file changed, 3 insertions(+), 11 deletions(-) diff --git a/Contents/Code/__init__.py b/Contents/Code/__init__.py index 192371a..a9db443 100644 --- a/Contents/Code/__init__.py +++ b/Contents/Code/__init__.py @@ -542,17 +542,9 @@ def update(self, metadata, media, lang, force=False): #cleanup synopsis - synopsis = synopsis.replace("", "") - synopsis = synopsis.replace("", "") - synopsis = synopsis.replace("", "") - synopsis = synopsis.replace("", "") - synopsis = synopsis.replace("", "") - synopsis = synopsis.replace("", "") - synopsis = synopsis.replace("
", "") - synopsis = synopsis.replace("

", "") - synopsis = synopsis.replace("

", "\n") - - + synopsis = re.sub(r'<([pP]|br|br ?/)>', '\n', synopsis) + synopsis = re.sub(r'<(/?[iIuUbBpP])>', '', synopsis.strip()) + self.Log('date: %s', date) self.Log('title: %s', title) self.Log('author: %s', author) From 4bcca23525ef6c92b11bdfea5941236548bbdc84 Mon Sep 17 00:00:00 2001 From: Jamie Osborne Date: Sat, 30 Dec 2017 23:55:39 +0000 Subject: [PATCH 2/2] Also handle lists inside of summary text - https://www.audible.com/pd/B00OZ7WJQM --- Contents/Code/__init__.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/Contents/Code/__init__.py b/Contents/Code/__init__.py index a9db443..d6c37cb 100644 --- a/Contents/Code/__init__.py +++ b/Contents/Code/__init__.py @@ -542,8 +542,8 @@ def update(self, metadata, media, lang, force=False): #cleanup synopsis - synopsis = re.sub(r'<([pP]|br|br ?/)>', '\n', synopsis) - synopsis = re.sub(r'<(/?[iIuUbBpP])>', '', synopsis.strip()) + synopsis = re.sub(r'<([pP]|li|br|br ?/)>', '\n', synopsis) + synopsis = re.sub(r'', '', synopsis.strip()) self.Log('date: %s', date) self.Log('title: %s', title)