mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
Filter audio books from amazon metadata download results
This commit is contained in:
parent
773c564174
commit
4cc36cac1a
@@ -549,7 +549,8 @@ class Amazon(Source):
|
|||||||
r'//div[@id="Results"]/descendant::td[starts-with(@id, "search:Td:")]'):
|
r'//div[@id="Results"]/descendant::td[starts-with(@id, "search:Td:")]'):
|
||||||
for a in td.xpath(r'descendant::td[@class="dataColumn"]/descendant::a[@href]/span[@class="srTitle"]/..'):
|
for a in td.xpath(r'descendant::td[@class="dataColumn"]/descendant::a[@href]/span[@class="srTitle"]/..'):
|
||||||
title = tostring(a, method='text', encoding=unicode).lower()
|
title = tostring(a, method='text', encoding=unicode).lower()
|
||||||
if 'bulk pack' not in title:
|
if ('bulk pack' not in title and '[audiobook]' not in
|
||||||
|
title and '[audio cd]' not in title):
|
||||||
matches.append(a.get('href'))
|
matches.append(a.get('href'))
|
||||||
break
|
break
|
||||||
|
|
||||||
|
@@ -313,7 +313,7 @@ class Source(Plugin):
|
|||||||
title_patterns = [(re.compile(pat, re.IGNORECASE), repl) for pat, repl in
|
title_patterns = [(re.compile(pat, re.IGNORECASE), repl) for pat, repl in
|
||||||
[
|
[
|
||||||
# Remove things like: (2010) (Omnibus) etc.
|
# Remove things like: (2010) (Omnibus) etc.
|
||||||
(r'(?i)[({\[](\d{4}|omnibus|anthology|hardcover|paperback|turtleback|mass\s*market|edition|ed\.)[\])}]', ''),
|
(r'(?i)[({\[](\d{4}|omnibus|anthology|hardcover|audiobook|audio\scd|paperback|turtleback|mass\s*market|edition|ed\.)[\])}]', ''),
|
||||||
# Remove any strings that contain the substring edition inside
|
# Remove any strings that contain the substring edition inside
|
||||||
# parentheses
|
# parentheses
|
||||||
(r'(?i)[({\[].*?(edition|ed.).*?[\]})]', ''),
|
(r'(?i)[({\[].*?(edition|ed.).*?[\]})]', ''),
|
||||||
|
Loading…
x
Reference in New Issue
Block a user