mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
Store: SearchResult uses a different representation for DRM. Add Details download thread/pool. Change Amazon plugin to use details function instead of reading data in the search function.
This commit is contained in:
parent
b415c44cb6
commit
08b8ef818c
@ -76,11 +76,17 @@ class StorePlugin(object): # {{{
|
|||||||
return items as a generator.
|
return items as a generator.
|
||||||
|
|
||||||
Don't be lazy with the search! Load as much data as possible in the
|
Don't be lazy with the search! Load as much data as possible in the
|
||||||
:class:`calibre.gui2.store.search_result.SearchResult` object. If you have to parse
|
:class:`calibre.gui2.store.search_result.SearchResult` object.
|
||||||
multiple pages to get all of the data then do so. However, if data (such as cover_url)
|
However, if data (such as cover_url)
|
||||||
isn't available because the store does not display cover images then it's okay to
|
isn't available because the store does not display cover images then it's okay to
|
||||||
ignore it.
|
ignore it.
|
||||||
|
|
||||||
|
At the very least a :class:`calibre.gui2.store.search_result.SearchResult`
|
||||||
|
returned by this function must have the title, author and id.
|
||||||
|
|
||||||
|
If you have to parse multiple pages to get all of the data then implement
|
||||||
|
:meth:`get_deatils` for retrieving additional information.
|
||||||
|
|
||||||
Also, by default search results can only include ebooks. A plugin can offer users
|
Also, by default search results can only include ebooks. A plugin can offer users
|
||||||
an option to include physical books in the search results but this must be
|
an option to include physical books in the search results but this must be
|
||||||
disabled by default.
|
disabled by default.
|
||||||
@ -97,6 +103,9 @@ class StorePlugin(object): # {{{
|
|||||||
'''
|
'''
|
||||||
raise NotImplementedError()
|
raise NotImplementedError()
|
||||||
|
|
||||||
|
def get_details(self, search_result, timeout=60):
|
||||||
|
raise NotImplementedError()
|
||||||
|
|
||||||
def get_settings(self):
|
def get_settings(self):
|
||||||
'''
|
'''
|
||||||
This is only useful for plugins that implement
|
This is only useful for plugins that implement
|
||||||
|
@ -160,16 +160,6 @@ class AmazonKindleStore(StorePlugin):
|
|||||||
author = author.split('by')[-1]
|
author = author.split('by')[-1]
|
||||||
price = ''.join(data.xpath('div[@class="newPrice"]/span/text()'))
|
price = ''.join(data.xpath('div[@class="newPrice"]/span/text()'))
|
||||||
|
|
||||||
with closing(br.open(asin_href, timeout=timeout/4)) as nf:
|
|
||||||
idata = html.fromstring(nf.read())
|
|
||||||
if idata.xpath('boolean(//div[@class="content"]//li/b[contains(text(), "Simultaneous Device Usage")])'):
|
|
||||||
if idata.xpath('boolean(//div[@class="content"]//li[contains(., "Unlimited") and contains(b, "Simultaneous Device Usage")])'):
|
|
||||||
drm = False
|
|
||||||
else:
|
|
||||||
drm = None
|
|
||||||
else:
|
|
||||||
drm = True
|
|
||||||
|
|
||||||
counter -= 1
|
counter -= 1
|
||||||
|
|
||||||
s = SearchResult()
|
s = SearchResult()
|
||||||
@ -178,6 +168,21 @@ class AmazonKindleStore(StorePlugin):
|
|||||||
s.author = author.strip()
|
s.author = author.strip()
|
||||||
s.price = price.strip()
|
s.price = price.strip()
|
||||||
s.detail_item = asin.strip()
|
s.detail_item = asin.strip()
|
||||||
s.drm = drm
|
|
||||||
|
|
||||||
yield s
|
yield s
|
||||||
|
|
||||||
|
def get_details(self, search_result, timeout):
|
||||||
|
url = 'http://amazon.com/dp/'
|
||||||
|
|
||||||
|
br = browser()
|
||||||
|
with closing(br.open(url + search_result.detail_item, timeout=timeout)) as nf:
|
||||||
|
idata = html.fromstring(nf.read())
|
||||||
|
if idata.xpath('boolean(//div[@class="content"]//li/b[contains(text(), "Simultaneous Device Usage")])'):
|
||||||
|
if idata.xpath('boolean(//div[@class="content"]//li[contains(., "Unlimited") and contains(b, "Simultaneous Device Usage")])'):
|
||||||
|
search_result.drm = SearchResult.DRM_UNLOCKED
|
||||||
|
else:
|
||||||
|
search_result.drm = SearchResult.DRM_UNKNOWN
|
||||||
|
else:
|
||||||
|
search_result.drm = SearchResult.DRM_LOCKED
|
||||||
|
|
||||||
|
|
@ -21,6 +21,7 @@ from calibre import browser
|
|||||||
from calibre.gui2 import NONE
|
from calibre.gui2 import NONE
|
||||||
from calibre.gui2.progress_indicator import ProgressIndicator
|
from calibre.gui2.progress_indicator import ProgressIndicator
|
||||||
from calibre.gui2.store.search_ui import Ui_Dialog
|
from calibre.gui2.store.search_ui import Ui_Dialog
|
||||||
|
from calibre.gui2.store.search_result import SearchResult
|
||||||
from calibre.library.caches import _match, CONTAINS_MATCH, EQUALS_MATCH, \
|
from calibre.library.caches import _match, CONTAINS_MATCH, EQUALS_MATCH, \
|
||||||
REGEXP_MATCH
|
REGEXP_MATCH
|
||||||
from calibre.utils.config import DynamicConfig
|
from calibre.utils.config import DynamicConfig
|
||||||
@ -123,6 +124,8 @@ class SearchDialog(QDialog, Ui_Dialog):
|
|||||||
store_names = self.store_plugins.keys()
|
store_names = self.store_plugins.keys()
|
||||||
if not store_names:
|
if not store_names:
|
||||||
return
|
return
|
||||||
|
# Remove all of our internal filtering logic from the query.
|
||||||
|
query = self.clean_query(query)
|
||||||
shuffle(store_names)
|
shuffle(store_names)
|
||||||
# Add plugins that the user has checked to the search pool's work queue.
|
# Add plugins that the user has checked to the search pool's work queue.
|
||||||
for n in store_names:
|
for n in store_names:
|
||||||
@ -134,6 +137,29 @@ class SearchDialog(QDialog, Ui_Dialog):
|
|||||||
self.search_pool.start_threads()
|
self.search_pool.start_threads()
|
||||||
self.pi.startAnimation()
|
self.pi.startAnimation()
|
||||||
|
|
||||||
|
def clean_query(self, query):
|
||||||
|
query = query.lower()
|
||||||
|
# Remove control modifiers.
|
||||||
|
query = query.replace('\\', '')
|
||||||
|
query = query.replace('!', '')
|
||||||
|
query = query.replace('=', '')
|
||||||
|
query = query.replace('~', '')
|
||||||
|
query = query.replace('>', '')
|
||||||
|
query = query.replace('<', '')
|
||||||
|
# Remove the prefix.
|
||||||
|
for loc in ( 'all', 'author', 'authors', 'title'):
|
||||||
|
query = re.sub(r'%s:"?(?P<a>[^\s"]+)"?' % loc, '\g<a>', query)
|
||||||
|
# Remove the prefix and search text.
|
||||||
|
for loc in ('cover', 'drm', 'format', 'formats', 'price', 'store'):
|
||||||
|
query = re.sub(r'%s:"[^"]"' % loc, '', query)
|
||||||
|
query = re.sub(r'%s:[^\s]*' % loc, '', query)
|
||||||
|
# Remove logic.
|
||||||
|
query = re.sub(r'(^|\s)(and|not|or)(\s|$)', ' ', query)
|
||||||
|
# Remove excess whitespace.
|
||||||
|
query = re.sub(r'\s{2,}', ' ', query)
|
||||||
|
query = query.strip()
|
||||||
|
return query
|
||||||
|
|
||||||
def save_state(self):
|
def save_state(self):
|
||||||
self.config['store_search_geometry'] = self.saveGeometry()
|
self.config['store_search_geometry'] = self.saveGeometry()
|
||||||
self.config['store_search_store_splitter_state'] = self.store_splitter.saveState()
|
self.config['store_search_store_splitter_state'] = self.store_splitter.saveState()
|
||||||
@ -183,9 +209,9 @@ class SearchDialog(QDialog, Ui_Dialog):
|
|||||||
self.pi.stopAnimation()
|
self.pi.stopAnimation()
|
||||||
|
|
||||||
while self.search_pool.has_results():
|
while self.search_pool.has_results():
|
||||||
res = self.search_pool.get_result()
|
res, store_plugin = self.search_pool.get_result()
|
||||||
if res:
|
if res:
|
||||||
self.results_view.model().add_result(res)
|
self.results_view.model().add_result(res, store_plugin)
|
||||||
|
|
||||||
def open_store(self, index):
|
def open_store(self, index):
|
||||||
result = self.results_view.model().get_result(index)
|
result = self.results_view.model().get_result(index)
|
||||||
@ -307,38 +333,15 @@ class SearchThread(Thread):
|
|||||||
while self._run and not self.tasks.empty():
|
while self._run and not self.tasks.empty():
|
||||||
try:
|
try:
|
||||||
query, store_name, store_plugin, timeout = self.tasks.get()
|
query, store_name, store_plugin, timeout = self.tasks.get()
|
||||||
query = self._clean_query(query)
|
|
||||||
for res in store_plugin.search(query, timeout=timeout):
|
for res in store_plugin.search(query, timeout=timeout):
|
||||||
if not self._run:
|
if not self._run:
|
||||||
return
|
return
|
||||||
res.store_name = store_name
|
res.store_name = store_name
|
||||||
self.results.put(res)
|
self.results.put((res, store_plugin))
|
||||||
self.tasks.task_done()
|
self.tasks.task_done()
|
||||||
except:
|
except:
|
||||||
traceback.print_exc()
|
traceback.print_exc()
|
||||||
|
|
||||||
def _clean_query(self, query):
|
|
||||||
query = query.lower()
|
|
||||||
# Remove control modifiers.
|
|
||||||
query = query.replace('\\', '')
|
|
||||||
query = query.replace('!', '')
|
|
||||||
query = query.replace('=', '')
|
|
||||||
query = query.replace('~', '')
|
|
||||||
query = query.replace('>', '')
|
|
||||||
query = query.replace('<', '')
|
|
||||||
# Remove the prefix.
|
|
||||||
for loc in ( 'all', 'author', 'authors', 'title'):
|
|
||||||
query = re.sub(r'%s:"?(?P<a>[^\s"]+)"?' % loc, '\g<a>', query)
|
|
||||||
# Remove the prefix and search text.
|
|
||||||
for loc in ('cover', 'drm', 'format', 'formats', 'price', 'store'):
|
|
||||||
query = re.sub(r'%s:"[^"]"' % loc, '', query)
|
|
||||||
query = re.sub(r'%s:[^\s]*' % loc, '', query)
|
|
||||||
# Remove logic.
|
|
||||||
query = re.sub(r'(^|\s)(and|not|or)(\s|$)', ' ', query)
|
|
||||||
# Remove excess whitespace.
|
|
||||||
query = re.sub(r'\s{2,}', ' ', query)
|
|
||||||
return query
|
|
||||||
|
|
||||||
|
|
||||||
class CoverThreadPool(GenericDownloadThreadPool):
|
class CoverThreadPool(GenericDownloadThreadPool):
|
||||||
'''
|
'''
|
||||||
@ -381,6 +384,42 @@ class CoverThread(Thread):
|
|||||||
continue
|
continue
|
||||||
|
|
||||||
|
|
||||||
|
class DetailsThreadPool(GenericDownloadThreadPool):
|
||||||
|
'''
|
||||||
|
Once started all threads run until abort is called.
|
||||||
|
'''
|
||||||
|
|
||||||
|
def add_task(self, search_result, store_plugin, update_callback, timeout=10):
|
||||||
|
self.tasks.put((search_result, store_plugin, update_callback, timeout))
|
||||||
|
|
||||||
|
|
||||||
|
class DetailsThread(Thread):
|
||||||
|
|
||||||
|
def __init__(self, tasks, results):
|
||||||
|
Thread.__init__(self)
|
||||||
|
self.daemon = True
|
||||||
|
self.tasks = tasks
|
||||||
|
self.results = results
|
||||||
|
self._run = True
|
||||||
|
|
||||||
|
def abort(self):
|
||||||
|
self._run = False
|
||||||
|
|
||||||
|
def run(self):
|
||||||
|
while self._run:
|
||||||
|
try:
|
||||||
|
time.sleep(.1)
|
||||||
|
while not self.tasks.empty():
|
||||||
|
if not self._run:
|
||||||
|
break
|
||||||
|
result, store_plugin, callback, timeout = self.tasks.get()
|
||||||
|
if result:
|
||||||
|
store_plugin.get_details(result, timeout)
|
||||||
|
callback()
|
||||||
|
self.tasks.task_done()
|
||||||
|
except:
|
||||||
|
continue
|
||||||
|
|
||||||
class Matches(QAbstractItemModel):
|
class Matches(QAbstractItemModel):
|
||||||
|
|
||||||
HEADERS = [_('Cover'), _('Title'), _('Author(s)'), _('Price'), _('DRM'), _('Store')]
|
HEADERS = [_('Cover'), _('Title'), _('Author(s)'), _('Price'), _('DRM'), _('Store')]
|
||||||
@ -402,9 +441,12 @@ class Matches(QAbstractItemModel):
|
|||||||
self.search_filter = SearchFilter()
|
self.search_filter = SearchFilter()
|
||||||
self.cover_pool = CoverThreadPool(CoverThread, 2)
|
self.cover_pool = CoverThreadPool(CoverThread, 2)
|
||||||
self.cover_pool.start_threads()
|
self.cover_pool.start_threads()
|
||||||
|
self.details_pool = DetailsThreadPool(DetailsThread, 4)
|
||||||
|
self.details_pool.start_threads()
|
||||||
|
|
||||||
def closing(self):
|
def closing(self):
|
||||||
self.cover_pool.abort()
|
self.cover_pool.abort()
|
||||||
|
self.details_pool.abort()
|
||||||
|
|
||||||
def clear_results(self):
|
def clear_results(self):
|
||||||
self.all_matches = []
|
self.all_matches = []
|
||||||
@ -414,13 +456,16 @@ class Matches(QAbstractItemModel):
|
|||||||
self.query = ''
|
self.query = ''
|
||||||
self.cover_pool.abort()
|
self.cover_pool.abort()
|
||||||
self.cover_pool.start_threads()
|
self.cover_pool.start_threads()
|
||||||
|
self.details_pool.abort()
|
||||||
|
self.details_pool.start_threads()
|
||||||
self.reset()
|
self.reset()
|
||||||
|
|
||||||
def add_result(self, result):
|
def add_result(self, result, store_plugin):
|
||||||
self.layoutAboutToBeChanged.emit()
|
self.layoutAboutToBeChanged.emit()
|
||||||
self.all_matches.append(result)
|
self.all_matches.append(result)
|
||||||
self.search_filter.add_search_result(result)
|
self.search_filter.add_search_result(result)
|
||||||
self.cover_pool.add_task(result, self.filter_results)
|
self.cover_pool.add_task(result, self.filter_results)
|
||||||
|
self.details_pool.add_task(result, store_plugin, self.filter_results)
|
||||||
self.filter_results()
|
self.filter_results()
|
||||||
self.layoutChanged.emit()
|
self.layoutChanged.emit()
|
||||||
|
|
||||||
@ -438,7 +483,7 @@ class Matches(QAbstractItemModel):
|
|||||||
else:
|
else:
|
||||||
self.matches = list(self.search_filter.universal_set())
|
self.matches = list(self.search_filter.universal_set())
|
||||||
self.reorder_matches()
|
self.reorder_matches()
|
||||||
self.layoutAboutToBeChanged.emit()
|
self.layoutChanged.emit()
|
||||||
|
|
||||||
def set_query(self, query):
|
def set_query(self, query):
|
||||||
self.query = query
|
self.query = query
|
||||||
@ -487,11 +532,11 @@ class Matches(QAbstractItemModel):
|
|||||||
p.loadFromData(result.cover_data)
|
p.loadFromData(result.cover_data)
|
||||||
return QVariant(p)
|
return QVariant(p)
|
||||||
if col == 4:
|
if col == 4:
|
||||||
if result.drm:
|
if result.drm == SearchResult.DRM_LOCKED:
|
||||||
return QVariant(self.DRM_LOCKED_ICON)
|
return QVariant(self.DRM_LOCKED_ICON)
|
||||||
if result.drm == False:
|
if result.drm == SearchResult.DRM_UNLOCKED:
|
||||||
return QVariant(self.DRM_UNLOCKED_ICON)
|
return QVariant(self.DRM_UNLOCKED_ICON)
|
||||||
else:
|
elif result.drm == SearchResult.DRM_UNKNOWN:
|
||||||
return QVariant(self.DRM_UNKNOWN_ICON)
|
return QVariant(self.DRM_UNKNOWN_ICON)
|
||||||
elif role == Qt.SizeHintRole:
|
elif role == Qt.SizeHintRole:
|
||||||
return QSize(64, 64)
|
return QSize(64, 64)
|
||||||
@ -596,7 +641,7 @@ class SearchFilter(SearchQueryParser):
|
|||||||
accessor = q[locvalue]
|
accessor = q[locvalue]
|
||||||
if query == 'true':
|
if query == 'true':
|
||||||
if locvalue == 'drm':
|
if locvalue == 'drm':
|
||||||
if accessor(sr) == True:
|
if accessor(sr) == SearchResult.DRM_LOCKED:
|
||||||
matches.add(sr)
|
matches.add(sr)
|
||||||
else:
|
else:
|
||||||
if accessor(sr) is not None:
|
if accessor(sr) is not None:
|
||||||
@ -604,7 +649,7 @@ class SearchFilter(SearchQueryParser):
|
|||||||
continue
|
continue
|
||||||
if query == 'false':
|
if query == 'false':
|
||||||
if locvalue == 'drm':
|
if locvalue == 'drm':
|
||||||
if accessor(sr) == False:
|
if accessor(sr) == SearchResult.DRM_UNKNOWN:
|
||||||
matches.add(sr)
|
matches.add(sr)
|
||||||
else:
|
else:
|
||||||
if accessor(sr) is None:
|
if accessor(sr) is None:
|
||||||
|
@ -8,6 +8,10 @@ __docformat__ = 'restructuredtext en'
|
|||||||
|
|
||||||
class SearchResult(object):
|
class SearchResult(object):
|
||||||
|
|
||||||
|
DRM_LOCKED = 1
|
||||||
|
DRM_UNLOCKED = 2
|
||||||
|
DRM_UNKNOWN = 3
|
||||||
|
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
self.store_name = ''
|
self.store_name = ''
|
||||||
self.cover_url = ''
|
self.cover_url = ''
|
||||||
@ -16,8 +20,5 @@ class SearchResult(object):
|
|||||||
self.author = ''
|
self.author = ''
|
||||||
self.price = ''
|
self.price = ''
|
||||||
self.detail_item = ''
|
self.detail_item = ''
|
||||||
# None = Unknown.
|
|
||||||
# True = Has DRM.
|
|
||||||
# False = Does not have DRM.
|
|
||||||
self.drm = None
|
self.drm = None
|
||||||
self.formats = ''
|
self.formats = ''
|
||||||
|
Loading…
x
Reference in New Issue
Block a user