From 33eac400fdd9c0cd0788e0052bdf8824fd5eae42 Mon Sep 17 00:00:00 2001
From: Kovid Goyal <kovid@kovidgoyal.net>
Date: Mon, 22 Mar 2021 15:47:16 +0530
Subject: [PATCH] Get books: Fix smashwords plugin not working because of
 website changes

Fixes #1918737 [smashwords search doesn't work](https://bugs.launchpad.net/calibre/+bug/1918737)
---
 .../gui2/store/stores/smashwords_plugin.py    | 27 ++++++++++---------
 1 file changed, 14 insertions(+), 13 deletions(-)

diff --git a/src/calibre/gui2/store/stores/smashwords_plugin.py b/src/calibre/gui2/store/stores/smashwords_plugin.py
index 4d9cdf37fa..a27597882a 100644
--- a/src/calibre/gui2/store/stores/smashwords_plugin.py
+++ b/src/calibre/gui2/store/stores/smashwords_plugin.py
@@ -1,7 +1,7 @@
 # -*- coding: utf-8 -*-
 from __future__ import absolute_import, division, print_function, unicode_literals
 
-store_version = 5  # Needed for dynamic plugin loading
+store_version = 6  # Needed for dynamic plugin loading
 
 __license__ = 'GPL 3'
 __copyright__ = '2011, John Schember <john@nachtimwald.com>'
@@ -27,7 +27,7 @@ from calibre.gui2.store.search_result import SearchResult
 from calibre.gui2.store.web_store_dialog import WebStoreDialog
 
 
-def search(query, max_results=10, timeout=60):
+def search(query, max_results=10, timeout=60, save_raw=None):
     url = 'https://www.smashwords.com/books/search?query=' + quote(query)
 
     br = browser()
@@ -38,23 +38,24 @@ def search(query, max_results=10, timeout=60):
 
     counter = max_results
     with closing(br.open(url, timeout=timeout)) as f:
-        doc = html.fromstring(f.read())
-        for data in doc.xpath('//div[@id="pageContent"]//div[@class="library-book"]'):
+        raw = f.read()
+        if save_raw:
+            with open(save_raw, 'wb') as r:
+                r.write(raw)
+        doc = html.fromstring(raw)
+        for data in doc.xpath('//div[@id="pageContent"]//div[contains(@class, "library-book")]'):
             if counter <= 0:
                 break
             data = html.fromstring(html.tostring(data))
 
-            id = None
-            id_a = ''.join(data.xpath('//a[contains(@class, "library-title")]/@href'))
-            if id_a:
-                id = id_a.split('/')[-1]
-            if not id:
+            id_a = ''.join(data.xpath('//span[contains(@class, "library-title")]/a/@href'))
+            if not id_a:
                 continue
 
             cover_url = ''.join(data.xpath('//img[contains(@class, "book-list-image")]/@src'))
 
-            title = ''.join(data.xpath('.//a[contains(@class, "library-title")]/text()'))
-            author = ''.join(data.xpath('.//a[@itemprop="author"]//text()'))
+            title = ''.join(data.xpath('.//span[contains(@class, "library-title")]//text()'))
+            author = ''.join(data.xpath('.//span[contains(@class, "library-by-line")]/a//text()'))
 
             price = ''.join(data.xpath('.//div[@class="subnote"]//text()'))
             if 'Price:' in price:
@@ -74,7 +75,7 @@ def search(query, max_results=10, timeout=60):
             s.title = title.strip()
             s.author = author.strip()
             s.price = price
-            s.detail_item = '/books/view/' + id.strip()
+            s.detail_item = id_a
             s.drm = SearchResult.DRM_UNLOCKED
 
             yield s
@@ -119,5 +120,5 @@ class SmashwordsStore(BasicStoreConfig, StorePlugin):
 
 if __name__ == '__main__':
     import sys
-    for r in search(' '.join(sys.argv[1:])):
+    for r in search(' '.join(sys.argv[1:]), save_raw='/t/raw.html'):
         print(r)