From 5398c0fc64b68fb67cf30285cb746431aa0488e5 Mon Sep 17 00:00:00 2001
From: Charles Haley <>
Date: Tue, 26 Apr 2011 11:17:50 +0100
Subject: [PATCH] First cut at amazon.uk store plugin.

---
 src/calibre/gui2/store/amazon_plugin.py    |   6 +-
 src/calibre/gui2/store/amazon_uk_plugin.py | 188 ++-------------------
 2 files changed, 15 insertions(+), 179 deletions(-)

diff --git a/src/calibre/gui2/store/amazon_plugin.py b/src/calibre/gui2/store/amazon_plugin.py
index a68e4611f0..55fb613288 100644
--- a/src/calibre/gui2/store/amazon_plugin.py
+++ b/src/calibre/gui2/store/amazon_plugin.py
@@ -116,8 +116,9 @@ class AmazonKindleStore(StorePlugin):
             store_link = 'http://www.amazon.com/dp/%(asin)s/?tag=%(tag)s' % aff_id
         open_url(QUrl(store_link))
 
+    search_url = 'http://www.amazon.com/s/url=search-alias%3Ddigital-text&field-keywords='
     def search(self, query, max_results=10, timeout=60):
-        url = 'http://www.amazon.com/s/url=search-alias%3Ddigital-text&field-keywords=' + urllib2.quote(query)
+        url =  self.search_url + urllib2.quote(query)
         br = browser()
 
         counter = max_results
@@ -179,8 +180,9 @@ class AmazonKindleStore(StorePlugin):
 
                 yield s
 
+    details_url = 'http://amazon.com/dp/'
     def get_details(self, search_result, timeout):
-        url = 'http://amazon.com/dp/'
+        url = self.details_url
 
         br = browser()
         with closing(br.open(url + search_result.detail_item, timeout=timeout)) as nf:
diff --git a/src/calibre/gui2/store/amazon_uk_plugin.py b/src/calibre/gui2/store/amazon_uk_plugin.py
index a68e4611f0..e24ddb485e 100644
--- a/src/calibre/gui2/store/amazon_uk_plugin.py
+++ b/src/calibre/gui2/store/amazon_uk_plugin.py
@@ -6,192 +6,26 @@ __license__ = 'GPL 3'
 __copyright__ = '2011, John Schember <john@nachtimwald.com>'
 __docformat__ = 'restructuredtext en'
 
-import random
-import re
-import urllib2
-from contextlib import closing
-
-from lxml import html
 
 from PyQt4.Qt import QUrl
 
-from calibre import browser
 from calibre.gui2 import open_url
-from calibre.gui2.store import StorePlugin
-from calibre.gui2.store.search_result import SearchResult
+from calibre.gui2.store.amazon_plugin import AmazonKindleStore
 
-class AmazonKindleStore(StorePlugin):
+class AmazonUKKindleStore(AmazonKindleStore):
+
+    '''
+    For comments on the implementation, please see amazon_plugin.py
+    '''
 
     def open(self, parent=None, detail_item=None, external=False):
-        '''
-        Amazon comes with a number of difficulties.
-
-        QWebView has major issues with Amazon.com. The largest of
-        issues is it simply doesn't work on a number of pages.
-
-        When connecting to a number parts of Amazon.com (Kindle library
-        for instance) QNetworkAccessManager fails to connect with a
-        NetworkError of 399 - ProtocolFailure. The strange thing is,
-        when I check QNetworkRequest.HttpStatusCodeAttribute when the
-        399 error is returned the status code is 200 (Ok). However, once
-        the QNetworkAccessManager decides there was a NetworkError it
-        does not download the page from Amazon. So I can't even set the
-        HTML in the QWebView myself.
-
-        There is http://bugreports.qt.nokia.com/browse/QTWEBKIT-259 an
-        open bug about the issue but it is not correct. We can set the
-        useragent (Arora does) to something else and the above issue
-        will persist. This http://developer.qt.nokia.com/forums/viewthread/793
-        gives a bit more information about the issue but as of now (27/Feb/2011)
-        there is no solution or work around.
-
-        We cannot change the The linkDelegationPolicy to allow us to avoid
-        QNetworkAccessManager because it only works links. Forms aren't
-        included so the same issue persists on any part of the site (login)
-        that use a form to load a new page.
-
-        Using an aStore was evaluated but I've decided against using it.
-        There are three major issues with an aStore. Because checkout is
-        handled by sending the user to Amazon we can't put it in a QWebView.
-        If we're sending the user to Amazon sending them there directly is
-        nicer. Also, we cannot put the aStore in a QWebView and let it open the
-        redirection the users default browser because the cookies with the
-        shopping cart won't transfer.
-
-        Another issue with the aStore is how it handles the referral. It only
-        counts the referral for the items in the shopping card / the item
-        that directed the user to Amazon. Kindle books do not use the shopping
-        cart and send the user directly to Amazon for the purchase. In this
-        instance we would only get referral credit for the one book that the
-        aStore directs to Amazon that the user buys. Any other purchases we
-        won't get credit for.
-
-        The last issue with the aStore is performance. Even though it's an
-        Amazon site it's alow. So much slower than Amazon.com that it makes
-        me not want to browse books using it. The look and feel are lesser
-        issues. So is the fact that it almost seems like the purchase is
-        with calibre. This can cause some support issues because we can't
-        do much for issues with Amazon.com purchase hiccups.
-
-        Another option that was evaluated was the Product Advertising API.
-        The reasons against this are complexity. It would take a lot of work
-        to basically re-create Amazon.com within calibre. The Product
-        Advertising API is also designed with being run on a server not
-        in an app. The signing keys would have to be made avaliable to ever
-        calibre user which means bad things could be done with our account.
-
-        The Product Advertising API also assumes the same browser for easy
-        shopping cart transfer to Amazon. With QWebView not working and there
-        not being an easy way to transfer cookies between a QWebView and the
-        users default browser this won't work well.
-
-        We could create our own website on the calibre server and create an
-        Amazon Product Advertising API store. However, this goes back to the
-        complexity argument. Why spend the time recreating Amazon.com
-
-        The final and largest issue against using the Product Advertising API
-        is the Efficiency Guidelines:
-
-        "Each account used to access the Product Advertising API will be allowed
-        an initial usage limit of 2,000 requests per hour. Each account will
-        receive an additional 500 requests per hour (up to a maximum of 25,000
-        requests per hour) for every $1 of shipped item revenue driven per hour
-        in a trailing 30-day period. Usage thresholds are recalculated daily based
-        on revenue performance."
-
-        With over two million users a limit of 2,000 request per hour could
-        render our store unusable for no other reason than Amazon rate
-        limiting our traffic.
-
-        The best (I use the term lightly here) solution is to open Amazon.com
-        in the users default browser and set the affiliate id as part of the url.
-        '''
-        aff_id = {'tag': 'josbl0e-cpb-20'}
-        # Use Kovid's affiliate id 30% of the time.
-        if random.randint(1, 10) in (1, 2, 3):
-            aff_id['tag'] = 'calibrebs-20'
-        store_link = 'http://www.amazon.com/Kindle-eBooks/b/?ie=UTF&node=1286228011&ref_=%(tag)s&ref=%(tag)s&tag=%(tag)s&linkCode=ur2&camp=1789&creative=390957' % aff_id
+        aff_id = {'tag': 'calcharles-21'}
+        store_link = 'http://www.amazon.co.uk/Kindle-eBooks/b/?ie=UTF&node=1286228011&ref_=%(tag)s&ref=%(tag)s&tag=%(tag)s&linkCode=ur2&camp=1789&creative=390957' % aff_id
         if detail_item:
             aff_id['asin'] = detail_item
-            store_link = 'http://www.amazon.com/dp/%(asin)s/?tag=%(tag)s' % aff_id
+            store_link = 'http://www.amazon.co.uk/dp/%(asin)s/?tag=%(tag)s' % aff_id
         open_url(QUrl(store_link))
 
-    def search(self, query, max_results=10, timeout=60):
-        url = 'http://www.amazon.com/s/url=search-alias%3Ddigital-text&field-keywords=' + urllib2.quote(query)
-        br = browser()
-
-        counter = max_results
-        with closing(br.open(url, timeout=timeout)) as f:
-            doc = html.fromstring(f.read())
-            for data in doc.xpath('//div[@class="productData"]'):
-                if counter <= 0:
-                    break
-
-                # Even though we are searching digital-text only Amazon will still
-                # put in results for non Kindle books (author pages). Se we need
-                # to explicitly check if the item is a Kindle book and ignore it
-                # if it isn't.
-                type = ''.join(data.xpath('//span[@class="format"]/text()'))
-                if 'kindle' not in type.lower():
-                    continue
-
-                # We must have an asin otherwise we can't easily reference the
-                # book later.
-                asin_href = None
-                asin_a = data.xpath('div[@class="productTitle"]/a[1]')
-                if asin_a:
-                    asin_href = asin_a[0].get('href', '')
-                    m = re.search(r'/dp/(?P<asin>.+?)(/|$)', asin_href)
-                    if m:
-                        asin = m.group('asin')
-                    else:
-                        continue
-                else:
-                    continue
-
-                cover_url = ''
-                if asin_href:
-                    cover_img = data.xpath('//div[@class="productImage"]/a[@href="%s"]/img/@src' % asin_href)
-                    if cover_img:
-                        cover_url = cover_img[0]
-                        parts = cover_url.split('/')
-                        bn = parts[-1]
-                        f, _, ext = bn.rpartition('.')
-                        if '_' in f:
-                            bn = f.partition('_')[0]+'_SL160_.'+ext
-                            parts[-1] = bn
-                            cover_url = '/'.join(parts)
-
-                title = ''.join(data.xpath('div[@class="productTitle"]/a/text()'))
-                author = ''.join(data.xpath('div[@class="productTitle"]/span[@class="ptBrand"]/text()'))
-                author = author.split('by')[-1]
-                price = ''.join(data.xpath('div[@class="newPrice"]/span/text()'))
-
-                counter -= 1
-
-                s = SearchResult()
-                s.cover_url = cover_url
-                s.title = title.strip()
-                s.author = author.strip()
-                s.price = price.strip()
-                s.detail_item = asin.strip()
-                s.formats = 'Kindle'
-
-                yield s
-
-    def get_details(self, search_result, timeout):
-        url = 'http://amazon.com/dp/'
-
-        br = browser()
-        with closing(br.open(url + search_result.detail_item, timeout=timeout)) as nf:
-            idata = html.fromstring(nf.read())
-            if idata.xpath('boolean(//div[@class="content"]//li/b[contains(text(), "Simultaneous Device Usage")])'):
-                if idata.xpath('boolean(//div[@class="content"]//li[contains(., "Unlimited") and contains(b, "Simultaneous Device Usage")])'):
-                    search_result.drm = SearchResult.DRM_UNLOCKED
-                else:
-                    search_result.drm = SearchResult.DRM_UNKNOWN
-            else:
-                search_result.drm = SearchResult.DRM_LOCKED
-        return True
-
+    search_url = 'http://www.amazon.co.uk/s/url=search-alias%3Ddigital-text&field-keywords='
+    details_url = 'http://amazon.co.uk/dp/'