mirror of
https://github.com/kovidgoyal/calibre.git
synced 2025-07-09 03:04:10 -04:00
Set the Referer when accessing cached pages
This commit is contained in:
parent
122a1de44d
commit
faf46f844f
@@ -1221,7 +1221,9 @@ class Amazon(Source):
|
|||||||
matches = []
|
matches = []
|
||||||
se = search_engines_module()
|
se = search_engines_module()
|
||||||
urlproc = se.bing_url_processor
|
urlproc = se.bing_url_processor
|
||||||
for result in se.bing_search(terms, site, log=log, br=br, timeout=timeout):
|
results, qurl = se.bing_search(terms, site, log=log, br=br, timeout=timeout)
|
||||||
|
br.set_current_header('Referer', qurl)
|
||||||
|
for result in results:
|
||||||
if abort.is_set():
|
if abort.is_set():
|
||||||
return matches, terms, domain, None
|
return matches, terms, domain, None
|
||||||
|
|
||||||
|
@@ -129,12 +129,12 @@ def ddg_search(terms, site=None, br=None, log=prints, safe_search=False, dump_ra
|
|||||||
ans = []
|
ans = []
|
||||||
for a in root.xpath('//*[@class="results"]//*[@class="result__title"]/a[@href and @class="result__a"]'):
|
for a in root.xpath('//*[@class="results"]//*[@class="result__title"]/a[@href and @class="result__a"]'):
|
||||||
ans.append(Result(ddg_href(a.get('href')), tostring(a), None))
|
ans.append(Result(ddg_href(a.get('href')), tostring(a), None))
|
||||||
return ans
|
return ans, url
|
||||||
|
|
||||||
|
|
||||||
def ddg_develop():
|
def ddg_develop():
|
||||||
br = browser()
|
br = browser()
|
||||||
for result in ddg_search('heroes abercrombie'.split(), 'www.amazon.com', dump_raw='/t/raw.html', br=br):
|
for result in ddg_search('heroes abercrombie'.split(), 'www.amazon.com', dump_raw='/t/raw.html', br=br)[0]:
|
||||||
if '/dp/' in result.url:
|
if '/dp/' in result.url:
|
||||||
print(result.title)
|
print(result.title)
|
||||||
print(' ', result.url)
|
print(' ', result.url)
|
||||||
@@ -177,12 +177,12 @@ def bing_search(terms, site=None, br=None, log=prints, safe_search=False, dump_r
|
|||||||
cached_url = 'http://cc.bingj.com/cache.aspx?q={q}&d={d}&mkt=en-US&setlang=en-US&w={w}'.format(
|
cached_url = 'http://cc.bingj.com/cache.aspx?q={q}&d={d}&mkt=en-US&setlang=en-US&w={w}'.format(
|
||||||
q=q, d=d, w=w)
|
q=q, d=d, w=w)
|
||||||
ans.append(Result(a.get('href'), tostring(a), cached_url))
|
ans.append(Result(a.get('href'), tostring(a), cached_url))
|
||||||
return ans
|
return ans, url
|
||||||
|
|
||||||
|
|
||||||
def bing_develop():
|
def bing_develop():
|
||||||
br = browser()
|
br = browser()
|
||||||
for result in bing_search('heroes abercrombie'.split(), 'www.amazon.com', dump_raw='/t/raw.html', br=br):
|
for result in bing_search('heroes abercrombie'.split(), 'www.amazon.com', dump_raw='/t/raw.html', br=br)[0]:
|
||||||
if '/dp/' in result.url:
|
if '/dp/' in result.url:
|
||||||
print(result.title)
|
print(result.title)
|
||||||
print(' ', result.url)
|
print(' ', result.url)
|
||||||
@@ -220,12 +220,12 @@ def google_search(terms, site=None, br=None, log=prints, safe_search=False, dump
|
|||||||
c = div.xpath('descendant::div[@class="s"]//a[@class="fl"]')[0]
|
c = div.xpath('descendant::div[@class="s"]//a[@class="fl"]')[0]
|
||||||
cached_url = c.get('href')
|
cached_url = c.get('href')
|
||||||
ans.append(Result(a.get('href'), tostring(a), cached_url))
|
ans.append(Result(a.get('href'), tostring(a), cached_url))
|
||||||
return ans
|
return ans, url
|
||||||
|
|
||||||
|
|
||||||
def google_develop():
|
def google_develop():
|
||||||
br = browser()
|
br = browser()
|
||||||
for result in google_search('heroes abercrombie'.split(), 'www.amazon.com', dump_raw='/t/raw.html', br=br):
|
for result in google_search('heroes abercrombie'.split(), 'www.amazon.com', dump_raw='/t/raw.html', br=br)[0]:
|
||||||
if '/dp/' in result.url:
|
if '/dp/' in result.url:
|
||||||
print(result.title)
|
print(result.title)
|
||||||
print(' ', result.url)
|
print(' ', result.url)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user