skip the wayback archive for the index page

This commit is contained in:
Kovid Goyal 2022-11-19 10:37:51 +05:30
parent 8db5fff5ac
commit 176171a116
No known key found for this signature in database
GPG Key ID: 06BC317B515ACE7C
2 changed files with 6 additions and 6 deletions

View File

@@ -101,8 +101,8 @@ class NewYorkTimes(BasicNewsRecipe):
self._nyt_parser = ans = load_module('calibre.web.site_parsers.nytimes')
return ans
-def get_nyt_page(self, url):
-if use_wayback_machine:
+def get_nyt_page(self, url, skip_wayback=False):
+if use_wayback_machine and not skip_wayback:
from calibre import browser
return self.nyt_parser.download_url(url, browser())
return self.browser.open_novisit(url).read()
@@ -123,7 +123,7 @@ class NewYorkTimes(BasicNewsRecipe):
def read_todays_paper(self):
INDEX = 'https://www.nytimes.com/section/todayspaper'
# INDEX = 'file:///t/raw.html'
-return self.index_to_soup(self.get_nyt_page(INDEX))
+return self.index_to_soup(self.get_nyt_page(INDEX, skip_wayback=True))
def read_nyt_metadata(self):
soup = self.read_todays_paper()

View File

@@ -101,8 +101,8 @@ class NewYorkTimes(BasicNewsRecipe):
self._nyt_parser = ans = load_module('calibre.web.site_parsers.nytimes')
return ans
-def get_nyt_page(self, url):
-if use_wayback_machine:
+def get_nyt_page(self, url, skip_wayback=False):
+if use_wayback_machine and not skip_wayback:
from calibre import browser
return self.nyt_parser.download_url(url, browser())
return self.browser.open_novisit(url).read()
@@ -123,7 +123,7 @@ class NewYorkTimes(BasicNewsRecipe):
def read_todays_paper(self):
INDEX = 'https://www.nytimes.com/section/todayspaper'
# INDEX = 'file:///t/raw.html'
-return self.index_to_soup(self.get_nyt_page(INDEX))
+return self.index_to_soup(self.get_nyt_page(INDEX, skip_wayback=True))
def read_nyt_metadata(self):
soup = self.read_todays_paper()