From 0746c9a34a3031ce7d5244e0270f22300f937078 Mon Sep 17 00:00:00 2001
From: Kovid Goyal <kovid@kovidgoyal.net>
Date: Thu, 29 Nov 2007 05:38:00 +0000
Subject: [PATCH] Add url_search_order parameter to web2lrf DefaultProfile

---
 src/libprs500/ebooks/lrf/web/profiles/__init__.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/libprs500/ebooks/lrf/web/profiles/__init__.py b/src/libprs500/ebooks/lrf/web/profiles/__init__.py
index dd255a11db..c9428ea079 100644
--- a/src/libprs500/ebooks/lrf/web/profiles/__init__.py
+++ b/src/libprs500/ebooks/lrf/web/profiles/__init__.py
@@ -34,6 +34,7 @@ class DefaultProfile(object):
     delay                 = 0     # Delay between consecutive downloads
     timeout               = 10    # Timeout for fetching files from server in seconds
     timefmt               = ' [%a %d %b %Y]' # The format of the date shown on the first page
+    url_search_order      = ['guid', 'link'] # THe order of elements to search for a URL when parssing the RSS feed
     pubdate_fmt           = None  # The format string used to parse the publication date in the RSS feed. If set to None some default heuristics are used, these may fail, in which case set this to the correct string or re-implement strptime in your subclass.
     no_stylesheets        = False # Download stylesheets only if False 
     match_regexps         = []    # List of regular expressions that determines which links to follow
@@ -172,9 +173,11 @@ class DefaultProfile(object):
                         continue
                     pubdate = pubdate.string
                     pubdate = pubdate.replace('+0000', 'GMT')
-                    url = item.find('guid')
-                    if not url:
-                        url = item.find('link')
+                    for element in self.url_search_order:
+                        url = item.find(element)
+                        if url:
+                            break
+                        
                     if not url or not url.string:
                         self.logger.debug('Skipping article as it does not have a link url')
                         continue