From 6b0df0e357d075516ee2b79bf622789262acd729 Mon Sep 17 00:00:00 2001 From: Kovid Goyal Date: Mon, 29 Jan 2007 18:12:34 +0000 Subject: [PATCH] --- src/libprs500/metadata/rtf.py | 28 ++++++++++++++++++++++------ 1 file changed, 22 insertions(+), 6 deletions(-) diff --git a/src/libprs500/metadata/rtf.py b/src/libprs500/metadata/rtf.py index c426930677..d84a1e4aef 100644 --- a/src/libprs500/metadata/rtf.py +++ b/src/libprs500/metadata/rtf.py @@ -12,17 +12,25 @@ ## You should have received a copy of the GNU General Public License along ## with this program; if not, write to the Free Software Foundation, Inc., ## 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. - +""" +Read metadata from RTF files. +""" import re, cStringIO from libprs500.metadata import MetaInformation -title_pat = re.compile(r'\{\\info.*?\{\\title(.*?)\}', re.DOTALL) -author_pat = re.compile(r'\{\\info.*?\{\\author(.*?)\}', re.DOTALL) -comment_pat = re.compile(r'\{\\info.*?\{\\subject(.*?)\}', re.DOTALL) -category_pat = re.compile(r'\{\\info.*?\{\\category(.*?)\}', re.DOTALL) +title_pat = re.compile(r'\{\\info.*?\{\\title(.*?)(? -1: + break if not found: return None, 0 data, count, = cStringIO.StringIO(), 0 pos = stream.tell() while True: ch = stream.read(1) + if ch == '\\': + data.write(ch + stream.read(1)) + continue if ch == '{': count += 1 elif ch == '}': @@ -53,6 +65,7 @@ def get_document_info(stream): return data.getvalue(), pos def get_metadata(stream): + """ Return metadata as a L{MetaInfo} object """ stream.seek(0) if stream.read(5) != r'{\rtf': raise Exception('Not a valid RTF file') @@ -79,6 +92,9 @@ def get_metadata(stream): def main(): import sys + if len(sys.argv) != 2: + print >> sys.stderr, "Usage:", sys.argv[0], " mybook.rtf" + sys.exit(1) print get_metadata(open(sys.argv[1])) if __name__ == '__main__':