Head r791

This commit is contained in:
Jon Tibble 2010-04-11 18:47:39 +01:00
parent 4eaec98a0f
commit 3f5ac846f6

View File

@ -24,23 +24,23 @@
############################################################################### ###############################################################################
# OOo API documentation: # OOo API documentation:
# http://wiki.services.openoffice.org/wiki/Documentation/BASIC_Guide/Structure_of_Text_Documents # http://wiki.services.openoffice.org/wiki/Documentation/BASIC_Guide/Structure_of_Text_Documents
# http://wiki.services.openoffice.org/wiki/Documentation/DevGuide/Text/Iterating_over_Text # http://wiki.services.openoffice.org/wiki/Documentation/DevGuide/Text/Iterating_over_Text
# http://www.oooforum.org/forum/viewtopic.phtml?t=14409 # http://www.oooforum.org/forum/viewtopic.phtml?t=14409
# http://wiki.services.openoffice.org/wiki/Python # http://wiki.services.openoffice.org/wiki/Python
import re import re
import os import os
import time import time
from PyQt4 import QtCore from PyQt4 import QtCore
from songimport import SongImport from songimport import SongImport
if os.name == u'nt': if os.name == u'nt':
from win32com.client import Dispatch from win32com.client import Dispatch
BOLD = 150.0 BOLD = 150.0
ITALIC = 2 ITALIC = 2
PAGE_BEFORE = 4 PAGE_BEFORE = 4
PAGE_AFTER = 5 PAGE_AFTER = 5
PAGE_BOTH = 6 PAGE_BOTH = 6
else: else:
import uno import uno
@ -95,15 +95,15 @@ class SofImport(object):
loop = 0 loop = 0
while ctx is None and loop < 5: while ctx is None and loop < 5:
try: try:
ctx = resolver.resolve(u'uno:socket,host=localhost,' \ ctx = resolver.resolve(u'uno:socket,host=localhost,' \
+ 'port=2002;urp;StarOffice.ComponentContext') + 'port=2002;urp;StarOffice.ComponentContext')
except: except:
pass pass
self.start_ooo_process() self.start_ooo_process()
loop += 1 loop += 1
manager = ctx.ServiceManager manager = ctx.ServiceManager
self.desktop = manager.createInstanceWithContext( self.desktop = manager.createInstanceWithContext(
"com.sun.star.frame.Desktop", ctx ) "com.sun.star.frame.Desktop", ctx )
def start_ooo_process(self): def start_ooo_process(self):
try: try:
@ -148,16 +148,16 @@ class SofImport(object):
def process_doc(self): def process_doc(self):
""" """
Process the RTF file, a paragraph at a time Process the RTF file, a paragraph at a time
""" """
self.blanklines = 0 self.blanklines = 0
self.new_song() self.new_song()
paragraphs = self.document.getText().createEnumeration() paragraphs = self.document.getText().createEnumeration()
while paragraphs.hasMoreElements(): while paragraphs.hasMoreElements():
paragraph = paragraphs.nextElement() paragraph = paragraphs.nextElement()
if paragraph.supportsService("com.sun.star.text.Paragraph"): if paragraph.supportsService("com.sun.star.text.Paragraph"):
self.process_paragraph(paragraph) self.process_paragraph(paragraph)
if self.song: if self.song:
self.song.finish() self.song.finish()
self.song = None self.song = None
def process_paragraph(self, paragraph): def process_paragraph(self, paragraph):
@ -171,71 +171,71 @@ class SofImport(object):
In later books, there may not be line breaks, so check for 3 or more In later books, there may not be line breaks, so check for 3 or more
newlines newlines
""" """
text = u'' text = u''
textportions = paragraph.createEnumeration() textportions = paragraph.createEnumeration()
while textportions.hasMoreElements(): while textportions.hasMoreElements():
textportion = textportions.nextElement() textportion = textportions.nextElement()
if textportion.BreakType in (PAGE_BEFORE, PAGE_BOTH): if textportion.BreakType in (PAGE_BEFORE, PAGE_BOTH):
self.process_paragraph_text(text) self.process_paragraph_text(text)
self.new_song() self.new_song()
text = u'' text = u''
text += self.process_textportion(textportion) text += self.process_textportion(textportion)
if textportion.BreakType in (PAGE_AFTER, PAGE_BOTH): if textportion.BreakType in (PAGE_AFTER, PAGE_BOTH):
self.process_paragraph_text(text) self.process_paragraph_text(text)
self.new_song() self.new_song()
text = u'' text = u''
self.process_paragraph_text(text) self.process_paragraph_text(text)
def process_paragraph_text(self, text): def process_paragraph_text(self, text):
""" """
Split the paragraph text into multiple lines and process Split the paragraph text into multiple lines and process
""" """
for line in text.split(u'\n'): for line in text.split(u'\n'):
self.process_paragraph_line(line) self.process_paragraph_line(line)
if self.blanklines > 2: if self.blanklines > 2:
self.new_song() self.new_song()
def process_paragraph_line(self, text): def process_paragraph_line(self, text):
""" """
Process a single line. Throw away that text which isn't relevant, i.e. Process a single line. Throw away that text which isn't relevant, i.e.
stuff that appears at the end of the song. stuff that appears at the end of the song.
Anything that is OK, append to the current verse Anything that is OK, append to the current verse
""" """
text = text.strip() text = text.strip()
if text == u'': if text == u'':
self.blanklines += 1 self.blanklines += 1
if self.blanklines > 1: if self.blanklines > 1:
return return
if self.song.get_title() != u'': if self.song.get_title() != u'':
self.finish_verse() self.finish_verse()
return return
self.blanklines = 0 self.blanklines = 0
if self.skip_to_close_bracket: if self.skip_to_close_bracket:
if text.endswith(u')'): if text.endswith(u')'):
self.skip_to_close_bracket = False self.skip_to_close_bracket = False
return return
if text.startswith(u'CCL Licence'): if text.startswith(u'CCL Licence'):
self.italics = False self.italics = False
return return
if text == u'A Songs of Fellowship Worship Resource': if text == u'A Songs of Fellowship Worship Resource':
return return
if text.startswith(u'(NB.') or text.startswith(u'(Regrettably') \ if text.startswith(u'(NB.') or text.startswith(u'(Regrettably') \
or text.startswith(u'(From'): or text.startswith(u'(From'):
self.skip_to_close_bracket = True self.skip_to_close_bracket = True
return return
if text.startswith(u'Copyright'): if text.startswith(u'Copyright'):
self.song.add_copyright(text) self.song.add_copyright(text)
return return
if text == u'(Repeat)': if text == u'(Repeat)':
self.finish_verse() self.finish_verse()
self.song.repeat_verse() self.song.repeat_verse()
return return
if self.song.get_title() == u'': if self.song.get_title() == u'':
if self.song.get_copyright() == u'': if self.song.get_copyright() == u'':
self.add_author(text) self.add_author(text)
else: else:
self.song.add_copyright(text) self.song.add_copyright(text)
return return
self.add_verse_line(text) self.add_verse_line(text)
def process_textportion(self, textportion): def process_textportion(self, textportion):
@ -244,41 +244,41 @@ class SofImport(object):
it's bold or italics. If it's bold then its a song number or song title. it's bold or italics. If it's bold then its a song number or song title.
Song titles are in all capitals, so we must bring the capitalization Song titles are in all capitals, so we must bring the capitalization
into line into line
""" """
text = textportion.getString() text = textportion.getString()
text = self.tidy_text(text) text = self.tidy_text(text)
if text.strip() == u'': if text.strip() == u'':
return text return text
if textportion.CharWeight == BOLD: if textportion.CharWeight == BOLD:
boldtext = text.strip() boldtext = text.strip()
if boldtext.isdigit() and self.song.get_song_number() == '': if boldtext.isdigit() and self.song.get_song_number() == '':
self.add_songnumber(boldtext) self.add_songnumber(boldtext)
return u'' return u''
if self.song.get_title() == u'': if self.song.get_title() == u'':
text = self.uncap_text(text) text = self.uncap_text(text)
self.add_title(text) self.add_title(text)
return text return text
if text.strip().startswith(u'('): if text.strip().startswith(u'('):
return text return text
self.italics = (textportion.CharPosture == ITALIC) self.italics = (textportion.CharPosture == ITALIC)
return text return text
def new_song(self): def new_song(self):
""" """
A change of song. Store the old, create a new A change of song. Store the old, create a new
... but only if the last song was complete. If not, stick with it ... but only if the last song was complete. If not, stick with it
""" """
if self.song: if self.song:
self.finish_verse() self.finish_verse()
if not self.song.check_complete(): if not self.song.check_complete():
return return
self.song.finish() self.song.finish()
self.song = SongImport(self.manager) self.song = SongImport(self.manager)
self.skip_to_close_bracket = False self.skip_to_close_bracket = False
self.is_chorus = False self.is_chorus = False
self.italics = False self.italics = False
self.currentverse = u'' self.currentverse = u''
def add_songnumber(self, song_no): def add_songnumber(self, song_no):
""" """
Add a song number, store as alternate title. Also use the song Add a song number, store as alternate title. Also use the song
@ -303,27 +303,27 @@ class SofImport(object):
""" """
Add the title to the song. Strip some leading/trailing punctuation that Add the title to the song. Strip some leading/trailing punctuation that
we don't want in a title we don't want in a title
""" """
title = text.strip() title = text.strip()
if title.startswith(u'\''): if title.startswith(u'\''):
title = title[1:] title = title[1:]
if title.endswith(u','): if title.endswith(u','):
title = title[:-1] title = title[:-1]
self.song.set_title(title) self.song.set_title(title)
def add_author(self, text): def add_author(self, text):
""" """
Add the author. OpenLP stores them individually so split by 'and', '&' Add the author. OpenLP stores them individually so split by 'and', '&'
and comma. and comma.
However need to check for "Mr and Mrs Smith" and turn it to However need to check for "Mr and Mrs Smith" and turn it to
"Mr Smith" and "Mrs Smith". "Mr Smith" and "Mrs Smith".
""" """
text = text.replace(u' and ', u' & ') text = text.replace(u' and ', u' & ')
for author in text.split(u','): for author in text.split(u','):
authors = author.split(u'&') authors = author.split(u'&')
for i in range(len(authors)): for i in range(len(authors)):
author2 = authors[i].strip() author2 = authors[i].strip()
if author2.find(u' ') == -1 and i < len(authors) - 1: if author2.find(u' ') == -1 and i < len(authors) - 1:
author2 = author2 + u' ' \ author2 = author2 + u' ' \
+ authors[i + 1].strip().split(u' ')[-1] + authors[i + 1].strip().split(u' ')[-1]
if author2.endswith(u'.'): if author2.endswith(u'.'):
@ -336,14 +336,14 @@ class SofImport(object):
Add a line to the current verse. If the formatting has changed and Add a line to the current verse. If the formatting has changed and
we're beyond the second line of first verse, then this indicates we're beyond the second line of first verse, then this indicates
a change of verse. Italics are a chorus a change of verse. Italics are a chorus
""" """
if self.italics != self.is_chorus and ((len(self.song.verses) > 0) or if self.italics != self.is_chorus and ((len(self.song.verses) > 0) or
(self.currentverse.count(u'\n') > 1)): (self.currentverse.count(u'\n') > 1)):
self.finish_verse() self.finish_verse()
if self.italics: if self.italics:
self.is_chorus = True self.is_chorus = True
self.currentverse += text + u'\n' self.currentverse += text + u'\n'
def finish_verse(self): def finish_verse(self):
""" """
Verse is finished, store it. Note in book 1+2, some songs are formatted Verse is finished, store it. Note in book 1+2, some songs are formatted
@ -383,18 +383,18 @@ class SofImport(object):
""" """
Get rid of some dodgy unicode and formatting characters we're not Get rid of some dodgy unicode and formatting characters we're not
interested in. Some can be converted to ascii. interested in. Some can be converted to ascii.
""" """
text = text.replace(u'\t', u' ') text = text.replace(u'\t', u' ')
text = text.replace(u'\r', u'\n') text = text.replace(u'\r', u'\n')
text = text.replace(u'\u2018', u'\'') text = text.replace(u'\u2018', u'\'')
text = text.replace(u'\u2019', u'\'') text = text.replace(u'\u2019', u'\'')
text = text.replace(u'\u201c', u'"') text = text.replace(u'\u201c', u'"')
text = text.replace(u'\u201d', u'"') text = text.replace(u'\u201d', u'"')
text = text.replace(u'\u2026', u'...') text = text.replace(u'\u2026', u'...')
text = text.replace(u'\u2013', u'-') text = text.replace(u'\u2013', u'-')
text = text.replace(u'\u2014', u'-') text = text.replace(u'\u2014', u'-')
return text return text
def uncap_text(self, text): def uncap_text(self, text):
""" """
Words in the title are in all capitals, so we lowercase them. Words in the title are in all capitals, so we lowercase them.
@ -403,128 +403,128 @@ class SofImport(object):
There is a complicated word "One", which is sometimes lower and There is a complicated word "One", which is sometimes lower and
sometimes upper depending on context. Never mind, keep it lower. sometimes upper depending on context. Never mind, keep it lower.
""" """
textarr = re.split(u'(\W+)', text) textarr = re.split(u'(\W+)', text)
textarr[0] = textarr[0].capitalize() textarr[0] = textarr[0].capitalize()
for i in range(1, len(textarr)): for i in range(1, len(textarr)):
# Do not translate these. Fixed strings in SOF song file # Do not translate these. Fixed strings in SOF song file
if textarr[i] in (u'JESUS', u'CHRIST', u'KING', u'ALMIGHTY', if textarr[i] in (u'JESUS', u'CHRIST', u'KING', u'ALMIGHTY',
u'REDEEMER', u'SHEPHERD', u'SON', u'GOD', u'LORD', u'FATHER', u'REDEEMER', u'SHEPHERD', u'SON', u'GOD', u'LORD', u'FATHER',
u'HOLY', u'SPIRIT', u'LAMB', u'YOU', u'YOUR', u'I', u'I\'VE', u'HOLY', u'SPIRIT', u'LAMB', u'YOU', u'YOUR', u'I', u'I\'VE',
u'I\'M', u'I\'LL', u'SAVIOUR', u'O', u'YOU\'RE', u'HE', u'HIS', u'I\'M', u'I\'LL', u'SAVIOUR', u'O', u'YOU\'RE', u'HE', u'HIS',
u'HIM', u'ZION', u'EMMANUEL', u'MAJESTY', u'JESUS\'', u'JIREH', u'HIM', u'ZION', u'EMMANUEL', u'MAJESTY', u'JESUS\'', u'JIREH',
u'JUDAH', u'LION', u'LORD\'S', u'ABRAHAM', u'GOD\'S', u'JUDAH', u'LION', u'LORD\'S', u'ABRAHAM', u'GOD\'S',
u'FATHER\'S', u'ELIJAH'): u'FATHER\'S', u'ELIJAH'):
textarr[i] = textarr[i].capitalize() textarr[i] = textarr[i].capitalize()
else: else:
textarr[i] = textarr[i].lower() textarr[i] = textarr[i].lower()
text = u''.join(textarr) text = u''.join(textarr)
return text return text
def verse_splits(self, song_number): def verse_splits(self, song_number):
""" """
Because someone at Kingsway forgot to check the 1+2 RTF file, Because someone at Kingsway forgot to check the 1+2 RTF file,
some verses were not formatted correctly. some verses were not formatted correctly.
""" """
if song_number == 11: return 8 if song_number == 11: return 8
if song_number == 18: return 5 if song_number == 18: return 5
if song_number == 21: return 6 if song_number == 21: return 6
if song_number == 23: return 4 if song_number == 23: return 4
if song_number == 24: return 7 if song_number == 24: return 7
if song_number == 27: return 4 if song_number == 27: return 4
if song_number == 31: return 6 if song_number == 31: return 6
if song_number == 49: return 4 if song_number == 49: return 4
if song_number == 50: return 8 if song_number == 50: return 8
if song_number == 70: return 4 if song_number == 70: return 4
if song_number == 75: return 8 if song_number == 75: return 8
if song_number == 79: return 6 if song_number == 79: return 6
if song_number == 97: return 7 if song_number == 97: return 7
if song_number == 107: return 4 if song_number == 107: return 4
if song_number == 109: return 4 if song_number == 109: return 4
if song_number == 133: return 4 if song_number == 133: return 4
if song_number == 155: return 10 if song_number == 155: return 10
if song_number == 156: return 8 if song_number == 156: return 8
if song_number == 171: return 4 if song_number == 171: return 4
if song_number == 188: return 7 if song_number == 188: return 7
if song_number == 192: return 4 if song_number == 192: return 4
if song_number == 208: return 8 if song_number == 208: return 8
if song_number == 215: return 8 if song_number == 215: return 8
if song_number == 220: return 4 if song_number == 220: return 4
if song_number == 247: return 6 if song_number == 247: return 6
if song_number == 248: return 6 if song_number == 248: return 6
if song_number == 251: return 8 if song_number == 251: return 8
if song_number == 295: return 8 if song_number == 295: return 8
if song_number == 307: return 5 if song_number == 307: return 5
if song_number == 314: return 6 if song_number == 314: return 6
if song_number == 325: return 8 if song_number == 325: return 8
if song_number == 386: return 6 if song_number == 386: return 6
if song_number == 415: return 4 if song_number == 415: return 4
if song_number == 426: return 4 if song_number == 426: return 4
if song_number == 434: return 5 if song_number == 434: return 5
if song_number == 437: return 4 if song_number == 437: return 4
if song_number == 438: return 6 if song_number == 438: return 6
if song_number == 456: return 8 if song_number == 456: return 8
if song_number == 461: return 4 if song_number == 461: return 4
if song_number == 469: return 4 if song_number == 469: return 4
if song_number == 470: return 5 if song_number == 470: return 5
if song_number == 476: return 6 if song_number == 476: return 6
if song_number == 477: return 7 if song_number == 477: return 7
if song_number == 480: return 8 if song_number == 480: return 8
if song_number == 482: return 4 if song_number == 482: return 4
if song_number == 512: return 4 if song_number == 512: return 4
if song_number == 513: return 8 if song_number == 513: return 8
if song_number == 518: return 5 if song_number == 518: return 5
if song_number == 520: return 4 if song_number == 520: return 4
if song_number == 523: return 6 if song_number == 523: return 6
if song_number == 526: return 8 if song_number == 526: return 8
if song_number == 527: return 4 if song_number == 527: return 4
if song_number == 529: return 4 if song_number == 529: return 4
if song_number == 537: return 4 if song_number == 537: return 4
if song_number == 555: return 6 if song_number == 555: return 6
if song_number == 581: return 4 if song_number == 581: return 4
if song_number == 589: return 6 if song_number == 589: return 6
if song_number == 590: return 4 if song_number == 590: return 4
if song_number == 593: return 8 if song_number == 593: return 8
if song_number == 596: return 4 if song_number == 596: return 4
if song_number == 610: return 6 if song_number == 610: return 6
if song_number == 611: return 6 if song_number == 611: return 6
if song_number == 619: return 8 if song_number == 619: return 8
if song_number == 645: return 5 if song_number == 645: return 5
if song_number == 653: return 6 if song_number == 653: return 6
if song_number == 683: return 7 if song_number == 683: return 7
if song_number == 686: return 4 if song_number == 686: return 4
if song_number == 697: return 8 if song_number == 697: return 8
if song_number == 698: return 4 if song_number == 698: return 4
if song_number == 704: return 6 if song_number == 704: return 6
if song_number == 716: return 4 if song_number == 716: return 4
if song_number == 717: return 6 if song_number == 717: return 6
if song_number == 730: return 4 if song_number == 730: return 4
if song_number == 731: return 8 if song_number == 731: return 8
if song_number == 732: return 8 if song_number == 732: return 8
if song_number == 738: return 4 if song_number == 738: return 4
if song_number == 756: return 9 if song_number == 756: return 9
if song_number == 815: return 6 if song_number == 815: return 6
if song_number == 830: return 8 if song_number == 830: return 8
if song_number == 831: return 4 if song_number == 831: return 4
if song_number == 876: return 6 if song_number == 876: return 6
if song_number == 877: return 6 if song_number == 877: return 6
if song_number == 892: return 4 if song_number == 892: return 4
if song_number == 894: return 6 if song_number == 894: return 6
if song_number == 902: return 8 if song_number == 902: return 8
if song_number == 905: return 8 if song_number == 905: return 8
if song_number == 921: return 6 if song_number == 921: return 6
if song_number == 940: return 7 if song_number == 940: return 7
if song_number == 955: return 9 if song_number == 955: return 9
if song_number == 968: return 8 if song_number == 968: return 8
if song_number == 972: return 7 if song_number == 972: return 7
if song_number == 974: return 4 if song_number == 974: return 4
if song_number == 988: return 6 if song_number == 988: return 6
if song_number == 991: return 5 if song_number == 991: return 5
if song_number == 1002: return 8 if song_number == 1002: return 8
if song_number == 1024: return 8 if song_number == 1024: return 8
if song_number == 1044: return 9 if song_number == 1044: return 9
if song_number == 1088: return 6 if song_number == 1088: return 6
if song_number == 1117: return 6 if song_number == 1117: return 6
if song_number == 1119: return 7 if song_number == 1119: return 7
return None return None