forked from openlp/openlp
367 lines
14 KiB
Python
367 lines
14 KiB
Python
# -*- coding: utf-8 -*-
|
|
# vim: autoindent shiftwidth=4 expandtab textwidth=80 tabstop=4 softtabstop=4
|
|
|
|
###############################################################################
|
|
# OpenLP - Open Source Lyrics Projection #
|
|
# --------------------------------------------------------------------------- #
|
|
# Copyright (c) 2008-2011 Raoul Snyman #
|
|
# Portions copyright (c) 2008-2011 Tim Bentley, Jonathan Corwin, Michael #
|
|
# Gorven, Scott Guerrieri, Meinert Jordan, Andreas Preikschat, Christian #
|
|
# Richter, Philip Ridout, Maikel Stuivenberg, Martin Thompson, Jon Tibble, #
|
|
# Carsten Tinggaard, Frode Woldsund #
|
|
# --------------------------------------------------------------------------- #
|
|
# This program is free software; you can redistribute it and/or modify it #
|
|
# under the terms of the GNU General Public License as published by the Free #
|
|
# Software Foundation; version 2 of the License. #
|
|
# #
|
|
# This program is distributed in the hope that it will be useful, but WITHOUT #
|
|
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or #
|
|
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for #
|
|
# more details. #
|
|
# #
|
|
# You should have received a copy of the GNU General Public License along #
|
|
# with this program; if not, write to the Free Software Foundation, Inc., 59 #
|
|
# Temple Place, Suite 330, Boston, MA 02111-1307 USA #
|
|
###############################################################################
|
|
|
|
import logging
|
|
import re
|
|
from PyQt4 import QtCore
|
|
|
|
from openlp.core.lib import Receiver, translate
|
|
from openlp.plugins.songs.lib import VerseType
|
|
from openlp.plugins.songs.lib.db import Song, Author, Topic, Book, MediaFile
|
|
from openlp.plugins.songs.lib.xml import SongXML
|
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
class SongImport(QtCore.QObject):
|
|
"""
|
|
Helper class for importing a song from a third party source into OpenLP
|
|
|
|
This class just takes the raw strings, and will work out for itself
|
|
whether the authors etc already exist and add them or refer to them
|
|
as necessary
|
|
"""
|
|
def __init__(self, manager):
    """
    Initialise and create defaults for properties

    ``manager``
        An instance of a SongManager, through which all database access is
        performed.
    """
    # A QObject subclass has to run the base class initialiser before the
    # instance is used with Qt; the bound method self.stop_import is handed
    # to a signal connection below.
    QtCore.QObject.__init__(self)
    self.manager = manager
    self.stop_import_flag = False
    self.set_defaults()
    # Ask to be told when the 'openlp_stop_wizard' signal is emitted so
    # that stop_import() can raise the stop flag.
    QtCore.QObject.connect(Receiver.get_receiver(),
        QtCore.SIGNAL(u'openlp_stop_wizard'), self.stop_import)
|
|
|
|
def set_defaults(self):
    """
    Reset every per-song property to its empty starting value. Call this
    before each song when importing many songs at once so that each song
    starts from a clean state.
    """
    # Plain text properties all start as an empty unicode string.
    for text_property in ('title', 'song_number', 'alternate_title',
        'copyright', 'comments', 'theme_name', 'ccli_number',
        'song_book_name', 'song_book_pub'):
        setattr(self, text_property, u'')
    # Every list property gets its own fresh list object.
    for list_property in ('authors', 'topics', 'media_files',
        'verse_order_list', 'verses'):
        setattr(self, list_property, [])
    # Highest verse number seen so far, keyed by the tag's first letter.
    self.versecounts = {}
    # Translated markers that process_verse_text() searches for in order
    # to recognise copyright lines.
    self.copyright_string = unicode(translate(
        'SongsPlugin.SongImport', 'copyright'))
    self.copyright_symbol = unicode(translate(
        'SongsPlugin.SongImport', '\xa9'))
|
|
|
|
def stop_import(self):
    """
    Raise the flag that tells importers to stop their import. This method
    is the slot connected to the 'openlp_stop_wizard' signal in __init__.
    """
    self.stop_import_flag = True
    log.debug(u'Stopping songs import')
|
|
|
|
def register(self, import_wizard):
    """
    Remember the import wizard this importer belongs to.

    ``import_wizard``
        The wizard object; it is stored unchanged on ``self.import_wizard``.
    """
    self.import_wizard = import_wizard
|
|
|
|
@staticmethod
def process_songs_text(manager, text):
    """
    Parse a text that may hold several songs separated by form feeds.

    The text is tidied with tidy_text() and split at form feeds. Each
    non-blank piece is fed to the current SongImport; once that object
    passes check_complete() it is collected and a new one is started, so
    pieces accumulate until a song is complete.

    ``manager``
        Passed unchanged to every SongImport that is created.

    ``text``
        The raw text to parse.

    Returns the list of completed SongImport objects.
    """
    completed = []
    pieces = SongImport.tidy_text(text).split(u'\f')
    current = SongImport(manager)
    for piece in pieces:
        piece = piece.strip()
        if not piece:
            continue
        current.process_song_text(piece)
        if current.check_complete():
            completed.append(current)
            current = SongImport(manager)
    # Pick up a trailing song that only became complete at the very end.
    if current.check_complete():
        completed.append(current)
    return completed
|
|
|
|
@staticmethod
def tidy_text(text):
    """
    Replace typographic unicode characters by plain equivalents and
    normalise the white space of ``text``. The tidied text is returned.
    """
    # Curly quotes, ellipsis and en/em dashes become their plain forms.
    plain_equivalents = (
        (u'\u2018', u'\''),
        (u'\u2019', u'\''),
        (u'\u201c', u'"'),
        (u'\u201d', u'"'),
        (u'\u2026', u'...'),
        (u'\u2013', u'-'),
        (u'\u2014', u'-'),
    )
    for fancy, plain in plain_equivalents:
        text = text.replace(fancy, plain)
    # Applied in this order:
    # 1. runs of spaces, tabs and vertical tabs collapse to one space,
    # 2. any line ending becomes '\n', dropping one space on either side,
    # 3. five newlines or any run of form feeds become one form feed.
    whitespace_rules = (
        (r'[ \t\v]+', u' '),
        (r' ?(\r\n?|\n) ?', u'\n'),
        (r' ?(\n{5}|\f)+ ?', u'\f'),
    )
    for pattern, replacement in whitespace_rules:
        text = re.sub(pattern, replacement, text)
    return text
|
|
|
|
def process_song_text(self, text):
    """
    Split the text of one song at blank lines and pass every non-empty
    block, stripped of surrounding white space, to process_verse_text().
    """
    for block in text.split(u'\n\n'):
        block = block.strip()
        if block != u'':
            self.process_verse_text(block)
|
|
|
|
def process_verse_text(self, text):
    """
    Work out what one block of text is and store it accordingly.

    * A block containing the copyright word or symbol: lines before the
      first copyright line are parsed as authors, that line and all lines
      after it are added to the copyright.
    * A block of a single line is parsed as authors.
    * Anything else is a verse; its first line becomes the title if no
      title has been set yet.
    """
    lines = text.split(u'\n')
    lowered = text.lower()
    if self.copyright_string in lowered or self.copyright_symbol in lowered:
        in_copyright = False
        for line in lines:
            if not in_copyright:
                # Once the first copyright line is seen, the rest of the
                # block is copyright text too.
                lowered_line = line.lower()
                in_copyright = (self.copyright_string in lowered_line or
                    self.copyright_symbol in lowered_line)
            if in_copyright:
                self.add_copyright(line)
            else:
                self.parse_author(line)
        return
    if len(lines) == 1:
        self.parse_author(lines[0])
        return
    if not self.title:
        self.title = lines[0]
    self.add_verse(text)
|
|
|
|
def add_copyright(self, copyright):
    """
    Append ``copyright`` to the copyright field, separated by a space from
    what is already there. Text that already occurs in the field is not
    added again.
    """
    if copyright in self.copyright:
        return
    so_far = self.copyright
    if so_far != u'':
        so_far = so_far + ' '
    self.copyright = so_far + copyright
|
|
|
|
def parse_author(self, text):
    """
    Add the authors named in ``text``. OpenLP stores authors individually,
    so the text is split at commas and then at '&'. A name without a space
    that is followed by another name in the same '&' group borrows that
    name's last word, so 'Mr & Mrs Smith' yields 'Mr Smith' and
    'Mrs Smith'. One trailing full stop is removed and empty names are
    skipped.
    """
    for group in text.split(u','):
        names = [name.strip() for name in group.split(u'&')]
        last_position = len(names) - 1
        for position, name in enumerate(names):
            if u' ' not in name and position < last_position:
                surname = names[position + 1].split(u' ')[-1]
                name = name + u' ' + surname
            if name.endswith(u'.'):
                name = name[:-1]
            if name:
                self.add_author(name)
|
|
|
|
def add_author(self, author):
    """
    Add an author to the list unless it is already in there.
    """
    if author not in self.authors:
        self.authors.append(author)
|
|
|
|
def add_media_file(self, filename):
    """
    Add a media file to the list unless it is already in there.
    """
    if filename not in self.media_files:
        self.media_files.append(filename)
|
|
|
|
def add_verse(self, versetext, versetag=u'V', lang=None):
    """
    Add a verse. This is the whole verse, lines split by \\n. It will also
    attempt to detect duplicates. In this case it will just add to the verse
    order.

    ``versetext``
        The text of the verse.

    ``versetag``
        The verse tag can be V1/C1/B etc, or 'V' and 'C' (will count the
        verses/choruses itself) or None (or empty), where it will assume
        verse.

    ``lang``
        The language code (ISO-639) of the verse, for example *en* or *de*.
    """
    # A missing tag means "verse"; without this, indexing the tag below
    # would fail for None and for the empty string.
    if not versetag:
        versetag = u'V'
    # A verse whose text is already stored is only repeated in the order.
    wanted = versetext.strip()
    for (oldversetag, oldverse, oldlang) in self.verses:
        if oldverse.strip() == wanted:
            self.verse_order_list.append(oldversetag)
            return
    # versecounts is keyed by the first letter of the tag.
    kind = versetag[0]
    self.versecounts[kind] = self.versecounts.get(kind, 0) + 1
    if len(versetag) == 1:
        # Bare tag: number it with the running count for this kind.
        versetag += u'%d' % self.versecounts[kind]
    elif int(versetag[1:]) > self.versecounts[kind]:
        # Explicit number ahead of the count: let the count catch up.
        self.versecounts[kind] = int(versetag[1:])
    self.verses.append([versetag, versetext.rstrip(), lang])
    self.verse_order_list.append(versetag)
    # Once chorus C1 is in the order, it is repeated after every new verse.
    if versetag.startswith(u'V') and u'C1' in self.verse_order_list:
        self.verse_order_list.append(u'C1')
|
|
|
|
def repeat_verse(self):
    """
    Repeat the previous verse in the verse order. Nothing happens when the
    verse order is still empty, as there is no previous verse to repeat.
    """
    if self.verse_order_list:
        self.verse_order_list.append(self.verse_order_list[-1])
|
|
|
|
def check_complete(self):
    """
    Tell whether the mandatory fields are entered: returns True when there
    is a title and at least one verse, otherwise False. The author is not
    checked here; finish() adds "Author unknown" when there is none.
    """
    return not (self.title == u'' or len(self.verses) == 0)
|
|
|
|
def remove_punctuation(self, text):
    """
    Extracts alphanumeric words for searchable fields: every run of
    non-word characters in ``text`` is replaced by a single space and the
    result is returned.
    """
    # The flag must go to the pattern. The fourth positional argument of
    # re.sub() is the replacement count, so passing re.UNICODE there limits
    # the number of substitutions and leaves the flag unset.
    return re.compile(r'\W+', re.UNICODE).sub(u' ', text)
|
|
|
|
def finish(self):
    """
    All fields have been set to this song. Write the song to disk.

    Builds a Song from the collected properties, looks up authors, song
    book and topics through the manager (creating the ones that are not
    found), saves the song and finally resets this object with
    set_defaults() so it is ready for the next song.
    """
    if not self.authors:
        self.authors.append(unicode(translate('SongsPlugin.SongImport',
            'Author unknown')))
    log.info(u'commiting song %s to database', self.title)
    song = Song()
    song.title = self.title
    song.alternate_title = self.alternate_title
    song.search_title = self.remove_punctuation(self.title).lower() \
        + '@' + self.remove_punctuation(self.alternate_title).lower()
    song.song_number = self.song_number
    # Verse types recognised by the first letter of the verse tag. Any
    # other letter is stored as type "Other" and renumbered O1, O2, ...
    known_types = {
        u'C': VerseType.Chorus,
        u'V': VerseType.Verse,
        u'B': VerseType.Bridge,
        u'I': VerseType.Intro,
        u'P': VerseType.PreChorus,
        u'E': VerseType.Ending,
    }
    verses_changed_to_other = {}
    sxml = SongXML()
    other_count = 1
    search_parts = []
    for (versetag, versetext, lang) in self.verses:
        if versetag[0] in known_types:
            versetype = VerseType.to_string(known_types[versetag[0]])
        else:
            newversetag = u'O%d' % other_count
            verses_changed_to_other[versetag] = newversetag
            other_count += 1
            versetype = VerseType.to_string(VerseType.Other)
            log.info(u'Versetype %s changing to %s' , versetag, newversetag)
            versetag = newversetag
        sxml.add_verse_to_lyrics(versetype, versetag[1:], versetext, lang)
        search_parts.append(u' ' + self.remove_punctuation(versetext))
    song.search_lyrics = u''.join(search_parts).lower()
    song.lyrics = unicode(sxml.extract_xml(), u'utf-8')
    # Use the new tags of renamed verses in the verse order as well.
    for i, current_verse_tag in enumerate(self.verse_order_list):
        if current_verse_tag in verses_changed_to_other:
            self.verse_order_list[i] = \
                verses_changed_to_other[current_verse_tag]
    song.verse_order = u' '.join(self.verse_order_list)
    song.copyright = self.copyright
    song.comments = self.comments
    song.theme_name = self.theme_name
    song.ccli_number = self.ccli_number
    for authortext in self.authors:
        author = self.manager.get_object_filtered(Author,
            Author.display_name == authortext)
        if not author:
            # The last word is taken as last name, the rest as first name.
            name_parts = authortext.split(u' ')
            author = Author.populate(display_name=authortext,
                last_name=name_parts[-1],
                first_name=u' '.join(name_parts[:-1]))
        song.authors.append(author)
    for filename in self.media_files:
        media_file = self.manager.get_object_filtered(MediaFile,
            MediaFile.file_name == filename)
        # NOTE(review): a media file that is found is not attached to the
        # song, only new ones are - confirm this is intended.
        if not media_file:
            song.media_files.append(MediaFile.populate(file_name=filename))
    if self.song_book_name:
        song_book = self.manager.get_object_filtered(Book,
            Book.name == self.song_book_name)
        if song_book is None:
            song_book = Book.populate(name=self.song_book_name,
                publisher=self.song_book_pub)
        song.book = song_book
    for topictext in self.topics:
        if len(topictext) == 0:
            continue
        topic = self.manager.get_object_filtered(Topic,
            Topic.name == topictext)
        if topic is None:
            topic = Topic.populate(name=topictext)
        song.topics.append(topic)
    self.manager.save_object(song)
    self.set_defaults()
|
|
|
|
def print_song(self):
    """
    For debugging: print the collected song properties to standard output.
    Title, alternate title, verses, verse order and authors are always
    printed; the other properties only when they are set.
    """
    def print_if_set(label, value):
        # Skip properties that are still empty.
        if value:
            print(label + value)

    print(u'========================================'
        + u'========================================')
    print(u'TITLE: ' + self.title)
    print(u'ALT TITLE: ' + self.alternate_title)
    for (versetag, versetext, lang) in self.verses:
        print(u'VERSE ' + versetag + u': ' + versetext)
    print(u'ORDER: ' + u' '.join(self.verse_order_list))
    for author in self.authors:
        print(u'AUTHOR: ' + author)
    print_if_set(u'COPYRIGHT: ', self.copyright)
    print_if_set(u'BOOK: ', self.song_book_name)
    print_if_set(u'BOOK PUBLISHER: ', self.song_book_pub)
    print_if_set(u'NUMBER: ', self.song_number)
    for topictext in self.topics:
        print(u'TOPIC: ' + topictext)
    print_if_set(u'COMMENTS: ', self.comments)
    print_if_set(u'THEME: ', self.theme_name)
    print_if_set(u'CCLI: ', self.ccli_number)
|