openlp/openlp/plugins/songs/lib/__init__.py

# -*- coding: utf-8 -*-
# vim: autoindent shiftwidth=4 expandtab textwidth=120 tabstop=4 softtabstop=4

###############################################################################
# OpenLP - Open Source Lyrics Projection                                      #
# --------------------------------------------------------------------------- #
# Copyright (c) 2008-2013 Raoul Snyman                                        #
# Portions copyright (c) 2008-2013 Tim Bentley, Gerald Britton, Jonathan      #
# Corwin, Samuel Findlay, Michael Gorven, Scott Guerrieri, Matthias Hub,      #
# Meinert Jordan, Armin Köhler, Erik Lundin, Edwin Lunando, Brian T. Meyer.   #
# Joshua Miller, Stevan Pettit, Andreas Preikschat, Mattias Põldaru,          #
# Christian Richter, Philip Ridout, Simon Scudder, Jeffrey Smith,             #
# Maikel Stuivenberg, Martin Thompson, Jon Tibble, Dave Warnock,              #
# Frode Woldsund, Martin Zibricky, Patrick Zimmermann                         #
# --------------------------------------------------------------------------- #
# This program is free software; you can redistribute it and/or modify it     #
# under the terms of the GNU General Public License as published by the Free  #
# Software Foundation; version 2 of the License.                              #
#                                                                             #
# This program is distributed in the hope that it will be useful, but WITHOUT #
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or       #
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for    #
# more details.                                                               #
#                                                                             #
# You should have received a copy of the GNU General Public License along     #
# with this program; if not, write to the Free Software Foundation, Inc., 59  #
# Temple Place, Suite 330, Boston, MA 02111-1307 USA                          #
###############################################################################
import re

from PyQt4 import QtGui

from openlp.core.lib import translate
from openlp.core.utils import CONTROL_CHARS, locale_direct_compare
from db import Author
from ui import SongStrings

WHITESPACE = re.compile(r'[\W_]+', re.UNICODE)
APOSTROPHE = re.compile(u'[\'`’ʻ′]', re.UNICODE)
PATTERN = re.compile(r"\\([a-z]{1,32})(-?\d{1,10})?[ ]?|\\'"
    r"([0-9a-f]{2})|\\([^a-z])|([{}])|[\r\n]+|(.)", re.I)
# RTF control words which specify a "destination" to be ignored.
DESTINATIONS = frozenset((
    u'aftncn', u'aftnsep', u'aftnsepc', u'annotation', u'atnauthor',
    u'atndate', u'atnicn', u'atnid', u'atnparent', u'atnref', u'atntime',
    u'atrfend', u'atrfstart', u'author', u'background', u'bkmkend',
    u'bkmkstart', u'blipuid', u'buptim', u'category',
    u'colorschememapping', u'colortbl', u'comment', u'company', u'creatim',
    u'datafield', u'datastore', u'defchp', u'defpap', u'do', u'doccomm',
    u'docvar', u'dptxbxtext', u'ebcend', u'ebcstart', u'factoidname',
    u'falt', u'fchars', u'ffdeftext', u'ffentrymcr', u'ffexitmcr',
    u'ffformat', u'ffhelptext', u'ffl', u'ffname', u'ffstattext', u'field',
    u'file', u'filetbl', u'fldinst', u'fldrslt', u'fldtype', u'fname',
    u'fontemb', u'fontfile', u'footer', u'footerf', u'footerl', u'footerr',
    u'footnote', u'formfield', u'ftncn', u'ftnsep', u'ftnsepc', u'g',
    u'generator', u'gridtbl', u'header', u'headerf', u'headerl',
    u'headerr', u'hl', u'hlfr', u'hlinkbase', u'hlloc', u'hlsrc', u'hsv',
    u'htmltag', u'info', u'keycode', u'keywords', u'latentstyles',
    u'lchars', u'levelnumbers', u'leveltext', u'lfolevel', u'linkval',
    u'list', u'listlevel', u'listname', u'listoverride',
    u'listoverridetable', u'listpicture', u'liststylename', u'listtable',
    u'listtext', u'lsdlockedexcept', u'macc', u'maccPr', u'mailmerge',
    u'maln', u'malnScr', u'manager', u'margPr', u'mbar', u'mbarPr',
    u'mbaseJc', u'mbegChr', u'mborderBox', u'mborderBoxPr', u'mbox',
    u'mboxPr', u'mchr', u'mcount', u'mctrlPr', u'md', u'mdeg', u'mdegHide',
    u'mden', u'mdiff', u'mdPr', u'me', u'mendChr', u'meqArr', u'meqArrPr',
    u'mf', u'mfName', u'mfPr', u'mfunc', u'mfuncPr', u'mgroupChr',
    u'mgroupChrPr', u'mgrow', u'mhideBot', u'mhideLeft', u'mhideRight',
    u'mhideTop', u'mhtmltag', u'mlim', u'mlimloc', u'mlimlow',
    u'mlimlowPr', u'mlimupp', u'mlimuppPr', u'mm', u'mmaddfieldname',
    u'mmath', u'mmathPict', u'mmathPr', u'mmaxdist', u'mmc', u'mmcJc',
    u'mmconnectstr', u'mmconnectstrdata', u'mmcPr', u'mmcs',
    u'mmdatasource', u'mmheadersource', u'mmmailsubject', u'mmodso',
    u'mmodsofilter', u'mmodsofldmpdata', u'mmodsomappedname',
    u'mmodsoname', u'mmodsorecipdata', u'mmodsosort', u'mmodsosrc',
    u'mmodsotable', u'mmodsoudl', u'mmodsoudldata', u'mmodsouniquetag',
    u'mmPr', u'mmquery', u'mmr', u'mnary', u'mnaryPr', u'mnoBreak',
    u'mnum', u'mobjDist', u'moMath', u'moMathPara', u'moMathParaPr',
    u'mopEmu', u'mphant', u'mphantPr', u'mplcHide', u'mpos', u'mr',
    u'mrad', u'mradPr', u'mrPr', u'msepChr', u'mshow', u'mshp', u'msPre',
    u'msPrePr', u'msSub', u'msSubPr', u'msSubSup', u'msSubSupPr', u'msSup',
    u'msSupPr', u'mstrikeBLTR', u'mstrikeH', u'mstrikeTLBR', u'mstrikeV',
    u'msub', u'msubHide', u'msup', u'msupHide', u'mtransp', u'mtype',
    u'mvertJc', u'mvfmf', u'mvfml', u'mvtof', u'mvtol', u'mzeroAsc',
    u'mzFrodesc', u'mzeroWid', u'nesttableprops', u'nextfile',
    u'nonesttables', u'objalias', u'objclass', u'objdata', u'object',
    u'objname', u'objsect', u'objtime', u'oldcprops', u'oldpprops',
    u'oldsprops', u'oldtprops', u'oleclsid', u'operator', u'panose',
    u'password', u'passwordhash', u'pgp', u'pgptbl', u'picprop', u'pict',
    u'pn', u'pnseclvl', u'pntext', u'pntxta', u'pntxtb', u'printim',
    u'private', u'propname', u'protend', u'protstart', u'protusertbl',
    u'pxe', u'result', u'revtbl', u'revtim', u'rsidtbl', u'rxe', u'shp',
    u'shpgrp', u'shpinst', u'shppict', u'shprslt', u'shptxt', u'sn', u'sp',
    u'staticval', u'stylesheet', u'subject', u'sv', u'svb', u'tc',
    u'template', u'themedata', u'title', u'txe', u'ud', u'upr',
    u'userprops', u'wgrffmtfilter', u'windowcaption', u'writereservation',
    u'writereservhash', u'xe', u'xform', u'xmlattrname', u'xmlattrvalue',
    u'xmlclose', u'xmlname', u'xmlnstbl', u'xmlopen'))
# Translation of some special characters.
SPECIAL_CHARS = {
    u'par': u'\n',
    u'sect': u'\n\n',
    # Required page and column break.
    # Would be good if we could split verse into subverses here.
    u'page': u'\n\n',
    u'column': u'\n\n',
    # Soft breaks.
    u'softpage': u'[---]',
    u'softcol': u'[---]',
    u'line': u'\n',
    u'tab': u'\t',
    u'emdash': u'\u2014',
    u'endash': u'\u2013',
    u'emspace': u'\u2003',
    u'enspace': u'\u2002',
    u'qmspace': u'\u2005',
    u'bullet': u'\u2022',
    u'lquote': u'\u2018',
    u'rquote': u'\u2019',
    u'ldblquote': u'\u201C',
    u'rdblquote': u'\u201D',
    u'ltrmark': u'\u200E',
    u'rtlmark': u'\u200F',
    u'zwj': u'\u200D',
    u'zwnj': u'\u200C'}
CHARSET_MAPPING = {
    u'fcharset0': u'cp1252',
    u'fcharset161': u'cp1253',
    u'fcharset162': u'cp1254',
    u'fcharset163': u'cp1258',
    u'fcharset177': u'cp1255',
    u'fcharset178': u'cp1256',
    u'fcharset186': u'cp1257',
    u'fcharset204': u'cp1251',
    u'fcharset222': u'cp874',
    u'fcharset238': u'cp1250'}


class VerseType(object):
    """
    VerseType provides an enumeration for the tags that may be associated
    with verses in songs.
    """
    Verse = 0
    Chorus = 1
    Bridge = 2
    PreChorus = 3
    Intro = 4
    Ending = 5
    Other = 6

    Names = [
        u'Verse',
        u'Chorus',
        u'Bridge',
        u'Pre-Chorus',
        u'Intro',
        u'Ending',
        u'Other']
    Tags = [name[0].lower() for name in Names]

    TranslatedNames = [
        translate('SongsPlugin.VerseType', 'Verse'),
        translate('SongsPlugin.VerseType', 'Chorus'),
        translate('SongsPlugin.VerseType', 'Bridge'),
        translate('SongsPlugin.VerseType', 'Pre-Chorus'),
        translate('SongsPlugin.VerseType', 'Intro'),
        translate('SongsPlugin.VerseType', 'Ending'),
        translate('SongsPlugin.VerseType', 'Other')]
    TranslatedTags = [name[0].lower() for name in TranslatedNames]

    @staticmethod
    def translated_tag(verse_tag, default=Other):
        """
        Return the translated UPPERCASE tag for a given tag,
        used to show translated verse tags in UI

        ``verse_tag``
            The string to return a VerseType for

        ``default``
            Default return value if no matching tag is found
        """
        verse_tag = verse_tag[0].lower()
        for num, tag in enumerate(VerseType.Tags):
            if verse_tag == tag:
                return VerseType.TranslatedTags[num].upper()
        if default in VerseType.TranslatedTags:
            return VerseType.TranslatedTags[default].upper()

    @staticmethod
    def translated_name(verse_tag, default=Other):
        """
        Return the translated name for a given tag

        ``verse_tag``
            The string to return a VerseType for

        ``default``
            Default return value if no matching tag is found
        """
        verse_tag = verse_tag[0].lower()
        for num, tag in enumerate(VerseType.Tags):
            if verse_tag == tag:
                return VerseType.TranslatedNames[num]
        if default in VerseType.TranslatedNames:
            return VerseType.TranslatedNames[default]

    @staticmethod
    def from_tag(verse_tag, default=Other):
        """
        Return the VerseType for a given tag

        ``verse_tag``
            The string to return a VerseType for

        ``default``
            Default return value if no matching tag is found
        """
        verse_tag = verse_tag[0].lower()
        for num, tag in enumerate(VerseType.Tags):
            if verse_tag == tag:
                return num
        return default

    @staticmethod
    def from_translated_tag(verse_tag, default=Other):
        """
        Return the VerseType for a given tag

        ``verse_tag``
            The string to return a VerseType for

        ``default``
            Default return value if no matching tag is found
        """
        verse_tag = verse_tag[0].lower()
        for num, tag in enumerate(VerseType.TranslatedTags):
            if verse_tag == tag:
                return num
        return default

    @staticmethod
    def from_string(verse_name, default=Other):
        """
        Return the VerseType for a given string

        ``verse_name``
            The string to return a VerseType for

        ``default``
            Default return value if no matching tag is found
        """
        verse_name = verse_name.lower()
        for num, name in enumerate(VerseType.Names):
            if verse_name == name.lower():
                return num
        return default

    @staticmethod
    def from_translated_string(verse_name):
        """
        Return the VerseType for a given string

        ``verse_name``
            The string to return a VerseType for
        """
        verse_name = verse_name.lower()
        for num, translation in enumerate(VerseType.TranslatedNames):
            if verse_name == translation.lower():
                return num

    @staticmethod
    def from_loose_input(verse_name, default=Other):
        """
        Return the VerseType for a given string

        ``verse_name``
            The string to return a VerseType for

        ``default``
            Default return value if no matching tag is found
        """
        if len(verse_name) > 1:
            verse_index = VerseType.from_translated_string(verse_name)
            if verse_index is None:
                verse_index = VerseType.from_string(verse_name, default)
        elif len(verse_name) == 1:
            verse_index = VerseType.from_translated_tag(verse_name, None)
            if verse_index is None:
                verse_index = VerseType.from_tag(verse_name, default)
        else:
            return default
        return verse_index


def retrieve_windows_encoding(recommendation=None):
    """
    Determines which encoding to use on an information source. The process uses
    both automated detection, which is passed to this method as a
    recommendation, and user confirmation to return an encoding.

    ``recommendation``
        A recommended encoding discovered programmatically for the user to
        confirm.
    """
    # map chardet result to compatible windows standard code page
    codepage_mapping = {'IBM866': u'cp866', 'TIS-620': u'cp874',
        'SHIFT_JIS': u'cp932', 'GB2312': u'cp936', 'HZ-GB-2312': u'cp936',
        'EUC-KR': u'cp949', 'Big5': u'cp950', 'ISO-8859-2': u'cp1250',
        'windows-1250': u'cp1250', 'windows-1251': u'cp1251',
        'windows-1252': u'cp1252', 'ISO-8859-7': u'cp1253',
        'windows-1253': u'cp1253', 'ISO-8859-8': u'cp1255',
        'windows-1255': u'cp1255'}
    if recommendation in codepage_mapping:
        recommendation = codepage_mapping[recommendation]

    # Show dialog for encoding selection
    encodings = [(u'cp1256', translate('SongsPlugin', 'Arabic (CP-1256)')),
        (u'cp1257', translate('SongsPlugin', 'Baltic (CP-1257)')),
        (u'cp1250', translate('SongsPlugin', 'Central European (CP-1250)')),
        (u'cp1251', translate('SongsPlugin', 'Cyrillic (CP-1251)')),
        (u'cp1253', translate('SongsPlugin', 'Greek (CP-1253)')),
        (u'cp1255', translate('SongsPlugin', 'Hebrew (CP-1255)')),
        (u'cp932', translate('SongsPlugin', 'Japanese (CP-932)')),
        (u'cp949', translate('SongsPlugin', 'Korean (CP-949)')),
        (u'cp936', translate('SongsPlugin', 'Simplified Chinese (CP-936)')),
        (u'cp874', translate('SongsPlugin', 'Thai (CP-874)')),
        (u'cp950', translate('SongsPlugin', 'Traditional Chinese (CP-950)')),
        (u'cp1254', translate('SongsPlugin', 'Turkish (CP-1254)')),
        (u'cp1258', translate('SongsPlugin', 'Vietnam (CP-1258)')),
        (u'cp1252', translate('SongsPlugin', 'Western European (CP-1252)'))]
    recommended_index = -1
    if recommendation:
        for index in range(len(encodings)):
            if recommendation == encodings[index][0]:
                recommended_index = index
                break
    if recommended_index > 0:
        choice = QtGui.QInputDialog.getItem(None,
            translate('SongsPlugin', 'Character Encoding'),
            translate('SongsPlugin', 'The codepage setting is responsible\n'
                'for the correct character representation.\nUsually you are fine with the preselected choice.'),
            [pair[1] for pair in encodings], recommended_index, False)
    else:
        choice = QtGui.QInputDialog.getItem(None,
            translate('SongsPlugin', 'Character Encoding'),
            translate('SongsPlugin', 'Please choose the character encoding.\n'
                'The encoding is responsible for the correct character representation.'),
                [pair[1] for pair in encodings], 0, False)
    if not choice[1]:
        return None
    return filter(lambda item: item[1] == choice[0], encodings)[0][0]


def clean_string(string):
    """
    Strips punctuation from the passed string to assist searching
    """
    return WHITESPACE.sub(u' ', APOSTROPHE.sub(u'', string)).lower()


def clean_title(title):
    """
    Cleans the song title by removing Unicode control chars groups C0 & C1,
    as well as any trailing spaces
    """
    return CONTROL_CHARS.sub(u'', title).rstrip()


def clean_song(manager, song):
    """
    Cleans the search title, rebuilds the search lyrics, adds a default author
    if the song does not have one and other clean ups. This should always
    called when a new song is added or changed.

    ``manager``
        The song's manager.

    ``song``
        The song object.
    """
    if isinstance(song.title, buffer):
        song.title = unicode(song.title)
    if isinstance(song.alternate_title, buffer):
        song.alternate_title = unicode(song.alternate_title)
    if isinstance(song.lyrics, buffer):
        song.lyrics = unicode(song.lyrics)
    if song.title:
        song.title = clean_title(song.title)
    else:
        song.title = u''
    if song.alternate_title:
        song.alternate_title = clean_title(song.alternate_title)
    else:
        song.alternate_title = u''
    song.search_title = clean_string(song.title) + u'@' + clean_string(song.alternate_title)
    # Only do this, if we the song is a 1.9.4 song (or older).
    if song.lyrics.find(u'<lyrics language="en">') != -1:
        # Remove the old "language" attribute from lyrics tag (prior to 1.9.5).
        # This is not very important, but this keeps the database clean. This
        # can be removed when everybody has cleaned his songs.
        song.lyrics = song.lyrics.replace(u'<lyrics language="en">', u'<lyrics>')
        verses = SongXML().get_verses(song.lyrics)
        song.search_lyrics = u' '.join([clean_string(verse[1])
            for verse in verses])
        # We need a new and clean SongXML instance.
        sxml = SongXML()
        # Rebuild the song's verses, to remove any wrong verse names (for
        # example translated ones), which might have been added prior to 1.9.5.
        # List for later comparison.
        compare_order = []
        for verse in verses:
            verse_type = VerseType.Tags[VerseType.from_loose_input(verse[0][u'type'])]
            sxml.add_verse_to_lyrics(
                verse_type,
                verse[0][u'label'],
                verse[1],
                verse[0].get(u'lang')
            )
            compare_order.append((u'%s%s' % (verse_type, verse[0][u'label'])).upper())
            if verse[0][u'label'] == u'1':
                compare_order.append(verse_type.upper())
        song.lyrics = unicode(sxml.extract_xml(), u'utf-8')
        # Rebuild the verse order, to convert translated verse tags, which might
        # have been added prior to 1.9.5.
        if song.verse_order:
            order = CONTROL_CHARS.sub(u'', song.verse_order).strip().split()
        else:
            order = []
        new_order = []
        for verse_def in order:
            verse_type = VerseType.Tags[
                VerseType.from_loose_input(verse_def[0])]
            if len(verse_def) > 1:
                new_order.append((u'%s%s' % (verse_type, verse_def[1:])).upper())
            else:
                new_order.append(verse_type.upper())
        song.verse_order = u' '.join(new_order)
        # Check if the verse order contains tags for verses which do not exist.
        for order in new_order:
            if order not in compare_order:
                song.verse_order = u''
                break
    else:
        verses = SongXML().get_verses(song.lyrics)
        song.search_lyrics = u' '.join([clean_string(verse[1])
            for verse in verses])

    # The song does not have any author, add one.
    if not song.authors:
        name = SongStrings.AuthorUnknown
        author = manager.get_object_filtered(Author, Author.display_name == name)
        if author is None:
            author = Author.populate(display_name=name, last_name=u'', first_name=u'')
        song.authors.append(author)
    if song.copyright:
        song.copyright = CONTROL_CHARS.sub(u'', song.copyright).strip()


def get_encoding(font, font_table, default_encoding, failed=False):
    """
    Finds an encoding to use. Asks user, if necessary.

    ``font``
    The number of currently active font.

    ``font_table``
    Dictionary of fonts and respective encodings.

    ``default_encoding``
    The default encoding to use when font_table is empty or no font is used.

    ``failed``
    A boolean indicating whether the previous encoding didn't work.
    """
    encoding = None
    if font in font_table:
        encoding = font_table[font]
    if not encoding and default_encoding:
        encoding = default_encoding
    if not encoding or failed:
        encoding = retrieve_windows_encoding()
        default_encoding = encoding
    font_table[font] = encoding
    return encoding, default_encoding


def strip_rtf(text, default_encoding=None):
    """
    This function strips RTF control structures and returns an unicode string.

    Thanks to Markus Jarderot (MizardX) for this code, used by permission.
    http://stackoverflow.com/questions/188545

    ``text``
    RTF-encoded text, a string.

    ``default_encoding``
    Default encoding to use when no encoding is specified.
    """
    # Current font is the font tag we last met.
    font = u''
    # Character encoding is defined inside fonttable.
    # font_table could contain eg u'0': u'cp1252'
    font_table = {u'': u''}
    # Stack of things to keep track of when entering/leaving groups.
    stack = []
    # Whether this group (and all inside it) are "ignorable".
    ignorable = False
    # Number of ASCII characters to skip after an unicode character.
    ucskip = 1
    # Number of ASCII characters left to skip.
    curskip = 0
    # Output buffer.
    out = []
    for match in PATTERN.finditer(text):
        word, arg, hex, char, brace, tchar = match.groups()
        if brace:
            curskip = 0
            if brace == u'{':
                # Push state
                stack.append((ucskip, ignorable, font))
            elif brace == u'}':
                # Pop state
                ucskip, ignorable, font = stack.pop()
        # \x (not a letter)
        elif char:
            curskip = 0
            if char == u'~' and not ignorable:
                out.append(u'\xA0')
            elif char in u'{}\\' and not ignorable:
                out.append(char)
            elif char == u'-' and not ignorable:
                out.append(u'\u00AD')
            elif char == u'_' and not ignorable:
                out.append(u'\u2011')
            elif char == u'*':
                ignorable = True
        # \command
        elif word:
            curskip = 0
            if word in DESTINATIONS:
                ignorable = True
            elif word in SPECIAL_CHARS:
                out.append(SPECIAL_CHARS[word])
            elif word == u'uc':
                ucskip = int(arg)
            elif word == u' ':
                c = int(arg)
                if c < 0:
                    c += 0x10000
                out.append(unichr(c))
                curskip = ucskip
            elif word == u'fonttbl':
                ignorable = True
            elif word == u'f':
                font = arg
            elif word == u'ansicpg':
                font_table[font] = 'cp' + arg
            elif word == u'fcharset' and font not in font_table and word + arg in CHARSET_MAPPING:
                # \ansicpg overrides \fcharset, if present.
                font_table[font] = CHARSET_MAPPING[word + arg]
        # \'xx
        elif hex:
            if curskip > 0:
                curskip -= 1
            elif not ignorable:
                charcode = int(hex, 16)
                failed = False
                while True:
                    try:
                        encoding, default_encoding = get_encoding(font, font_table, default_encoding, failed=failed)
                        if not encoding:
                            return None
                        out.append(chr(charcode).decode(encoding))
                    except UnicodeDecodeError:
                        failed = True
                    else:
                        break
        elif tchar:
            if curskip > 0:
                curskip -= 1
            elif not ignorable:
                out.append(tchar)
    text = u''.join(out)
    return text, default_encoding


def natcmp(a, b):
    """
    Natural string comparison which mimics the behaviour of Python's internal
    cmp function.
    """
    if len(a) <= len(b):
        for i, key in enumerate(a):
            if isinstance(key, int) and isinstance(b[i], int):
                result = cmp(key, b[i])
            elif isinstance(key, int) and not isinstance(b[i], int):
                result = locale_direct_compare(str(key), b[i])
            elif not isinstance(key, int) and isinstance(b[i], int):
                result = locale_direct_compare(key, str(b[i]))
            else:
                result = locale_direct_compare(key, b[i])
            if result != 0:
                return result
        if len(a) == len(b):
            return 0
        else:
            return -1
    else:
        for i, key in enumerate(b):
            if isinstance(a[i], int) and isinstance(key, int):
                result = cmp(a[i], key)
            elif isinstance(a[i], int) and not isinstance(key, int):
                result = locale_direct_compare(str(a[i]), key)
            elif not isinstance(a[i], int) and isinstance(key, int):
                result = locale_direct_compare(a[i], str(key))
            else:
                result = locale_direct_compare(a[i], key)
            if result != 0:
                return result
        return 1

from xml import OpenLyrics, SongXML
from songstab import SongsTab
from mediaitem import SongMediaItem
-												Added the "lib" module for the Songs plugin.

bzr-revno: 195

											
										
										
											2008-12-07 08:09:59 +00:00
+								# -*- coding: utf-8 -*-
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								# vim: autoindent shiftwidth=4 expandtab textwidth=120 tabstop=4 softtabstop=4
-												Added the "lib" module for the Songs plugin.

bzr-revno: 195

											
										
										
											2008-12-07 08:09:59 +00:00
-												Changed the license info from docstrings to normal comments.

											
										
										
											2009-09-08 19:58:05 +00:00
+								###############################################################################
 								# OpenLP - Open Source Lyrics Projection                                      #
 								# --------------------------------------------------------------------------- #
-is comming
											
										
										
											2012-12-29 20:56:56 +00:00
+								# Copyright (c) 2008-2013 Raoul Snyman                                        #
 								# Portions copyright (c) 2008-2013 Tim Bentley, Gerald Britton, Jonathan      #
-												Added three names in Copyright headers and About window (Samuel Findlay, Edwin Lunando, Dave Warnock). Fixed consistency issues.
											
										
										
											2012-06-22 14:14:53 +00:00
+								# Corwin, Samuel Findlay, Michael Gorven, Scott Guerrieri, Matthias Hub,      #
-												Fixes
											
										
										
											2012-11-11 21:16:14 +00:00
+								# Meinert Jordan, Armin Köhler, Erik Lundin, Edwin Lunando, Brian T. Meyer.   #
-												Copyrights
											
										
										
											2012-10-21 13:16:22 +00:00
+								# Joshua Miller, Stevan Pettit, Andreas Preikschat, Mattias Põldaru,          #
 								# Christian Richter, Philip Ridout, Simon Scudder, Jeffrey Smith,             #
 								# Maikel Stuivenberg, Martin Thompson, Jon Tibble, Dave Warnock,              #
-												Copyright and Translation updates from 2.0
											
										
										
											2012-12-01 07:57:54 +00:00
+								# Frode Woldsund, Martin Zibricky, Patrick Zimmermann                         #
-												Changed the license info from docstrings to normal comments.

											
										
										
											2009-09-08 19:58:05 +00:00
+								# --------------------------------------------------------------------------- #
 								# This program is free software; you can redistribute it and/or modify it     #
 								# under the terms of the GNU General Public License as published by the Free  #
 								# Software Foundation; version 2 of the License.                              #
 								#                                                                             #
 								# This program is distributed in the hope that it will be useful, but WITHOUT #
 								# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or       #
 								# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for    #
 								# more details.                                                               #
 								#                                                                             #
 								# You should have received a copy of the GNU General Public License along     #
 								# with this program; if not, write to the Free Software Foundation, Inc., 59  #
 								# Temple Place, Suite 330, Boston, MA 02111-1307 USA                          #
 								###############################################################################
-												added a song clean up function
											
										
										
											2011-03-14 18:59:59 +00:00
+								import re
-												Added the "lib" module for the Songs plugin.

bzr-revno: 195

											
										
										
											2008-12-07 08:09:59 +00:00
-												removed not needed imports
											
										
										
											2013-01-18 23:31:02 +00:00
+								from PyQt4 import QtGui
-												moved code
											
										
										
											2011-02-23 20:22:29 +00:00
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
+								from openlp.core.lib import translate
-												Fix sorting in song export
											
										
										
											2012-12-08 21:18:45 +00:00
+								from openlp.core.utils import CONTROL_CHARS, locale_direct_compare
-												moved code
											
										
										
											2011-02-23 20:22:29 +00:00
+								from db import Author
 								from ui import SongStrings
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
-												aphrostrophe fix for song searching
											
										
										
											2011-06-01 22:47:42 +00:00
+								WHITESPACE = re.compile(r'[\W_]+', re.UNICODE)
-												More apostrophes
											
										
										
											2011-06-02 21:13:32 +00:00
+								APOSTROPHE = re.compile(u'[\'`’ʻ′]', re.UNICODE)
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								PATTERN = re.compile(r"\\([a-z]{1,32})(-?\d{1,10})?[ ]?|\\'"
 								    r"([0-9a-f]{2})|\\([^a-z])|([{}])|[\r\n]+|(.)", re.I)
 								# RTF control words which specify a "destination" to be ignored.
 								DESTINATIONS = frozenset((
-												fixed bug caused by merge
											
										
										
											2012-12-27 16:46:27 +00:00
+								    u'aftncn', u'aftnsep', u'aftnsepc', u'annotation', u'atnauthor',
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								    u'atndate', u'atnicn', u'atnid', u'atnparent', u'atnref', u'atntime',
 								    u'atrfend', u'atrfstart', u'author', u'background', u'bkmkend',
 								    u'bkmkstart', u'blipuid', u'buptim', u'category',
 								    u'colorschememapping', u'colortbl', u'comment', u'company', u'creatim',
 								    u'datafield', u'datastore', u'defchp', u'defpap', u'do', u'doccomm',
 								    u'docvar', u'dptxbxtext', u'ebcend', u'ebcstart', u'factoidname',
 								    u'falt', u'fchars', u'ffdeftext', u'ffentrymcr', u'ffexitmcr',
 								    u'ffformat', u'ffhelptext', u'ffl', u'ffname', u'ffstattext', u'field',
 								    u'file', u'filetbl', u'fldinst', u'fldrslt', u'fldtype', u'fname',
 								    u'fontemb', u'fontfile', u'footer', u'footerf', u'footerl', u'footerr',
 								    u'footnote', u'formfield', u'ftncn', u'ftnsep', u'ftnsepc', u'g',
 								    u'generator', u'gridtbl', u'header', u'headerf', u'headerl',
 								    u'headerr', u'hl', u'hlfr', u'hlinkbase', u'hlloc', u'hlsrc', u'hsv',
 								    u'htmltag', u'info', u'keycode', u'keywords', u'latentstyles',
 								    u'lchars', u'levelnumbers', u'leveltext', u'lfolevel', u'linkval',
 								    u'list', u'listlevel', u'listname', u'listoverride',
 								    u'listoverridetable', u'listpicture', u'liststylename', u'listtable',
 								    u'listtext', u'lsdlockedexcept', u'macc', u'maccPr', u'mailmerge',
 								    u'maln', u'malnScr', u'manager', u'margPr', u'mbar', u'mbarPr',
 								    u'mbaseJc', u'mbegChr', u'mborderBox', u'mborderBoxPr', u'mbox',
 								    u'mboxPr', u'mchr', u'mcount', u'mctrlPr', u'md', u'mdeg', u'mdegHide',
 								    u'mden', u'mdiff', u'mdPr', u'me', u'mendChr', u'meqArr', u'meqArrPr',
 								    u'mf', u'mfName', u'mfPr', u'mfunc', u'mfuncPr', u'mgroupChr',
 								    u'mgroupChrPr', u'mgrow', u'mhideBot', u'mhideLeft', u'mhideRight',
 								    u'mhideTop', u'mhtmltag', u'mlim', u'mlimloc', u'mlimlow',
 								    u'mlimlowPr', u'mlimupp', u'mlimuppPr', u'mm', u'mmaddfieldname',
 								    u'mmath', u'mmathPict', u'mmathPr', u'mmaxdist', u'mmc', u'mmcJc',
 								    u'mmconnectstr', u'mmconnectstrdata', u'mmcPr', u'mmcs',
 								    u'mmdatasource', u'mmheadersource', u'mmmailsubject', u'mmodso',
 								    u'mmodsofilter', u'mmodsofldmpdata', u'mmodsomappedname',
 								    u'mmodsoname', u'mmodsorecipdata', u'mmodsosort', u'mmodsosrc',
 								    u'mmodsotable', u'mmodsoudl', u'mmodsoudldata', u'mmodsouniquetag',
 								    u'mmPr', u'mmquery', u'mmr', u'mnary', u'mnaryPr', u'mnoBreak',
 								    u'mnum', u'mobjDist', u'moMath', u'moMathPara', u'moMathParaPr',
 								    u'mopEmu', u'mphant', u'mphantPr', u'mplcHide', u'mpos', u'mr',
 								    u'mrad', u'mradPr', u'mrPr', u'msepChr', u'mshow', u'mshp', u'msPre',
 								    u'msPrePr', u'msSub', u'msSubPr', u'msSubSup', u'msSubSupPr', u'msSup',
 								    u'msSupPr', u'mstrikeBLTR', u'mstrikeH', u'mstrikeTLBR', u'mstrikeV',
 								    u'msub', u'msubHide', u'msup', u'msupHide', u'mtransp', u'mtype',
 								    u'mvertJc', u'mvfmf', u'mvfml', u'mvtof', u'mvtol', u'mzeroAsc',
-												Fix spelling - oops
											
										
										
											2012-11-07 21:37:01 +00:00
+								    u'mzFrodesc', u'mzeroWid', u'nesttableprops', u'nextfile',
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								    u'nonesttables', u'objalias', u'objclass', u'objdata', u'object',
 								    u'objname', u'objsect', u'objtime', u'oldcprops', u'oldpprops',
 								    u'oldsprops', u'oldtprops', u'oleclsid', u'operator', u'panose',
 								    u'password', u'passwordhash', u'pgp', u'pgptbl', u'picprop', u'pict',
 								    u'pn', u'pnseclvl', u'pntext', u'pntxta', u'pntxtb', u'printim',
 								    u'private', u'propname', u'protend', u'protstart', u'protusertbl',
 								    u'pxe', u'result', u'revtbl', u'revtim', u'rsidtbl', u'rxe', u'shp',
 								    u'shpgrp', u'shpinst', u'shppict', u'shprslt', u'shptxt', u'sn', u'sp',
 								    u'staticval', u'stylesheet', u'subject', u'sv', u'svb', u'tc',
 								    u'template', u'themedata', u'title', u'txe', u'ud', u'upr',
 								    u'userprops', u'wgrffmtfilter', u'windowcaption', u'writereservation',
 								    u'writereservhash', u'xe', u'xform', u'xmlattrname', u'xmlattrvalue',
 								    u'xmlclose', u'xmlname', u'xmlnstbl', u'xmlopen'))
 								# Translation of some special characters.
 								SPECIAL_CHARS = {
 								    u'par': u'\n',
 								    u'sect': u'\n\n',
 								    # Required page and column break.
 								    # Would be good if we could split verse into subverses here.
 								    u'page': u'\n\n',
 								    u'column': u'\n\n',
 								    # Soft breaks.
 								    u'softpage': u'[---]',
 								    u'softcol': u'[---]',
 								    u'line': u'\n',
 								    u'tab': u'\t',
 								    u'emdash': u'\u2014',
 								    u'endash': u'\u2013',
 								    u'emspace': u'\u2003',
 								    u'enspace': u'\u2002',
 								    u'qmspace': u'\u2005',
 								    u'bullet': u'\u2022',
 								    u'lquote': u'\u2018',
 								    u'rquote': u'\u2019',
 								    u'ldblquote': u'\u201C',
 								    u'rdblquote': u'\u201D',
 								    u'ltrmark': u'\u200E',
 								    u'rtlmark': u'\u200F',
 								    u'zwj': u'\u200D',
 								    u'zwnj': u'\u200C'}
 								CHARSET_MAPPING = {
 								    u'fcharset0': u'cp1252',
 								    u'fcharset161': u'cp1253',
 								    u'fcharset162': u'cp1254',
 								    u'fcharset163': u'cp1258',
 								    u'fcharset177': u'cp1255',
 								    u'fcharset178': u'cp1256',
 								    u'fcharset186': u'cp1257',
 								    u'fcharset204': u'cp1251',
 								    u'fcharset222': u'cp874',
 								    u'fcharset238': u'cp1250'}
-												aphrostrophe fix for song searching
											
										
										
											2011-06-01 22:47:42 +00:00
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
+								class VerseType(object):
 								    """
 								    VerseType provides an enumeration for the tags that may be associated
 								    with verses in songs.
 								    """
 								    Verse = 0
 								    Chorus = 1
 								    Bridge = 2
 								    PreChorus = 3
 								    Intro = 4
 								    Ending = 5
 								    Other = 6
-												just another massive set of changes
											
										
										
											2011-02-17 19:46:01 +00:00
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
+								    Names = [
 								        u'Verse',
 								        u'Chorus',
 								        u'Bridge',
 								        u'Pre-Chorus',
 								        u'Intro',
 								        u'Ending',
 								        u'Other']
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								    Tags = [name[0].lower() for name in Names]
-												just another massive set of changes
											
										
										
											2011-02-17 19:46:01 +00:00
 								    TranslatedNames = [
-												removed not neede unicode calls
											
										
										
											2012-05-17 18:57:01 +00:00
+								        translate('SongsPlugin.VerseType', 'Verse'),
 								        translate('SongsPlugin.VerseType', 'Chorus'),
 								        translate('SongsPlugin.VerseType', 'Bridge'),
 								        translate('SongsPlugin.VerseType', 'Pre-Chorus'),
 								        translate('SongsPlugin.VerseType', 'Intro'),
 								        translate('SongsPlugin.VerseType', 'Ending'),
 								        translate('SongsPlugin.VerseType', 'Other')]
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								    TranslatedTags = [name[0].lower() for name in TranslatedNames]
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
 								    @staticmethod
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								    def translated_tag(verse_tag, default=Other):
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        """
 								        Return the translated UPPERCASE tag for a given tag,
 								        used to show translated verse tags in UI
 								        ``verse_tag``
 								            The string to return a VerseType for
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        ``default``
 								            Default return value if no matching tag is found
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        """
 								        verse_tag = verse_tag[0].lower()
 								        for num, tag in enumerate(VerseType.Tags):
 								            if verse_tag == tag:
 								                return VerseType.TranslatedTags[num].upper()
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        if default in VerseType.TranslatedTags:
 								            return VerseType.TranslatedTags[default].upper()
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
 								    @staticmethod
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								    def translated_name(verse_tag, default=Other):
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        """
 								        Return the translated name for a given tag
 								        ``verse_tag``
 								            The string to return a VerseType for
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        ``default``
 								            Default return value if no matching tag is found
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        """
 								        verse_tag = verse_tag[0].lower()
 								        for num, tag in enumerate(VerseType.Tags):
 								            if verse_tag == tag:
 								                return VerseType.TranslatedNames[num]
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        if default in VerseType.TranslatedNames:
 								            return VerseType.TranslatedNames[default]
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
 								    @staticmethod
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								    def from_tag(verse_tag, default=Other):
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
+								        """
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        Return the VerseType for a given tag
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        ``verse_tag``
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
+								            The string to return a VerseType for
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        ``default``
 								            Default return value if no matching tag is found
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        """
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        verse_tag = verse_tag[0].lower()
 								        for num, tag in enumerate(VerseType.Tags):
 								            if verse_tag == tag:
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								                return num
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        return default
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								    @staticmethod
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								    def from_translated_tag(verse_tag, default=Other):
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        """
 								        Return the VerseType for a given tag
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        ``verse_tag``
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								            The string to return a VerseType for
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
 								        ``default``
 								            Default return value if no matching tag is found
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        """
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        verse_tag = verse_tag[0].lower()
 								        for num, tag in enumerate(VerseType.TranslatedTags):
 								            if verse_tag == tag:
 								                return num
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        return default
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
 								    @staticmethod
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								    def from_string(verse_name, default=Other):
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        """
 								        Return the VerseType for a given string
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        ``verse_name``
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								            The string to return a VerseType for
-												Bug #875286
use VerseType.Other if it is not recogniced during OpenSong import.

											
										
										
											2011-11-18 10:53:56 +00:00
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        ``default``
 								            Default return value if no matching tag is found
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
+								        """
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        verse_name = verse_name.lower()
 								        for num, name in enumerate(VerseType.Names):
 								            if verse_name == name.lower():
 								                return num
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        return default
-												Keep library classes/methods in lib dirs
											
										
										
											2010-06-12 12:33:04 +00:00
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
+								    @staticmethod
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								    def from_translated_string(verse_name):
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
+								        """
 								        Return the VerseType for a given string
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        ``verse_name``
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
+								            The string to return a VerseType for
 								        """
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        verse_name = verse_name.lower()
-												just another massive set of changes
											
										
										
											2011-02-17 19:46:01 +00:00
+								        for num, translation in enumerate(VerseType.TranslatedNames):
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								            if verse_name == translation.lower():
-												VerseType changes
											
										
										
											2011-02-16 18:37:51 +00:00
+								                return num
 								    @staticmethod
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								    def from_loose_input(verse_name, default=Other):
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        """
-												corrected function comment

											
										
										
											2011-11-24 22:49:21 +00:00
+								        Return the VerseType for a given string
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        ``verse_name``
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								            The string to return a VerseType for
-												Bug #875286
use VerseType.Other if it is not recogniced during OpenSong import.

											
										
										
											2011-11-18 10:53:56 +00:00
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								        ``default``
 								            Default return value if no matching tag is found
-												first working example with unilanguage tags handling
											
										
										
											2011-02-17 15:05:58 +00:00
+								        """
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        if len(verse_name) > 1:
 								            verse_index = VerseType.from_translated_string(verse_name)
 								            if verse_index is None:
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								                verse_index = VerseType.from_string(verse_name, default)
-												Fix #249 on tracker, exception on opensong files with verse name containing only number [1]

											
										
										
											2011-08-16 00:08:16 +00:00
+								        elif len(verse_name) == 1:
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								            verse_index = VerseType.from_translated_tag(verse_name, None)
-												Fix #249 on tracker, exception on opensong files with verse name containing only number [1]

											
										
										
											2011-08-16 00:08:16 +00:00
+								            if verse_index is None:
-												make VerseType.Other default for VerseType encodings

											
										
										
											2011-11-24 22:34:27 +00:00
+								                verse_index = VerseType.from_tag(verse_name, default)
 								        else:
 								            return default
-												better variable names, fixed translation issues for verse sequences
											
										
										
											2011-02-18 00:48:58 +00:00
+								        return verse_index
-												Character selection fallback for the ewimporter

											
										
										
											2011-01-04 10:13:41 +00:00
-												variable naming conventions, converted dict to list
											
										
										
											2012-06-16 15:51:04 +00:00
-												Character selection fallback for the ewimporter

											
										
										
											2011-01-04 10:13:41 +00:00
+								def retrieve_windows_encoding(recommendation=None):
-												Missing function docstrings
											
										
										
											2011-02-07 16:29:06 +00:00
+								    """
 								    Determines which encoding to use on an information source. The process uses
 								    both automated detection, which is passed to this method as a
 								    recommendation, and user confirmation to return an encoding.
 								    ``recommendation``
 								        A recommended encoding discovered programmatically for the user to
 								        confirm.
 								    """
-												Character selection fallback for the ewimporter

											
										
										
											2011-01-04 10:13:41 +00:00
+								    # map chardet result to compatible windows standard code page
 								    codepage_mapping = {'IBM866': u'cp866', 'TIS-620': u'cp874',
 								        'SHIFT_JIS': u'cp932', 'GB2312': u'cp936', 'HZ-GB-2312': u'cp936',
 								        'EUC-KR': u'cp949', 'Big5': u'cp950', 'ISO-8859-2': u'cp1250',
 								        'windows-1250': u'cp1250', 'windows-1251': u'cp1251',
 								        'windows-1252': u'cp1252', 'ISO-8859-7': u'cp1253',
 								        'windows-1253': u'cp1253', 'ISO-8859-8': u'cp1255',
 								        'windows-1255': u'cp1255'}
 								    if recommendation in codepage_mapping:
 								        recommendation = codepage_mapping[recommendation]
 								    # Show dialog for encoding selection
 								    encodings = [(u'cp1256', translate('SongsPlugin', 'Arabic (CP-1256)')),
 								        (u'cp1257', translate('SongsPlugin', 'Baltic (CP-1257)')),
 								        (u'cp1250', translate('SongsPlugin', 'Central European (CP-1250)')),
 								        (u'cp1251', translate('SongsPlugin', 'Cyrillic (CP-1251)')),
 								        (u'cp1253', translate('SongsPlugin', 'Greek (CP-1253)')),
 								        (u'cp1255', translate('SongsPlugin', 'Hebrew (CP-1255)')),
 								        (u'cp932', translate('SongsPlugin', 'Japanese (CP-932)')),
 								        (u'cp949', translate('SongsPlugin', 'Korean (CP-949)')),
 								        (u'cp936', translate('SongsPlugin', 'Simplified Chinese (CP-936)')),
 								        (u'cp874', translate('SongsPlugin', 'Thai (CP-874)')),
 								        (u'cp950', translate('SongsPlugin', 'Traditional Chinese (CP-950)')),
 								        (u'cp1254', translate('SongsPlugin', 'Turkish (CP-1254)')),
 								        (u'cp1258', translate('SongsPlugin', 'Vietnam (CP-1258)')),
 								        (u'cp1252', translate('SongsPlugin', 'Western European (CP-1252)'))]
 								    recommended_index = -1
 								    if recommendation:
 								        for index in range(len(encodings)):
 								            if recommendation == encodings[index][0]:
 								                recommended_index = index
 								                break
 								    if recommended_index > 0:
 								        choice = QtGui.QInputDialog.getItem(None,
 								            translate('SongsPlugin', 'Character Encoding'),
 								            translate('SongsPlugin', 'The codepage setting is responsible\n'
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								                'for the correct character representation.\nUsually you are fine with the preselected choice.'),
-												Character selection fallback for the ewimporter

											
										
										
											2011-01-04 10:13:41 +00:00
+								            [pair[1] for pair in encodings], recommended_index, False)
 								    else:
 								        choice = QtGui.QInputDialog.getItem(None,
 								            translate('SongsPlugin', 'Character Encoding'),
 								            translate('SongsPlugin', 'Please choose the character encoding.\n'
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								                'The encoding is responsible for the correct character representation.'),
 								                [pair[1] for pair in encodings], 0, False)
-												Character selection fallback for the ewimporter

											
										
										
											2011-01-04 10:13:41 +00:00
+								    if not choice[1]:
 								        return None
 								    return filter(lambda item: item[1] == choice[0], encodings)[0][0]
-												variable naming conventions, converted dict to list
											
										
										
											2012-06-16 15:51:04 +00:00
-												aphrostrophe fix for song searching
											
										
										
											2011-06-01 22:47:42 +00:00
+								def clean_string(string):
 								    """
 								    Strips punctuation from the passed string to assist searching
 								    """
-												More apostrophes
											
										
										
											2011-06-02 21:13:32 +00:00
+								    return WHITESPACE.sub(u' ', APOSTROPHE.sub(u'', string)).lower()
-												removed whitespaces at line ends

											
										
										
											2012-04-04 07:26:51 +00:00
-												variable naming conventions, converted dict to list
											
										
										
											2012-06-16 15:51:04 +00:00
-												Fix for bug 952533

											
										
										
											2012-03-22 06:50:54 +00:00
+								def clean_title(title):
 								    """
 								    Cleans the song title by removing Unicode control chars groups C0 & C1,
 								    as well as any trailing spaces
 								    """
-												Made modifications according to merge request

											
										
										
											2012-03-22 17:22:01 +00:00
+								    return CONTROL_CHARS.sub(u'', title).rstrip()
-												aphrostrophe fix for song searching
											
										
										
											2011-06-01 22:47:42 +00:00
-												variable naming conventions, converted dict to list
											
										
										
											2012-06-16 15:51:04 +00:00
-												added a song clean up function
											
										
										
											2011-03-14 18:59:59 +00:00
+								def clean_song(manager, song):
-												moved code
											
										
										
											2011-02-23 20:22:29 +00:00
+								    """
-												removed old hack, updated comment, typo
											
										
										
											2011-03-16 17:21:03 +00:00
+								    Cleans the search title, rebuilds the search lyrics, adds a default author
-												spelling
											
										
										
											2011-03-15 17:56:34 +00:00
+								    if the song does not have one and other clean ups. This should always
 								    called when a new song is added or changed.
-												moved code
											
										
										
											2011-02-23 20:22:29 +00:00
 								    ``manager``
 								        The song's manager.
 								    ``song``
 								        The song object.
 								    """
-												Changed typecast to rather check for buffer.
											
										
										
											2011-07-08 06:40:50 +00:00
+								    if isinstance(song.title, buffer):
-												Fixed bug #794971: Typecast the buffer object to a unicode object.
											
										
										
											2011-07-08 06:31:34 +00:00
+								        song.title = unicode(song.title)
-												Changed typecast to rather check for buffer.
											
										
										
											2011-07-08 06:40:50 +00:00
+								    if isinstance(song.alternate_title, buffer):
 								        song.alternate_title = unicode(song.alternate_title)
 								    if isinstance(song.lyrics, buffer):
-												Fixed bug #794971: Typecast the buffer object to a unicode object.
											
										
										
											2011-07-08 06:31:34 +00:00
+								        song.lyrics = unicode(song.lyrics)
-												Fix for bug 952533

											
										
										
											2012-03-22 06:50:54 +00:00
+								    if song.title:
 								        song.title = clean_title(song.title)
 								    else:
 								        song.title = u''
 								    if song.alternate_title:
 								        song.alternate_title = clean_title(song.alternate_title)
 								    else:
-												added a song clean up function
											
										
										
											2011-03-14 18:59:59 +00:00
+								        song.alternate_title = u''
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								    song.search_title = clean_string(song.title) + u'@' + clean_string(song.alternate_title)
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								    # Only do this, if we the song is a 1.9.4 song (or older).
 								    if song.lyrics.find(u'<lyrics language="en">') != -1:
 								        # Remove the old "language" attribute from lyrics tag (prior to 1.9.5).
 								        # This is not very important, but this keeps the database clean. This
 								        # can be removed when everybody has cleaned his songs.
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								        song.lyrics = song.lyrics.replace(u'<lyrics language="en">', u'<lyrics>')
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								        verses = SongXML().get_verses(song.lyrics)
-												aphrostrophe fix for song searching
											
										
										
											2011-06-01 22:47:42 +00:00
+								        song.search_lyrics = u' '.join([clean_string(verse[1])
 								            for verse in verses])
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								        # We need a new and clean SongXML instance.
 								        sxml = SongXML()
 								        # Rebuild the song's verses, to remove any wrong verse names (for
 								        # example translated ones), which might have been added prior to 1.9.5.
 								        # List for later comparison.
 								        compare_order = []
 								        for verse in verses:
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								            verse_type = VerseType.Tags[VerseType.from_loose_input(verse[0][u'type'])]
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								            sxml.add_verse_to_lyrics(
 								                verse_type,
 								                verse[0][u'label'],
 								                verse[1],
-												pythonifying code:
- replace has_key() by key in dict
- remove len() method from sequence and mapping types when mapping to bool

											
										
										
											2012-04-29 15:31:56 +00:00
+								                verse[0].get(u'lang')
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								            )
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								            compare_order.append((u'%s%s' % (verse_type, verse[0][u'label'])).upper())
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								            if verse[0][u'label'] == u'1':
 								                compare_order.append(verse_type.upper())
 								        song.lyrics = unicode(sxml.extract_xml(), u'utf-8')
 								        # Rebuild the verse order, to convert translated verse tags, which might
 								        # have been added prior to 1.9.5.
 								        if song.verse_order:
-												Bug #969282: Remove control characters from song copyright string

											
										
										
											2012-04-02 11:38:22 +00:00
+								            order = CONTROL_CHARS.sub(u'', song.verse_order).strip().split()
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								        else:
 								            order = []
 								        new_order = []
 								        for verse_def in order:
 								            verse_type = VerseType.Tags[
 								                VerseType.from_loose_input(verse_def[0])]
 								            if len(verse_def) > 1:
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								                new_order.append((u'%s%s' % (verse_type, verse_def[1:])).upper())
-												better solution
											
										
										
											2011-05-28 17:01:41 +00:00
+								            else:
 								                new_order.append(verse_type.upper())
 								        song.verse_order = u' '.join(new_order)
 								        # Check if the verse order contains tags for verses which do not exist.
 								        for order in new_order:
 								            if order not in compare_order:
 								                song.verse_order = u''
 								                break
-												aphrostrophe fix for song searching
											
										
										
											2011-06-01 22:47:42 +00:00
+								    else:
 								        verses = SongXML().get_verses(song.lyrics)
 								        song.search_lyrics = u' '.join([clean_string(verse[1])
 								            for verse in verses])
-												continued clean up
											
										
										
											2011-03-15 17:52:42 +00:00
+								    # The song does not have any author, add one.
 								    if not song.authors:
 								        name = SongStrings.AuthorUnknown
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								        author = manager.get_object_filtered(Author, Author.display_name == name)
-												continued clean up
											
										
										
											2011-03-15 17:52:42 +00:00
+								        if author is None:
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								            author = Author.populate(display_name=name, last_name=u'', first_name=u'')
-												continued clean up
											
										
										
											2011-03-15 17:52:42 +00:00
+								        song.authors.append(author)
-												Bug #969282: Remove control characters from song copyright string

											
										
										
											2012-04-02 11:38:22 +00:00
+								    if song.copyright:
 								        song.copyright = CONTROL_CHARS.sub(u'', song.copyright).strip()
-												moved code
											
										
										
											2011-02-23 20:22:29 +00:00
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
 								def get_encoding(font, font_table, default_encoding, failed=False):
 								    """
 								    Finds an encoding to use. Asks user, if necessary.
 								    ``font``
 								    The number of currently active font.
 								    ``font_table``
 								    Dictionary of fonts and respective encodings.
 								    ``default_encoding``
-												Use new strip_rtf routine and error trap
											
										
										
											2012-07-05 19:24:56 +00:00
+								    The default encoding to use when font_table is empty or no font is used.
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
 								    ``failed``
 								    A boolean indicating whether the previous encoding didn't work.
 								    """
 								    encoding = None
 								    if font in font_table:
 								        encoding = font_table[font]
 								    if not encoding and default_encoding:
 								        encoding = default_encoding
 								    if not encoding or failed:
 								        encoding = retrieve_windows_encoding()
 								        default_encoding = encoding
 								    font_table[font] = encoding
 								    return encoding, default_encoding
 								def strip_rtf(text, default_encoding=None):
-												Move strip_rtf and change it into a class StripRtf + other changes. It might not work that well yet.

											
										
										
											2012-06-24 18:08:20 +00:00
+								    """
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								    This function strips RTF control structures and returns an unicode string.
-												Move strip_rtf and change it into a class StripRtf + other changes. It might not work that well yet.

											
										
										
											2012-06-24 18:08:20 +00:00
 								    Thanks to Markus Jarderot (MizardX) for this code, used by permission.
 								    http://stackoverflow.com/questions/188545
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
 								    ``text``
 								    RTF-encoded text, a string.
 								    ``default_encoding``
 								    Default encoding to use when no encoding is specified.
-												Move strip_rtf and change it into a class StripRtf + other changes. It might not work that well yet.

											
										
										
											2012-06-24 18:08:20 +00:00
+								    """
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								    # Current font is the font tag we last met.
 								    font = u''
 								    # Character encoding is defined inside fonttable.
 								    # font_table could contain eg u'0': u'cp1252'
 								    font_table = {u'': u''}
 								    # Stack of things to keep track of when entering/leaving groups.
 								    stack = []
 								    # Whether this group (and all inside it) are "ignorable".
 								    ignorable = False
 								    # Number of ASCII characters to skip after an unicode character.
 								    ucskip = 1
 								    # Number of ASCII characters left to skip.
 								    curskip = 0
 								    # Output buffer.
 								    out = []
 								    for match in PATTERN.finditer(text):
 								        word, arg, hex, char, brace, tchar = match.groups()
 								        if brace:
 								            curskip = 0
 								            if brace == u'{':
 								                # Push state
 								                stack.append((ucskip, ignorable, font))
 								            elif brace == u'}':
 								                # Pop state
 								                ucskip, ignorable, font = stack.pop()
 								        # \x (not a letter)
 								        elif char:
 								            curskip = 0
 								            if char == u'~' and not ignorable:
 								                out.append(u'\xA0')
 								            elif char in u'{}\\' and not ignorable:
 								                out.append(char)
 								            elif char == u'-' and not ignorable:
 								                out.append(u'\u00AD')
 								            elif char == u'_' and not ignorable:
 								                out.append(u'\u2011')
 								            elif char == u'*':
 								                ignorable = True
 								        # \command
 								        elif word:
 								            curskip = 0
 								            if word in DESTINATIONS:
 								                ignorable = True
 								            elif word in SPECIAL_CHARS:
 								                out.append(SPECIAL_CHARS[word])
 								            elif word == u'uc':
 								                ucskip = int(arg)
 								            elif word == u' ':
 								                c = int(arg)
 								                if c < 0:
 								                    c += 0x10000
 								                out.append(unichr(c))
 								                curskip = ucskip
 								            elif word == u'fonttbl':
 								                ignorable = True
 								            elif word == u'f':
 								                font = arg
 								            elif word == u'ansicpg':
 								                font_table[font] = 'cp' + arg
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								            elif word == u'fcharset' and font not in font_table and word + arg in CHARSET_MAPPING:
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								                # \ansicpg overrides \fcharset, if present.
 								                font_table[font] = CHARSET_MAPPING[word + arg]
 								        # \'xx
 								        elif hex:
 								            if curskip > 0:
 								                curskip -= 1
 								            elif not ignorable:
 								                charcode = int(hex, 16)
-												Cleanup.

											
										
										
											2012-07-03 22:55:53 +00:00
+								                failed = False
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								                while True:
 								                    try:
-												Final 120 files
											
										
										
											2013-01-06 17:25:49 +00:00
+								                        encoding, default_encoding = get_encoding(font, font_table, default_encoding, failed=failed)
-												fixes bug 1098075 trunk version

											
										
										
											2013-02-04 17:47:02 +00:00
+								                        if not encoding:
 								                            return None
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								                        out.append(chr(charcode).decode(encoding))
 								                    except UnicodeDecodeError:
-												Cleanup.

											
										
										
											2012-07-03 22:55:53 +00:00
+								                        failed = True
-												Make strip_rtf a function again.

											
										
										
											2012-07-03 22:26:54 +00:00
+								                    else:
 								                        break
 								        elif tchar:
 								            if curskip > 0:
 								                curskip -= 1
 								            elif not ignorable:
 								                out.append(tchar)
 								    text = u''.join(out)
 								    return text, default_encoding
-												fixed bug caused by merge
											
										
										
											2012-12-27 16:46:27 +00:00
-												Fix sorting in song export
											
										
										
											2012-12-08 21:18:45 +00:00
+								def natcmp(a, b):
 								    """
 								    Natural string comparison which mimics the behaviour of Python's internal
 								    cmp function.
 								    """
 								    if len(a) <= len(b):
 								        for i, key in enumerate(a):
 								            if isinstance(key, int) and isinstance(b[i], int):
 								                result = cmp(key, b[i])
 								            elif isinstance(key, int) and not isinstance(b[i], int):
-												fixed bug caused by merge
											
										
										
											2012-12-27 16:46:27 +00:00
+								                result = locale_direct_compare(str(key), b[i])
-												Fix sorting in song export
											
										
										
											2012-12-08 21:18:45 +00:00
+								            elif not isinstance(key, int) and isinstance(b[i], int):
-												fixed bug caused by merge
											
										
										
											2012-12-27 16:46:27 +00:00
+								                result = locale_direct_compare(key, str(b[i]))
-												Fix sorting in song export
											
										
										
											2012-12-08 21:18:45 +00:00
+								            else:
 								                result = locale_direct_compare(key, b[i])
 								            if result != 0:
 								                return result
 								        if len(a) == len(b):
 								            return 0
 								        else:
 								            return -1
 								    else:
 								        for i, key in enumerate(b):
 								            if isinstance(a[i], int) and isinstance(key, int):
 								                result = cmp(a[i], key)
 								            elif isinstance(a[i], int) and not isinstance(key, int):
-												fixed bug caused by merge
											
										
										
											2012-12-27 16:46:27 +00:00
+								                result = locale_direct_compare(str(a[i]), key)
-												Fix sorting in song export
											
										
										
											2012-12-08 21:18:45 +00:00
+								            elif not isinstance(a[i], int) and isinstance(key, int):
-												fixed bug caused by merge
											
										
										
											2012-12-27 16:46:27 +00:00
+								                result = locale_direct_compare(a[i], str(key))
-												Fix sorting in song export
											
										
										
											2012-12-08 21:18:45 +00:00
+								            else:
 								                result = locale_direct_compare(a[i], key)
 								            if result != 0:
 								                return result
 								        return 1
-												Better handling of encodings. User is asked only once, if possible.

											
										
										
											2012-06-25 06:44:11 +00:00
-												merged classes together
											
										
										
											2011-01-09 16:52:31 +00:00
+								from xml import OpenLyrics, SongXML
-												Added a songs settings tab.

bzr-revno: 352

											
										
										
											2009-02-28 23:31:24 +00:00
+								from songstab import SongsTab
-												Character selection fallback for the ewimporter

											
										
										
											2011-01-04 10:13:41 +00:00
+								from mediaitem import SongMediaItem