2009-10-19 13:57:31 +00:00
|
|
|
#!/usr/bin/env python
|
|
|
|
# -*- coding: utf-8 -*-
|
2009-10-24 07:14:11 +00:00
|
|
|
# vim: autoindent shiftwidth=4 expandtab textwidth=80 tabstop=4 softtabstop=4
|
|
|
|
|
|
|
|
###############################################################################
|
|
|
|
# OpenLP - Open Source Lyrics Projection #
|
|
|
|
# --------------------------------------------------------------------------- #
|
2009-12-31 12:52:01 +00:00
|
|
|
# Copyright (c) 2008-2010 Raoul Snyman #
|
|
|
|
# Portions copyright (c) 2008-2010 Tim Bentley, Jonathan Corwin, Michael #
|
2009-11-30 20:29:26 +00:00
|
|
|
# Gorven, Scott Guerrieri, Maikel Stuivenberg, Martin Thompson, Jon Tibble, #
|
|
|
|
# Carsten Tinggaard #
|
2009-10-24 07:14:11 +00:00
|
|
|
# --------------------------------------------------------------------------- #
|
|
|
|
# This program is free software; you can redistribute it and/or modify it #
|
|
|
|
# under the terms of the GNU General Public License as published by the Free #
|
|
|
|
# Software Foundation; version 2 of the License. #
|
|
|
|
# #
|
|
|
|
# This program is distributed in the hope that it will be useful, but WITHOUT #
|
|
|
|
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or #
|
|
|
|
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for #
|
|
|
|
# more details. #
|
|
|
|
# #
|
|
|
|
# You should have received a copy of the GNU General Public License along #
|
|
|
|
# with this program; if not, write to the Free Software Foundation, Inc., 59 #
|
|
|
|
# Temple Place, Suite 330, Boston, MA 02111-1307 USA #
|
|
|
|
###############################################################################
|
2009-10-19 13:57:31 +00:00
|
|
|
|
|
|
|
import sys
|
|
|
|
import os
|
|
|
|
import sqlite
|
|
|
|
import sqlite3
|
2009-10-19 20:03:55 +00:00
|
|
|
import re
|
2009-10-19 13:57:31 +00:00
|
|
|
from optparse import OptionParser
|
|
|
|
from traceback import format_tb as get_traceback
|
|
|
|
|
|
|
|
# Some global options to be used throughout the import process
|
2009-10-20 16:43:36 +00:00
|
|
|
dirty_chars = re.compile(r'\W ', re.UNICODE)
|
2009-10-19 13:57:31 +00:00
|
|
|
verbose = False
|
|
|
|
debug = False
|
|
|
|
old_cursor = None
|
|
|
|
new_cursor = None
|
|
|
|
|
|
|
|
# SQL create statments
|
|
|
|
create_statements = [
|
2009-10-19 20:03:55 +00:00
|
|
|
(u'table "authors"', u"""CREATE TABLE authors (
|
2009-10-19 13:57:31 +00:00
|
|
|
id INTEGER NOT NULL,
|
|
|
|
first_name VARCHAR(128),
|
|
|
|
last_name VARCHAR(128),
|
|
|
|
display_name VARCHAR(255) NOT NULL,
|
|
|
|
PRIMARY KEY (id)
|
2009-10-19 20:03:55 +00:00
|
|
|
)"""),
|
|
|
|
(u'table "song_books"', u"""CREATE TABLE song_books (
|
2009-10-19 13:57:31 +00:00
|
|
|
id INTEGER NOT NULL,
|
|
|
|
name VARCHAR(128) NOT NULL,
|
|
|
|
publisher VARCHAR(128),
|
|
|
|
PRIMARY KEY (id)
|
2009-10-19 20:03:55 +00:00
|
|
|
)"""),
|
|
|
|
(u'table "songs"', u"""CREATE TABLE songs (
|
2009-10-19 13:57:31 +00:00
|
|
|
id INTEGER NOT NULL,
|
|
|
|
song_book_id INTEGER,
|
|
|
|
title VARCHAR(255) NOT NULL,
|
|
|
|
lyrics TEXT NOT NULL,
|
|
|
|
verse_order VARCHAR(128),
|
|
|
|
copyright VARCHAR(255),
|
|
|
|
comments TEXT,
|
|
|
|
ccli_number VARCHAR(64),
|
|
|
|
song_number VARCHAR(64),
|
|
|
|
theme_name VARCHAR(128),
|
|
|
|
search_title VARCHAR(255) NOT NULL,
|
|
|
|
search_lyrics TEXT NOT NULL,
|
|
|
|
PRIMARY KEY (id),
|
|
|
|
FOREIGN KEY(song_book_id) REFERENCES song_books (id)
|
2009-10-19 20:03:55 +00:00
|
|
|
)"""),
|
|
|
|
(u'table "topics"', u"""CREATE TABLE topics (
|
2009-10-19 13:57:31 +00:00
|
|
|
id INTEGER NOT NULL,
|
|
|
|
name VARCHAR(128) NOT NULL,
|
|
|
|
PRIMARY KEY (id)
|
2009-10-19 20:03:55 +00:00
|
|
|
)"""),
|
|
|
|
(u'index "ix_songs_search_lyrics"',
|
|
|
|
u"""CREATE INDEX ix_songs_search_lyrics ON songs (search_lyrics)"""),
|
|
|
|
(u'index "ix_songs_search_title',
|
|
|
|
u"""CREATE INDEX ix_songs_search_title ON songs (search_title)"""),
|
|
|
|
(u'table "authors_songs"', u"""CREATE TABLE authors_songs (
|
2009-10-19 13:57:31 +00:00
|
|
|
author_id INTEGER NOT NULL,
|
|
|
|
song_id INTEGER NOT NULL,
|
|
|
|
PRIMARY KEY (author_id, song_id),
|
|
|
|
FOREIGN KEY(author_id) REFERENCES authors (id),
|
|
|
|
FOREIGN KEY(song_id) REFERENCES songs (id)
|
2009-10-19 20:03:55 +00:00
|
|
|
)"""),
|
|
|
|
(u'table "songs_topics"', u"""CREATE TABLE songs_topics (
|
2009-10-19 13:57:31 +00:00
|
|
|
song_id INTEGER NOT NULL,
|
|
|
|
topic_id INTEGER NOT NULL,
|
|
|
|
PRIMARY KEY (song_id, topic_id),
|
|
|
|
FOREIGN KEY(song_id) REFERENCES songs (id),
|
|
|
|
FOREIGN KEY(topic_id) REFERENCES topics (id)
|
2009-10-19 20:03:55 +00:00
|
|
|
)""")
|
2009-10-19 13:57:31 +00:00
|
|
|
]
|
|
|
|
|
2009-10-30 20:57:44 +00:00
|
|
|
def prepare_string(dirty):
|
2009-10-20 16:43:36 +00:00
|
|
|
return dirty_chars.sub(u'', dirty.replace(u'\r\n', ' ').replace(u'\n', ' '))
|
2009-10-19 20:03:55 +00:00
|
|
|
|
|
|
|
def display_sql(sql, params):
|
|
|
|
prepared_params = []
|
|
|
|
for param in params:
|
|
|
|
if isinstance(param, basestring):
|
|
|
|
prepared_params.append(u'"%s"' % param)
|
|
|
|
elif isinstance(param, (int, long)):
|
|
|
|
prepared_params.append(u'%d' % param)
|
|
|
|
elif isinstance(param, (float, complex)):
|
|
|
|
prepared_params.append(u'%f' % param)
|
|
|
|
else:
|
|
|
|
prepared_params.append(u'"%s"' % str(param))
|
|
|
|
for prepared_param in prepared_params:
|
|
|
|
sql = sql.replace(u'?', prepared_param, 1)
|
|
|
|
return sql
|
|
|
|
|
2009-10-19 13:57:31 +00:00
|
|
|
def create_database():
|
|
|
|
global new_cursor, create_statements
|
|
|
|
if debug or verbose:
|
|
|
|
print 'Creating new database:'
|
|
|
|
else:
|
|
|
|
print 'Creating new database...',
|
2009-10-19 20:03:55 +00:00
|
|
|
for statement_type, sql_create in create_statements:
|
2009-10-19 13:57:31 +00:00
|
|
|
if debug:
|
|
|
|
print '... ', sql_create.replace('\n', ' ').replace(' ', ' ')
|
|
|
|
elif verbose:
|
2009-10-19 20:03:55 +00:00
|
|
|
print '... creating %s...' % statement_type,
|
2009-10-19 13:57:31 +00:00
|
|
|
new_cursor.execute(sql_create)
|
|
|
|
if verbose and not debug:
|
|
|
|
print 'done.'
|
|
|
|
if not verbose and not debug:
|
|
|
|
print 'done.'
|
|
|
|
|
|
|
|
def import_songs():
|
|
|
|
global old_cursor, new_cursor, debug, verbose
|
|
|
|
if debug or verbose:
|
|
|
|
print 'Importing authors:'
|
|
|
|
else:
|
|
|
|
print 'Importing authors...',
|
|
|
|
if debug:
|
|
|
|
print '... SELECT authorid AS id, authorname AS displayname FROM authors'
|
|
|
|
elif verbose:
|
|
|
|
print '... fetching authors from old database...',
|
|
|
|
old_cursor.execute(u'SELECT authorid AS id, authorname AS displayname FROM authors')
|
|
|
|
rows = old_cursor.fetchall()
|
|
|
|
if not debug and verbose:
|
|
|
|
print 'done.'
|
|
|
|
author_map = {}
|
|
|
|
for row in rows:
|
2009-10-20 16:43:36 +00:00
|
|
|
display_name = unicode(row[1], u'cp1252')
|
2009-10-19 20:03:55 +00:00
|
|
|
names = display_name.split(u' ')
|
2009-10-19 13:57:31 +00:00
|
|
|
first_name = names[0]
|
|
|
|
last_name = u' '.join(names[1:])
|
|
|
|
if last_name is None:
|
|
|
|
last_name = u''
|
|
|
|
sql_insert = u'INSERT INTO authors '\
|
|
|
|
'(id, first_name, last_name, display_name) '\
|
2009-10-19 20:03:55 +00:00
|
|
|
'VALUES (NULL, ?, ?, ?)'
|
|
|
|
sql_params = (first_name, last_name, display_name)
|
2009-10-19 13:57:31 +00:00
|
|
|
if debug:
|
2009-10-19 20:03:55 +00:00
|
|
|
print '...', display_sql(sql_insert, sql_params)
|
2009-10-19 13:57:31 +00:00
|
|
|
elif verbose:
|
2009-10-19 20:03:55 +00:00
|
|
|
print '... importing "%s"' % display_name
|
|
|
|
new_cursor.execute(sql_insert, sql_params)
|
2009-10-19 13:57:31 +00:00
|
|
|
author_map[row[0]] = new_cursor.lastrowid
|
|
|
|
if debug:
|
|
|
|
print ' >>> authors.authorid =', row[0], 'authors.id =', author_map[row[0]]
|
|
|
|
if not verbose and not debug:
|
|
|
|
print 'done.'
|
|
|
|
if debug or verbose:
|
|
|
|
print 'Importing songs:'
|
|
|
|
else:
|
|
|
|
print 'Importing songs...',
|
|
|
|
if debug:
|
2009-10-20 16:43:36 +00:00
|
|
|
print '... SELECT songid AS id, songtitle AS title, lyrics || \'\' AS lyrics, copyrightinfo AS copyright FROM songs...',
|
2009-10-19 13:57:31 +00:00
|
|
|
elif verbose:
|
|
|
|
print '... fetching songs from old database...',
|
2009-10-20 16:43:36 +00:00
|
|
|
old_cursor.execute(u'SELECT songid AS id, songtitle AS title, lyrics || \'\' AS lyrics, copyrightinfo AS copyright FROM songs')
|
2009-10-19 13:57:31 +00:00
|
|
|
rows = old_cursor.fetchall()
|
2009-10-19 20:03:55 +00:00
|
|
|
if debug or verbose:
|
2009-10-19 13:57:31 +00:00
|
|
|
print 'done.'
|
|
|
|
song_map = {}
|
|
|
|
xml_lyrics_template = u'<?xml version="1.0" encoding="utf-8"?><song version="1.0"><lyrics language="en">%s</lyrics></song>'
|
|
|
|
xml_verse_template = u'<verse label="%d" type="Verse"><![CDATA[%s]]></verse>'
|
|
|
|
for row in rows:
|
2009-10-20 16:43:36 +00:00
|
|
|
clean_title = unicode(row[1], u'cp1252')
|
|
|
|
clean_lyrics = unicode(row[2], u'cp1252')
|
|
|
|
clean_copyright = unicode(row[3], u'cp1252')
|
|
|
|
verse_order = u''
|
2009-10-19 20:03:55 +00:00
|
|
|
text_lyrics = clean_lyrics.split(u'\n\n')
|
2009-10-20 16:43:36 +00:00
|
|
|
xml_verse = u''
|
2009-10-19 13:57:31 +00:00
|
|
|
for line, verse in enumerate(text_lyrics):
|
|
|
|
if not verse:
|
|
|
|
continue
|
2009-10-20 16:43:36 +00:00
|
|
|
xml_verse += (xml_verse_template % (line + 1, verse))
|
|
|
|
verse_order += '%d ' % (line + 1)
|
|
|
|
xml_lyrics = xml_lyrics_template % xml_verse
|
2009-10-30 20:57:44 +00:00
|
|
|
search_title = prepare_string(clean_title)
|
|
|
|
search_lyrics = prepare_string(clean_lyrics)
|
2009-10-19 13:57:31 +00:00
|
|
|
sql_insert = u'INSERT INTO songs '\
|
2009-10-20 16:54:56 +00:00
|
|
|
'(id, song_book_id, title, lyrics, verse_order, copyright, search_title, search_lyrics) '\
|
|
|
|
'VALUES (NULL, 0, ?, ?, ?, ?, ?, ?)'
|
2009-10-30 20:57:44 +00:00
|
|
|
sql_params = (clean_title, xml_lyrics, verse_order, clean_copyright, search_title, search_lyrics)
|
2009-10-19 13:57:31 +00:00
|
|
|
if debug:
|
2009-10-20 16:43:36 +00:00
|
|
|
print '...', display_sql(sql_insert, (sql_params[0], u'%s...' % clean_lyrics[:7], sql_params[2], sql_params[3], sql_params[4], u'%s...' % search_lyrics[:7]))
|
2009-10-19 13:57:31 +00:00
|
|
|
elif verbose:
|
2009-10-19 20:03:55 +00:00
|
|
|
print '... importing "%s"' % clean_title
|
|
|
|
new_cursor.execute(sql_insert, sql_params)
|
2009-10-19 13:57:31 +00:00
|
|
|
song_map[row[0]] = new_cursor.lastrowid
|
2009-10-20 16:43:36 +00:00
|
|
|
if debug:
|
|
|
|
print ' >>> songs.songid =', row[0], 'songs.id =', song_map[row[0]]
|
2009-10-19 13:57:31 +00:00
|
|
|
if not verbose and not debug:
|
|
|
|
print 'done.'
|
|
|
|
if debug or verbose:
|
|
|
|
print 'Importing song-to-author mapping:'
|
|
|
|
else:
|
|
|
|
print 'Importing song-to-author mapping...',
|
|
|
|
if debug:
|
|
|
|
print '... SELECT authorid AS author_id, songid AS song_id FROM songauthors'
|
|
|
|
elif verbose:
|
|
|
|
print '... fetching song-to-author mapping from old database...',
|
2009-10-19 20:03:55 +00:00
|
|
|
old_cursor.execute(u'SELECT authorid AS author_id, songid AS song_id FROM songauthors')
|
2009-10-19 13:57:31 +00:00
|
|
|
rows = old_cursor.fetchall()
|
|
|
|
if not debug and verbose:
|
|
|
|
print 'done.'
|
|
|
|
for row in rows:
|
|
|
|
sql_insert = u'INSERT INTO authors_songs '\
|
|
|
|
'(author_id, song_id) '\
|
2009-10-19 20:03:55 +00:00
|
|
|
'VALUES (?, ?)'
|
|
|
|
sql_params = (author_map[row[0]], song_map[row[1]])
|
2009-10-19 13:57:31 +00:00
|
|
|
if debug:
|
2009-10-19 20:03:55 +00:00
|
|
|
print '... ', display_sql(sql_insert, sql_params)
|
2009-10-19 13:57:31 +00:00
|
|
|
elif verbose:
|
|
|
|
print '... Author %d (was %d) => Song %d (was %d)'\
|
|
|
|
% (int(row[0]), author_map[row[0]],
|
|
|
|
int(row[1]), song_map[row[1]])
|
2009-10-19 20:03:55 +00:00
|
|
|
new_cursor.execute(sql_insert, sql_params)
|
2009-10-19 13:57:31 +00:00
|
|
|
if not verbose and not debug:
|
|
|
|
print 'done.'
|
|
|
|
|
|
|
|
def main(old_db, new_db):
|
|
|
|
global old_cursor, new_cursor, debug
|
|
|
|
old_connection = None
|
|
|
|
new_connection = None
|
|
|
|
try:
|
|
|
|
old_connection = sqlite.connect(old_db)
|
|
|
|
except:
|
|
|
|
if debug:
|
|
|
|
errormsg = '\n' + ''.join(get_traceback(sys.exc_info()[2]))\
|
|
|
|
+ str(sys.exc_info()[1])
|
|
|
|
else:
|
|
|
|
errormsg = sys.exc_info()[1]
|
|
|
|
print 'There was a problem connecting to the old database:', errormsg
|
|
|
|
return 1
|
|
|
|
try:
|
|
|
|
new_connection = sqlite3.connect(new_db)
|
|
|
|
except:
|
|
|
|
if debug:
|
|
|
|
errormsg = '\n' + ''.join(get_traceback(sys.exc_info()[2]))\
|
|
|
|
+ str(sys.exc_info()[1])
|
|
|
|
else:
|
|
|
|
errormsg = sys.exc_info()[1]
|
|
|
|
print 'There was a problem creating the new database:', errormsg
|
|
|
|
return 1
|
|
|
|
old_cursor = old_connection.cursor()
|
|
|
|
new_cursor = new_connection.cursor()
|
|
|
|
try:
|
|
|
|
create_database()
|
|
|
|
except:
|
|
|
|
if debug:
|
|
|
|
errormsg = '\n' + ''.join(get_traceback(sys.exc_info()[2]))\
|
|
|
|
+ str(sys.exc_info()[1])
|
|
|
|
else:
|
|
|
|
errormsg = sys.exc_info()[1]
|
|
|
|
print 'There was a problem creating the database:', errormsg
|
|
|
|
return 1
|
|
|
|
try:
|
|
|
|
import_songs()
|
|
|
|
new_connection.commit()
|
|
|
|
except:
|
|
|
|
new_connection.rollback()
|
|
|
|
if debug:
|
|
|
|
errormsg = '\n' + ''.join(get_traceback(sys.exc_info()[2]))\
|
|
|
|
+ str(sys.exc_info()[1])
|
|
|
|
else:
|
|
|
|
errormsg = sys.exc_info()[1]
|
|
|
|
print 'There was a problem importing songs:', errormsg
|
|
|
|
return 1
|
|
|
|
print 'Import complete.'
|
|
|
|
|
|
|
|
if __name__ == u'__main__':
|
|
|
|
option_parser = OptionParser(usage='Usage: %prog [options] OLDDATABASE NEWDATABASE')
|
|
|
|
option_parser.add_option('-o', '--overwrite', dest='overwrite', default=False,
|
|
|
|
action=u'store_true', help='Overwrite database file if it already exists.')
|
|
|
|
option_parser.add_option('-v', '--verbose', dest='verbose', default=False,
|
|
|
|
action=u'store_true', help='Outputs additional progress data.')
|
|
|
|
option_parser.add_option('-d', '--debug', dest='debug', default=False,
|
|
|
|
action=u'store_true', help='Outputs raw SQL statements (overrides verbose).')
|
|
|
|
options, arguments = option_parser.parse_args()
|
|
|
|
if len(arguments) < 2:
|
|
|
|
if len(arguments) == 0:
|
|
|
|
option_parser.error('Please specify an old database and a new database.')
|
|
|
|
else:
|
|
|
|
option_parser.error('Please specify a new database.')
|
|
|
|
old_db = os.path.abspath(arguments[0])
|
|
|
|
new_db = os.path.abspath(arguments[1])
|
|
|
|
if not os.path.isfile(old_db):
|
|
|
|
option_parser.error('Old database file ("%s") is not a file.' % old_db)
|
|
|
|
if not os.path.exists(old_db):
|
|
|
|
option_parser.error('Old database file ("%s") does not exist.' % old_db)
|
|
|
|
if os.path.exists(new_db):
|
|
|
|
if not options.overwrite:
|
|
|
|
option_parser.error('New database file ("%s") exists. If you want to overwrite it, specify the --overwrite option.' % new_db)
|
|
|
|
else:
|
|
|
|
if not os.path.isfile(new_db):
|
|
|
|
option_parser.error('New database file ("%s") is not a file.' % new_db)
|
|
|
|
os.unlink(new_db)
|
|
|
|
verbose = options.verbose
|
|
|
|
debug = options.debug
|
2009-12-31 12:52:01 +00:00
|
|
|
main(old_db, new_db)
|