X-Git-Url: http://jaekl.net/gitweb/?p=quanlib.git;a=blobdiff_plain;f=store.rb;h=92d1ce57d1917ea7309d86527fa96f5aa826581e;hp=660fc80bb64464fcb9aa20e18aa4c9a797666294;hb=HEAD;hpb=2c6d69af97c152524366d3fefe1808dfb78f8f56 diff --git a/store.rb b/store.rb index 660fc80..1a33ca3 100644 --- a/store.rb +++ b/store.rb @@ -1,26 +1,39 @@ require 'csv' require 'fileutils' +require 'inifile' require 'pg' -require 'series' +require_relative 'series' +require_relative 'tconn' class Store - def initialize - @basepath = '/arc/quanlib' # TODO: FIXME: configure this in a sane way + def unclassified_csv + @basePath + '/csv/unclassified.csv' + end + + def initialize(config_file) @conn = nil - #@dburl = 'dbi:Pg:quanlib:localhost' - @dbhost = "localhost" + config = IniFile.load(config_file) + if nil == config + puts 'FATAL: Failed to load config file "' + config_file + '". Aborting initialization.' + return + end + + section = config['database'] + @dbhost = section['host'] @dbport = 5432 - @dbname = 'quanlib' - @dbuser = 'quanlib' - @dbpass = 'quanlib' + @dbname = section['name'] + @dbuser = section['user'] + @dbpass = section['pass'] + + section = config['filesystem'] + @basePath = section['basePath'] end def connect - # @conn = PGconn.connect('localhost', 5432, '', '', 'quanlib', 'quanlib', 'quanlib') - @conn = PG.connect('localhost', 5432, '', '', 'quanlib', 'quanlib', 'quanlib') + @conn = TimedConn.new(PG.connect(@dbhost, @dbport, '', '', @dbname, @dbuser, @dbpass)) return @conn end @@ -35,24 +48,34 @@ class Store return path, name end - def create_schema - create_authors = + def cross_reference_lists +puts "@@@@@@@@@@@ CROSS-REF START @@@@@@@@@@@" + exec_update("TRUNCATE TABLE Lists CASCADE;", []) + + populate_lists_table +puts "@@@@@@@@@@@ CROSS-REF DONE @@@@@@@@@@@" + end + + def create_schema(skip_class) + create_authors = < 0 return rs[0]['id'] end end + return nil end - def init_db + def init_db(skip_class) sql = "SELECT 1 FROM pg_tables WHERE tableowner='quanlib' AND tablename='books'" found = false @conn.exec(sql).each do |row| @@ -180,12 +252,11 @@ EOS end if ! found - create_schema() + create_schema(skip_class) end end def load_author(id) - #puts 'DEBUG: load_author(' + id + ')' sqlSelect = "SELECT grouping, reading, sort FROM Authors WHERE id=$1" args = [id] @conn.exec_params(sqlSelect, args) do |rs| @@ -194,10 +265,8 @@ EOS end row = rs[0] author = Author.new(row['grouping'], row['reading'], row['sort']) - #puts 'DEBUG: author: ' + author.inspect() return author end - #puts 'DEBUG: NOT FOUND' return nil end @@ -207,7 +276,7 @@ EOS id = next_id('author_id') sqlInsert = "INSERT INTO Authors(id, grouping, reading, sort) VALUES ($1, $2, $3, $4);" args = [id, author.grouping, author.reading_order, author.sort_order] - begin + begin rs = @conn.exec_params(sqlInsert, args) rescue Exception => e puts sqlInsert + ": " + args.inspect() @@ -221,8 +290,7 @@ EOS end def load_book(id) - #puts 'DEBUG: load_book(' + id + ')' - sql = "SELECT author, classification, cover, description, path, series, title, volume FROM Books WHERE id=$1;" + sql = "SELECT author, classification, cover, description, language, path, series, title, volume FROM Books WHERE id=$1;" book = nil begin @@ -238,36 +306,36 @@ EOS book.classification_id = row['classification'] book.cover = load_cover(row['cover']) book.description = row['description'] + book.language = row['language'] book.path = row['path'] book.series_id = row['series'] book.title = row['title'] book.volume = row['volume'] - end + end rescue Exception => e puts sql + ": " + id puts e.message puts $@ end - #puts 'DEBUG: loaded book: ' + book.inspect() return book end def store_book(book) - sql = "INSERT INTO Books (id, author, classification, cover, description, path, series, title, volume) VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9);" + sql = "INSERT INTO Books (id, arrived, author, classification, cover, description, language, path, series, title, volume) VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9, $10, $11);" book_id = next_id('book_id') author_id = store_author(book.author) (efs_id, mime_type) = store_cover(book) - args = [book_id, author_id, book.classification_id, efs_id, book.description(), book.path(), book.series_id(), book.title(), book.volume()] + args = [book_id, book.arrived, author_id, book.classification_id, efs_id, book.description, book.language, book.path, book.series_id, book.title, book.volume] begin rs = @conn.exec_params(sql, args) rescue Exception => e puts sql + ": " + args.inspect() - puts e.message + puts e.message puts $@ ensure rs.clear if rs @@ -277,15 +345,34 @@ EOS end def find_classification(author_grouping, title_grouping) - #puts 'find_classification("' + author_grouping.inspect + '", "' + title_grouping.inspect + '")...' sql = "SELECT id FROM Classifications WHERE author_grouping = $1 AND title_grouping = $2;" @conn.exec_params(sql, [author_grouping, title_grouping]) do |rs| if rs.ntuples > 0 - #puts ' --> ' + rs[0]['id'].inspect return rs[0]['id'] end end - #puts ' --> NIL' + return nil + end + + def load_classification(id) + sql = "SELECT ddc, lcc, author_grouping, author_sort, title_grouping, title " + sql += " FROM Classifications WHERE id=$1" + @conn.exec_params(sql, [id]) do |rs| + if rs.ntuples > 0 + row = rs[0] + ddc = row['ddc'] + lcc = row['lcc'] + author_grouping = row['author_grouping'] + author = row['author_sort'] + title_grouping = row['title_grouping'] + title = row['title'] + + result = Classification.new(ddc, lcc, author_grouping, author, title_grouping, title) + result.id = id + return result + end + end + return nil end @@ -306,15 +393,9 @@ EOS (efspath, efsname) = construct_efs_path(id) - fullpath = @basepath + '/efs/' + efspath + '/' + efsname + fullpath = @basePath + '/efs/' + efspath + '/' + efsname return Cover.new(nil, fullpath, mime_type) - - #File.open(fullpath, 'rb') do |is| - # return Cover.new(is, fullpath, mime_type) - #end - # - #return nil end def store_cover(book) @@ -335,7 +416,7 @@ EOS (efspath, efsname) = construct_efs_path(efs_id) - efspath = @basepath + '/efs/' + efspath + efspath = @basePath + '/efs/' + efspath FileUtils.mkdir_p(efspath) @@ -351,7 +432,7 @@ EOS ensure rs.clear if rs end - + return efs_id, mimetype end @@ -381,7 +462,7 @@ EOS id = nil @conn.exec("SELECT nextval('" + seq_name + "');") do |rs| id = rs[0]['nextval'] - end + end return id end @@ -422,7 +503,7 @@ EOS def populate_classifications_table puts "Populating the Classifications table..." first = true - CSV.foreach(@basepath + '/csv/class.csv') do |row| + CSV.foreach(@basePath + '/csv/class.csv') do |row| if first # skip the header row first = false @@ -437,7 +518,7 @@ EOS author_sort = row[3] title_grouping = row[4] title = row[5] - + sqlInsert = "INSERT INTO Classifications (id, ddc, lcc, author_grouping, author_sort, title_grouping, title) VALUES ($1, $2, $3, $4, $5, $6, $7);" args = [id, ddc, lcc, author_grouping, author_sort, title_grouping, title] exec_update(sqlInsert, args) @@ -448,7 +529,7 @@ EOS input = row[6] if input.length > 0 fast = input.split(';') - end + end fast.each do |fast_id| sqlInsert = "INSERT INTO FAST_Classifications (fast, classification) VALUES ($1, $2);" @@ -462,7 +543,7 @@ EOS def populate_fast_table puts "Populating the FAST table..." first = true - CSV.foreach(@basepath + '/csv/fast.csv') do |row| + CSV.foreach(@basePath + '/csv/fast.csv') do |row| if first first = false # skip the header row else @@ -474,9 +555,53 @@ EOS end end + def populate_lists_table + puts "Populating the Lists table..." + + CSV.foreach(@basePath + "/csv/lists.csv", headers: true) do |row| + author_ids = find_all_authors(row['author']) + if author_ids.empty? + specification = [row['age'], row['category'], row['code'], row['year'], row['author'], row['title']] + .map { |x| x.inspect } + .join(', ') + + puts "WARNING: For list entry (#{specification}), no such author was found." + + next + end + + sqlInsert = %Q( + INSERT INTO Lists (id, age, category, code, year, author, title) + VALUES ($1, $2, $3, $4, $5, $6, $7); + ) + author_ids.each do |author_id| + list_id = next_id('list_id') + args = [list_id, row['age'], row['category'], row['code'], row['year'], author_id, row['title']] + exec_update(sqlInsert, args) + + update_lists_books_table(list_id, author_id, row['title']) + end + end + end + + # Scan for books that match this Lists entry, and add any matches to the Lists_Books associative table + def update_lists_books_table(list_id, author_id, title) + title_pattern = Book.grouping_for_title(title).gsub('_', '%') + sqlSelect = "SELECT id FROM Books WHERE author = $1 AND title LIKE $2;" + args = [author_id, title_pattern] + + @conn.exec_params(sqlSelect, args) do |rs| + rs.each do |row| + sqlInsert = "INSERT INTO Lists_Books (list, book) VALUES ($1, $2)" + args = [list_id, row['id']] + exec_update(sqlInsert, args) + end + end + end + def populate_series_table puts "Populating the Series table..." - CSV.foreach(@basepath + '/csv/series.csv') do |row| + CSV.foreach(@basePath + '/csv/series.csv') do |row| id = next_id('series_id') sqlInsert = "INSERT INTO Series (id, age, genre, grouping, code, descr) VALUES ($1, $2, $3, $4, $5, $6);" args = [id] + row @@ -485,21 +610,21 @@ EOS end def query_books_by_author(pattern) - sql = + sql = <