-require './author.rb'
+require 'nokogiri'
+require 'zip'
+
+require 'author'
+require 'cover'
class Book
def initialize(fileName)
return false
end
+ #puts "Filename: " + fileName.to_s
lowerName = fileName.downcase()
if lowerName.end_with?(".epub")
return false
end
+ def cover
+ return @cover
+ end
+
+ def describe
+ result = []
+
+ if nil != @title
+ result.push('<b>' + @title + '</b>')
+ else
+ result.push('<i>(Unknown title)</i>')
+ end
+ if nil != @author
+ result.push(@author.to_s())
+ end
+
+ seriesInfo = []
+ if nil != @series
+ seriesInfo.push(@series.to_s)
+ end
+ if nil != @volume
+ seriesInfo.push(@volume.to_s)
+ end
+ if seriesInfo.length > 0
+ result.push(seriesInfo.join(' '))
+ end
+
+ return result.join('<br/>')
+ end
+
def inspect
data = []
if nil != @author
- data.push('author="' + @author + '"')
+ data.push('author="' + @author.to_s + '"')
end
if nil != @series
data.push('series="' + @series + '"')
if nil != @title
data.push('title="' + @title + '"')
end
+ if nil != @cover
+ data.push(@cover.inspect())
+ end
if nil != @path
data.push('path="' + @path + '"')
end
return '(Book:' + data.join(',') + ')'
end
+ def path
+ @path
+ end
+
# String form of the object: identical to what #inspect returns.
def to_s
  inspect
end
if parts.length > 1
@author = massageAuthor(parts[-2])
end
+
+ if fileName.downcase.end_with?(".epub")
+ scanEpub!(fileName)
+ end
+ end
+
+ protected
+ def scanEpub!(fileName)
+ #puts 'Scanning "' + fileName.to_s + '"...'
+ begin
+ Zip::File.open(fileName) do |zipfile|
+ entry = zipfile.find_entry('META-INF/container.xml')
+ if nil == entry
+ return
+ end
+ contXml = zipfile.read('META-INF/container.xml')
+ contDoc = Nokogiri::XML(contXml)
+ opfPath = contDoc.css("container rootfiles rootfile")[0]['full-path']
+
+ scanOpf!(zipfile, opfPath)
+ end
+ rescue Zip::Error => exc
+ puts 'ERROR processing file "' + fileName + '":'
+ puts exc.message
+ puts exc.backtrace
+ end
+ end
+
+ protected
+ def scanOpf!(zipfile, opfPath)
+ coverId = nil
+
+ opfXml = zipfile.read(opfPath)
+ opfDoc = Nokogiri::XML(opfXml)
+
+ #-------
+ # Author
+
+ creator = opfDoc.css('dc|creator', 'dc' => 'http://purl.org/dc/elements/1.1/')
+ if (nil != creator) and (creator.length > 0)
+ roleNode = creator.attr('role')
+ if nil != roleNode
+ role = roleNode.value
+ if ('aut' == role) and (creator.children.length > 0) and (nil != creator.children[0])
+ name = creator.children[0].content
+ parts = name.split(' ')
+ if parts.length > 1
+ surname = parts[-1]
+ givenNames = parts[0..-2].join(' ')
+ @author = Author.new(surname, givenNames)
+ else
+ @author = Author.new(name, '')
+ end
+ end
+ end
+ end
+
+ #---------------------------------------
+ # Other metadata: series, volume, cover
+
+ metas = opfDoc.css('package metadata meta')
+ for m in metas
+ name = m['name']
+ content = m['content']
+
+ if 'calibre:series' == name
+ @series = content
+ elsif 'calibre:series-index' == name
+ @volume = content
+ elsif 'cover' == name
+ coverId = content
+ end
+ end
+
+ #---------------
+ # Load the cover
+
+ @cover = loadCover(zipfile, opfPath, opfDoc, coverId)
+ end
+
+ protected
+ def loadCover(zipfile, opfPath, opfDoc, coverId)
+ coverFile = nil
+ if nil == coverId
+ coverId = "cover-image"
+ end
+
+ items = opfDoc.css('package manifest item')
+ for i in items
+ href = i['href']
+ id = i['id']
+ mimeType = i['media-type']
+
+ if coverId == id
+ entry = zipfile.find_entry(href)
+
+ if nil == entry
+ # Although the epub standard requires the path to be relative
+ # to the base of the epub (zip), some books encountered in the
+ # wild have been found to use a bath relative to the location
+ # of the opf file.
+ parts = opfPath.split('/')
+ opfBasePath = opfPath.split('/')[0..-2].join('/')
+ coverPath = opfBasePath + '/' + href
+ entry = zipfile.find_entry(coverPath)
+ end
+
+ if nil == entry
+ puts 'WARNING! Cover image "' + href + '" not found in file "' + @path + '".'
+ return nil
+ else
+ entry.get_input_stream() do |is|
+ return Cover.new(is, href, mimeType)
+ end
+ end
+ end
+ end
+ return nil
end
end
+