-require 'author'
-require 'classification'
-require 'cover'
-require 'store'
+require_relative 'author'
+require_relative 'classification'
+require_relative 'cover'
+require_relative 'store'
+ @@SERIES_AND_VOLUME_REGEX = /^([A-Z]+)([0-9]+(\.[0-9]+)?)$/
+
+ attr_accessor :arrived
+ attr_accessor :author
+ attr_accessor :classification_id
+ attr_accessor :cover
+ attr_accessor :description
+ attr_accessor :language
+ attr_accessor :path
+ attr_accessor :series_id
+ attr_accessor :title
+ attr_accessor :volume
- def description
- @description
- end
+ '\'",!#'.split('').each do |c|
+ result = result.gsub(c, '-')
+ end
+ result = result.gsub(/: */, '--')
+ result = result.gsub(' ', '_')
+ bare_title_grouping = title_grouping
+ .split('_')
+ .reject { |part| part.match(@@SERIES_AND_VOLUME_REGEX) }
+ .join('_')
+
+ unless bare_title_grouping == Book.grouping_for_title(title)
+ puts "WARNING: title_grouping mismatch: #{bare_title_grouping.inspect} vs. #{Book.grouping_for_title(title).inspect}"
+ end
+
@classification_id = @store.find_classification(@author.grouping, File.basename(file_name, '.*'))
# TODO: Fix horrible hard-coded strings and paths
if ('01_nonfic' == category) && (nil == classification_id)
open(Store.unclassified_csv, 'a') do |fd|
fd.puts('"' + grouping.to_s + '","' + path + '"')
@classification_id = @store.find_classification(@author.grouping, File.basename(file_name, '.*'))
# TODO: Fix horrible hard-coded strings and paths
if ('01_nonfic' == category) && (nil == classification_id)
open(Store.unclassified_csv, 'a') do |fd|
fd.puts('"' + grouping.to_s + '","' + path + '"')
descrNodes = opfDoc.css('dc|description', 'dc' => @@DC_NS_URL)
if (descrNodes.length > 0)
descrNode = descrNodes[0]
descrNodes = opfDoc.css('dc|description', 'dc' => @@DC_NS_URL)
if (descrNodes.length > 0)
descrNode = descrNodes[0]
+ #---------------------------------------
+ # Language
+
+ langNodes = opfDoc.css('dc|language', 'dc' => @@DC_NS_URL)
+ if (langNodes.length > 0)
+ langNode = langNodes[0]
+ if langNode
+ @language = langNode.content
+ end
+ end
+
#---------------------------------------
# Other metadata: series, volume, cover
#---------------------------------------
# Other metadata: series, volume, cover
+ unless entry
+ # Another case found in the wild: cover image is at the root, but path is '../cover.jpeg'
+ if href.start_with? '../'
+ coverPath = href[3..-1]
+ entry = zipfile.find_entry(coverPath)
+ end
+ end
+