Changes to OPF spine to not duplicate idrefs for documents with parts not at the...

author Keith Fahlgren <abdelazer@users.sourceforge.net>

Fri, 30 May 2008 17:20:11 +0000 (17:20 +0000)

committer Keith Fahlgren <abdelazer@users.sourceforge.net>

Fri, 30 May 2008 17:20:11 +0000 (17:20 +0000)
author Keith Fahlgren <abdelazer@users.sourceforge.net>
Fri, 30 May 2008 17:20:11 +0000 (17:20 +0000)
committer Keith Fahlgren <abdelazer@users.sourceforge.net>
Fri, 30 May 2008 17:20:11 +0000 (17:20 +0000)
diff --git a/xsl/epub/bin/dbtoepub b/xsl/epub/bin/dbtoepub

old mode 100644 (file)

new mode 100755 (executable)

index 111b61c..7de2be7
--- a/xsl/epub/bin/dbtoepub
+++ b/xsl/epub/bin/dbtoepub
@@ -1,10 +1,21 @@
  #!/usr/bin/env ruby
+# This program converts DocBook documents into .epub files.
+# 
+# Usage: dbtoepub [OPTIONS] [DocBook Files]
+#
+# .epub is defined by the IDPF at www.idpf.org and is made up of 3 standards:
+# - Open Publication Structure (OPS)
+# - Open Packaging Format (OPF) 
+# - Open Container Format (OCF)
+#
+# Specific options:
+#     -d, --debug                      Show debugging output.
+#     -h, --help                       Display usage info
+#     -v, --verbose                    Make output verbose
+
  lib = File.expand_path(File.join(File.dirname(__FILE__), 'lib'))
  $LOAD_PATH.unshift(lib) if File.exist?(lib)
  
-# Keith Fahlgren
-# Sat Feb 23 17:22:35 PST 2008
-
  require 'optparse'
  
  require 'docbook'
diff --git a/xsl/epub/bin/lib/docbook.rb b/xsl/epub/bin/lib/docbook.rb

index de45eca848fa1ddaedce60a28a274c84a449ea92..423e3eafe46a399f2b7950d42119f5238fb26294 100755 (executable)
--- a/xsl/epub/bin/lib/docbook.rb
+++ b/xsl/epub/bin/lib/docbook.rb
@@ -37,7 +37,7 @@ module DocBook
      end
  
      def self.invalid?(file)
-      # obnoxiously, we can't just check for a non-zero output...
+      # Obnoxiously, we can't just check for a non-zero output...
        cmd = "#{CHECKER} #{file}"
        output = `#{cmd} 2>&1`
  
@@ -69,12 +69,12 @@ module DocBook
  
      def bundle_epub(output_file, verbose)  
        quiet = verbose ? "" : "-q"
-      # zip -X -r ../book.epub mimetype META-INF OEBPS
        mimetype_filename = write_mimetype()
        meta  = File.basename(@meta_dir)
        oebps  = File.basename(@oebps_dir)
        images = copy_images()
        callouts = copy_callouts()
+      # zip -X -r ../book.epub mimetype META-INF OEBPS
        zip_cmd = "cd #{@output_dir} &&  #{ZIPPER} #{quiet} -X -r  #{File.expand_path(output_file)} #{mimetype_filename} #{meta} #{oebps}"
        puts zip_cmd if $DEBUG
        success = system(zip_cmd)
diff --git a/xsl/epub/bin/spec/epub_realbook_spec.rb b/xsl/epub/bin/spec/epub_realbook_spec.rb

index e893504acc99c5e5d723b7d6471101104ad24b5f..2b1d7433dae4046990ba6656e2e27d00ba2e3e66 100755 (executable)
--- a/xsl/epub/bin/spec/epub_realbook_spec.rb
+++ b/xsl/epub/bin/spec/epub_realbook_spec.rb
@@ -6,8 +6,8 @@ require 'spec/spec_helper'
  lib = File.expand_path(File.join(File.dirname(__FILE__), '..', 'lib'))
  $LOAD_PATH.unshift(lib) if File.exist?(lib)
  
-require 'tmpdir'
  require 'fileutils'
+require 'tmpdir'
  
  require 'rubygems'
  require 'spec'
diff --git a/xsl/epub/bin/spec/epub_regressions_spec.rb b/xsl/epub/bin/spec/epub_regressions_spec.rb

new file mode 100755 (executable)

index 0000000..1d1ed13
--- /dev/null
+++ b/xsl/epub/bin/spec/epub_regressions_spec.rb
@@ -0,0 +1,47 @@
+#!/usr/bin/env ruby
+spec = File.expand_path(File.dirname(__FILE__))
+$LOAD_PATH.unshift(spec) if File.exist?(spec)
+require 'spec/spec_helper'
+
+lib = File.expand_path(File.join(File.dirname(__FILE__), '..', 'lib'))
+$LOAD_PATH.unshift(lib) if File.exist?(lib)
+
+require 'fileutils'
+require 'rexml/document'
+require 'tmpdir'
+
+require 'rubygems'
+require 'spec'
+
+require 'docbook'
+
+$DEBUG = false
+
+describe DocBook::Epub do
+  before(:all) do
+    @filedir = File.expand_path(File.join(File.dirname(__FILE__), 'files'))
+    @testdocsdir = File.expand_path(File.join(File.dirname(__FILE__), 'testdocs'))
+    @tmpdir = File.join(Dir::tmpdir(), "epubregressions"); Dir.mkdir(@tmpdir) rescue Errno::EEXIST
+  end
+
+  it "should not include two <itemref>s to the contents of <part>s in the OPF file" do
+    part_file = File.join(@testdocsdir, "subtitle.001.xml") 
+    epub_file = File.join(@tmpdir, File.basename(part_file, ".xml") + ".epub")
+    part_epub = DocBook::Epub.new(part_file, @tmpdir)
+    part_epub.render_to_file(epub_file, $DEBUG)
+
+    FileUtils.copy(epub_file, "./.t.epub") if $DEBUG
+
+    itemref_tmpdir = File.join(Dir::tmpdir(), "epubitemref"); Dir.mkdir(itemref_tmpdir) rescue Errno::EEXIST
+    system("unzip -q -o -d #{itemref_tmpdir} #{epub_file}")
+    opf_file = File.join(itemref_tmpdir, "OEBPS", "content.opf")
+    opf = REXML::Document.new(File.new(opf_file))
+
+    itemrefs = REXML::XPath.match(opf, "//itemref").map {|e| e.attributes['idref']}
+    itemrefs.should == itemrefs.uniq
+  end
+
+  after(:all) do
+    FileUtils.rm_r(@tmpdir, :force => true)
+  end  
+end
diff --git a/xsl/epub/bin/spec/epub_small_smoketest.rb b/xsl/epub/bin/spec/epub_small_smoketest.rb

index 5ea0f1a62041449db4eda283cbb3722d68753ffe..28dd78748ba362cd4632f7001e370bba746e8ab2 100755 (executable)
--- a/xsl/epub/bin/spec/epub_small_smoketest.rb
+++ b/xsl/epub/bin/spec/epub_small_smoketest.rb
@@ -14,7 +14,7 @@ require 'spec'
  
  require 'docbook'
  
-$DEBUG = true
+$DEBUG = false
  
  TESTDOCSDIR = File.expand_path(File.join(File.dirname(__FILE__), 'testdocs'))
  NUMBER_TO_TEST = 15
@@ -25,10 +25,7 @@ describe DocBook::Epub do
      @tmpdir = File.join(Dir::tmpdir(), "epubspecsmoke"); Dir.mkdir(@tmpdir) rescue Errno::EEXIST
    end
  
-  # TODO olink, index, cmdsynopsis, refentry, table
-
-  Dir["#{TESTDOCSDIR}/programlisting*.006.xml"].sort_by { rand }[0..(NUMBER_TO_TEST-1)].each do |xml_file|
-  #Dir["#{TESTDOCSDIR}/*.[0-9][0-9][0-9].xml"].sort_by { rand }[0..(NUMBER_TO_TEST-1)].each do |xml_file|
+  Dir["#{TESTDOCSDIR}/*.[0-9][0-9][0-9].xml"].sort_by { rand }[0..(NUMBER_TO_TEST-1)].each do |xml_file|
      it "should be able to render a valid .epub for the test document #{xml_file}" do
        epub = DocBook::Epub.new(xml_file, @tmpdir)
        epub_file = File.join(@tmpdir, File.basename(xml_file, ".xml") + ".epub")
diff --git a/xsl/epub/bin/spec/epub_smoketest_spec.rb b/xsl/epub/bin/spec/epub_smoketest_spec.rb

index 7c39f7f58306ac6219090899fa4f4c9bfd1cda2b..6efad0d00375cfa3650a2054a3cf3b11a4ab0251 100755 (executable)
--- a/xsl/epub/bin/spec/epub_smoketest_spec.rb
+++ b/xsl/epub/bin/spec/epub_smoketest_spec.rb
@@ -25,6 +25,26 @@ describe DocBook::Epub do
      @tmpdir = File.join(Dir::tmpdir(), "epubspecsmoke"); Dir.mkdir(@tmpdir) rescue Errno::EEXIST
    end
  
+  # TODO 
+  # Known failures on all of:
+  #  calloutlist.003.xml
+  #  extensions.00[24].xml
+  #  programlisting.00[26].xml 
+  #  olink.*.xml
+  #  cmdsynopsis.002.xml
+  #  refentry.007.xml
+  #  programlistingco.002.xml
+  #  textobject.*.xml
+  #
+  # The causes of the failures are typically missing extensions in xsltproc
+  # (specifically insertfile, for textdata, imagedata, graphic, or inlinegraphic
+  # text/XML @filerefs), invalid XHTML 1.1 (block elements inside inlines that 
+  # I don't feel like fixing because I think they're edge cases), callouts 
+  # (which are hard in .epub), or test docs I really don't think are cromulent.
+  
+  # Current pass rate:
+  #   224 examples, 12 failures (94.6%)
+
    Dir["#{TESTDOCSDIR}/[a-z]*.[0-9][0-9][0-9].xml"].each_with_index do |xml_file, ix|
      it "should be able to render a valid .epub for the test document #{xml_file} [#{ix}]" do
        epub = DocBook::Epub.new(xml_file, @tmpdir)
diff --git a/xsl/epub/docbook.xsl b/xsl/epub/docbook.xsl

index c7b5462c1b6307ba0a46a1c0a0ffaffc6c3b2b27..020e6910977acd819726a96bbe32a1e86a896be6 100644 (file)
--- a/xsl/epub/docbook.xsl
+++ b/xsl/epub/docbook.xsl
@@ -24,12 +24,13 @@
    </xsl:param>
  
    <xsl:param name="ade.extensions" select="0"/>
-  <xsl:param name="epub.autolabel" select="'1'"/> <!-- TODO: Document this in params -->
-  <xsl:param name="manifest.in.base.dir" select="'1'"/> <!-- TODO: Document this in params; is '1' correct? -->
+  <xsl:param name="epub.autolabel" select="'1'"/> 
  
-  <xsl:param name="epub.oebps.dir" select="'OEBPS/'"/> 
+
+  <xsl:param name="manifest.in.base.dir" select="'1'"/> 
    <xsl:param name="base.dir" select="$epub.oebps.dir"/>
  
+  <xsl:param name="epub.oebps.dir" select="'OEBPS/'"/> 
    <xsl:param name="epub.ncx.filename" select="'toc.ncx'"/> 
    <xsl:param name="epub.container.filename" select="'container.xml'"/> 
    <xsl:param name="epub.opf.filename" select="concat($epub.oebps.dir, 'content.opf')"/> 
@@ -41,7 +42,6 @@
    <xsl:param name="epub.html.toc.id">htmltoc</xsl:param>
    <xsl:param name="epub.metainf.dir" select="'META-INF/'"/> 
  
-
    <!-- Per Bob Stayton:
         """Process your documents with the css.decoration parameter set to zero. 
            That will avoid the use of style attributes in XHTML elements where they are not permitted."""
@@ -361,7 +361,7 @@
              </xsl:when>
              <xsl:otherwise>
                <xsl:variable name="title">
-                <xsl:if test="$epub.autolabel=1">
+                <xsl:if test="$epub.autolabel != 0">
                    <xsl:variable name="label.markup">
                      <xsl:apply-templates select="/*" mode="label.markup" />
                    </xsl:variable>
@@ -423,7 +423,7 @@
                  mode="ncx">
      <xsl:variable name="depth" select="count(ancestor::*)"/>
      <xsl:variable name="title">
-      <xsl:if test="$epub.autolabel=1">
+      <xsl:if test="$epub.autolabel != 0">
          <xsl:variable name="label.markup">
            <xsl:apply-templates select="." mode="label.markup" />
          </xsl:variable>
@@ -596,12 +596,14 @@
        </xsl:if>  
  
        <!-- TODO: be nice to have a idref="titlepage" here -->
-      <xsl:if test="$root.is.a.chunk != '0'">
-
-        <xsl:apply-templates select="/*" mode="opf.spine"/>
-      </xsl:if>
-      <xsl:apply-templates select="/*/*|
-                                   /*/part/*" mode="opf.spine"/>
+      <xsl:choose>
+        <xsl:when test="$root.is.a.chunk != '0'">
+          <xsl:apply-templates select="/*" mode="opf.spine"/>
+        </xsl:when>
+        <xsl:otherwise>
+          <xsl:apply-templates select="/*/*" mode="opf.spine"/>
+        </xsl:otherwise>
+      </xsl:choose>
                                     
      </xsl:element>
    </xsl:template>
@@ -778,7 +780,7 @@
  
    <xsl:template match="mediaobjectco"
                  mode="opf.manifest">
-    <xsl:message>Warning: mediaobjectco almost certain will not render as expected in .epub </xsl:message>
+    <xsl:message>Warning: mediaobjectco almost certainly will not render as expected in .epub!</xsl:message>
      <xsl:apply-templates select="imageobjectco/imageobject/imagedata" 
                           mode="opf.manifest"/>              
    </xsl:template>
@@ -1321,4 +1323,8 @@
      <xsl:value-of select="$html.ext"/>
    </xsl:template>
  
+  <xsl:template match="bibliodiv" mode="label.markup">
+  </xsl:template>
+
+
  </xsl:stylesheet>
author	Keith Fahlgren <abdelazer@users.sourceforge.net>
	Fri, 30 May 2008 17:20:11 +0000 (17:20 +0000)
committer	Keith Fahlgren <abdelazer@users.sourceforge.net>
	Fri, 30 May 2008 17:20:11 +0000 (17:20 +0000)
xsl/epub/bin/dbtoepub	[changed mode: 0644->0755]	patch \| blob \| history
xsl/epub/bin/lib/docbook.rb		patch \| blob \| history
xsl/epub/bin/spec/epub_realbook_spec.rb		patch \| blob \| history
xsl/epub/bin/spec/epub_regressions_spec.rb	[new file with mode: 0755]	patch \| blob
xsl/epub/bin/spec/epub_small_smoketest.rb		patch \| blob \| history
xsl/epub/bin/spec/epub_smoketest_spec.rb		patch \| blob \| history
xsl/epub/docbook.xsl		patch \| blob \| history