diff --git a/epub.js b/epub.js index 5adbf35..aa9cb3b 100644 --- a/epub.js +++ b/epub.js @@ -1,6 +1,5 @@ var xml2js = require('xml2js'); var xml2jsOptions = xml2js.defaults['0.1']; -var util = require('util'); var EventEmitter = require('events').EventEmitter; try { @@ -53,717 +52,719 @@ try { * * /images/logo_img/OPT/logo.jpg **/ -function EPub(fname, imageroot, linkroot) { - EventEmitter.call(this); - this.filename = fname; - - this.imageroot = (imageroot || "/images/").trim(); - this.linkroot = (linkroot || "/links/").trim(); - - if (this.imageroot.substr(-1) != "/") { - this.imageroot += "/"; - } - if (this.linkroot.substr(-1) != "/") { - this.linkroot += "/"; - } -} -util.inherits(EPub, EventEmitter); - -/** - * EPub#parse() -> undefined - * - * Starts the parser, needs to be called by the script - **/ -EPub.prototype.parse = function () { - - this.containerFile = false; - this.mimeFile = false; - this.rootFile = false; - - this.metadata = {}; - this.manifest = {}; - this.spine = {toc: false, contents: []}; - this.flow = []; - this.toc = []; - - this.open(); -}; - -/** - * EPub#open() -> undefined - * - * Opens the epub file with Zip unpacker, retrieves file listing - * and runs mime type check - **/ -EPub.prototype.open = function () { - try { - this.zip = new ZipFile(this.filename); - } catch (E) { - this.emit("error", new Error("Invalid/missing file")); - return; - } - - if (!this.zip.names || !this.zip.names.length) { - this.emit("error", new Error("No files in archive")); - return; - } - - this.checkMimeType(); -}; - -/** - * EPub#checkMimeType() -> undefined - * - * Checks if there's a file called "mimetype" and that it's contents - * are "application/epub+zip". On success runs root file check. - **/ -EPub.prototype.checkMimeType = function () { - var i, len; - - for (i = 0, len = this.zip.names.length; i < len; i++) { - if (this.zip.names[i].toLowerCase() == "mimetype") { - this.mimeFile = this.zip.names[i]; - break; +class EPub extends EventEmitter { + constructor(fname, imageroot, linkroot) { + super(); + + this.filename = fname; + + this.imageroot = (imageroot || "/images/").trim(); + this.linkroot = (linkroot || "/links/").trim(); + + if (this.imageroot.substr(-1) != "/") { + this.imageroot += "/"; + } + if (this.linkroot.substr(-1) != "/") { + this.linkroot += "/"; } } - if (!this.mimeFile) { - this.emit("error", new Error("No mimetype file in archive")); - return; + + /** + * EPub#parse() -> undefined + * + * Starts the parser, needs to be called by the script + **/ + parse() { + this.containerFile = false; + this.mimeFile = false; + this.rootFile = false; + + this.metadata = {}; + this.manifest = {}; + this.spine = {toc: false, contents: []}; + this.flow = []; + this.toc = []; + + this.open(); } - this.zip.readFile(this.mimeFile, (function (err, data) { - if (err) { - this.emit("error", new Error("Reading archive failed")); + + + /** + * EPub#open() -> undefined + * + * Opens the epub file with Zip unpacker, retrieves file listing + * and runs mime type check + **/ + open() { + try { + this.zip = new ZipFile(this.filename); + } catch (E) { + this.emit("error", new Error("Invalid/missing file")); return; } - var txt = data.toString("utf-8").toLowerCase().trim(); - - if (txt != "application/epub+zip") { - this.emit("error", new Error("Unsupported mime type")); + + if (!this.zip.names || !this.zip.names.length) { + this.emit("error", new Error("No files in archive")); return; } - - this.getRootFiles(); - }).bind(this)); -}; - -/** - * EPub#getRootFiles() -> undefined - * - * Looks for a "meta-inf/container.xml" file and searches for a - * rootfile element with mime type "application/oebps-package+xml". - * On success calls the rootfile parser - **/ -EPub.prototype.getRootFiles = function () { - var i, len; - for (i = 0, len = this.zip.names.length; i < len; i++) { - if (this.zip.names[i].toLowerCase() == "meta-inf/container.xml") { - this.containerFile = this.zip.names[i]; - break; + + this.checkMimeType(); + }; + + /** + * EPub#checkMimeType() -> undefined + * + * Checks if there's a file called "mimetype" and that it's contents + * are "application/epub+zip". On success runs root file check. + **/ + checkMimeType() { + var i, len; + + for (i = 0, len = this.zip.names.length; i < len; i++) { + if (this.zip.names[i].toLowerCase() == "mimetype") { + this.mimeFile = this.zip.names[i]; + break; + } } - } - if (!this.containerFile) { - this.emit("error", new Error("No container file in archive")); - return; - } - - this.zip.readFile(this.containerFile, (function (err, data) { - if (err) { - this.emit("error", new Error("Reading archive failed")); + if (!this.mimeFile) { + this.emit("error", new Error("No mimetype file in archive")); return; } - var xml = data.toString("utf-8").toLowerCase().trim(), - xmlparser = new xml2js.Parser(xml2jsOptions); - - xmlparser.on("end", (function (result) { - - if (!result.rootfiles || !result.rootfiles.rootfile) { - this.emit("error", new Error("No rootfiles found")); - console.dir(result); + this.zip.readFile(this.mimeFile, (function (err, data) { + if (err) { + this.emit("error", new Error("Reading archive failed")); return; } - - var rootfile = result.rootfiles.rootfile, - filename = false, i, len; - - if (Array.isArray(rootfile)) { - - for (i = 0, len = rootfile.length; i < len; i++) { - if (rootfile[i]["@"]["media-type"] && - rootfile[i]["@"]["media-type"] == "application/oebps-package+xml" && - rootfile[i]["@"]["full-path"]) { - filename = rootfile[i]["@"]["full-path"].toLowerCase().trim(); + var txt = data.toString("utf-8").toLowerCase().trim(); + + if (txt != "application/epub+zip") { + this.emit("error", new Error("Unsupported mime type")); + return; + } + + this.getRootFiles(); + }).bind(this)); + }; + + /** + * EPub#getRootFiles() -> undefined + * + * Looks for a "meta-inf/container.xml" file and searches for a + * rootfile element with mime type "application/oebps-package+xml". + * On success calls the rootfile parser + **/ + getRootFiles() { + var i, len; + for (i = 0, len = this.zip.names.length; i < len; i++) { + if (this.zip.names[i].toLowerCase() == "meta-inf/container.xml") { + this.containerFile = this.zip.names[i]; + break; + } + } + if (!this.containerFile) { + this.emit("error", new Error("No container file in archive")); + return; + } + + this.zip.readFile(this.containerFile, (function (err, data) { + if (err) { + this.emit("error", new Error("Reading archive failed")); + return; + } + var xml = data.toString("utf-8").toLowerCase().trim(), + xmlparser = new xml2js.Parser(xml2jsOptions); + + xmlparser.on("end", (function (result) { + + if (!result.rootfiles || !result.rootfiles.rootfile) { + this.emit("error", new Error("No rootfiles found")); + console.dir(result); + return; + } + + var rootfile = result.rootfiles.rootfile, + filename = false, i, len; + + if (Array.isArray(rootfile)) { + + for (i = 0, len = rootfile.length; i < len; i++) { + if (rootfile[i]["@"]["media-type"] && + rootfile[i]["@"]["media-type"] == "application/oebps-package+xml" && + rootfile[i]["@"]["full-path"]) { + filename = rootfile[i]["@"]["full-path"].toLowerCase().trim(); + break; + } + } + + } else if (rootfile["@"]) { + if (rootfile["@"]["media-type"] != "application/oebps-package+xml" || !rootfile["@"]["full-path"]) { + this.emit("error", new Error("Rootfile in unknown format")); + return; + } + filename = rootfile["@"]["full-path"].toLowerCase().trim(); + } + + if (!filename) { + this.emit("error", new Error("Empty rootfile")); + return; + } + + + for (i = 0, len = this.zip.names.length; i < len; i++) { + if (this.zip.names[i].toLowerCase() == filename) { + this.rootFile = this.zip.names[i]; break; } } - - } else if (rootfile["@"]) { - if (rootfile["@"]["media-type"] != "application/oebps-package+xml" || !rootfile["@"]["full-path"]) { - this.emit("error", new Error("Rootfile in unknown format")); + + if (!this.rootFile) { + this.emit("error", new Error("Rootfile not found from archive")); return; } - filename = rootfile["@"]["full-path"].toLowerCase().trim(); - } - - if (!filename) { - this.emit("error", new Error("Empty rootfile")); + + this.handleRootFile(); + + }).bind(this)); + + xmlparser.on("error", (function (err) { + this.emit("error", new Error("Parsing container XML failed")); return; - } - - - for (i = 0, len = this.zip.names.length; i < len; i++) { - if (this.zip.names[i].toLowerCase() == filename) { - this.rootFile = this.zip.names[i]; - break; - } - } - - if (!this.rootFile) { - this.emit("error", new Error("Rootfile not found from archive")); + }).bind(this)); + + xmlparser.parseString(xml); + + + }).bind(this)); + }; + + /** + * EPub#handleRootFile() -> undefined + * + * Parses the rootfile XML and calls rootfile parser + **/ + handleRootFile() { + + this.zip.readFile(this.rootFile, (function (err, data) { + if (err) { + this.emit("error", new Error("Reading archive failed")); return; } - - this.handleRootFile(); - - }).bind(this)); - - xmlparser.on("error", (function (err) { - this.emit("error", new Error("Parsing container XML failed")); - return; + var xml = data.toString("utf-8"), + xmlparser = new xml2js.Parser(xml2jsOptions); + + xmlparser.on("end", this.parseRootFile.bind(this)); + + xmlparser.on("error", (function (err) { + this.emit("error", new Error("Parsing container XML failed")); + return; + }).bind(this)); + + xmlparser.parseString(xml); + }).bind(this)); - - xmlparser.parseString(xml); - - - }).bind(this)); -}; - -/** - * EPub#handleRootFile() -> undefined - * - * Parses the rootfile XML and calls rootfile parser - **/ -EPub.prototype.handleRootFile = function () { - - this.zip.readFile(this.rootFile, (function (err, data) { - if (err) { - this.emit("error", new Error("Reading archive failed")); - return; + }; + + /** + * EPub#parseRootFile() -> undefined + * + * Parses elements "metadata," "manifest," "spine" and TOC. + * Emits "end" if no TOC + **/ + parseRootFile(rootfile) { + + this.version = rootfile['@'].version || '2.0'; + + var i, len, keys, keyparts, key; + keys = Object.keys(rootfile); + for (i = 0, len = keys.length; i < len; i++) { + keyparts = keys[i].split(":"); + key = (keyparts.pop() || "").toLowerCase().trim(); + switch (key) { + case "metadata": + this.parseMetadata(rootfile[keys[i]]); + break; + case "manifest": + this.parseManifest(rootfile[keys[i]]); + break; + case "spine": + this.parseSpine(rootfile[keys[i]]); + break; + case "guide": + //this.parseGuide(rootfile[keys[i]]); + break; + } } - var xml = data.toString("utf-8"), - xmlparser = new xml2js.Parser(xml2jsOptions); - - xmlparser.on("end", this.parseRootFile.bind(this)); - - xmlparser.on("error", (function (err) { - this.emit("error", new Error("Parsing container XML failed")); - return; - }).bind(this)); - - xmlparser.parseString(xml); - - }).bind(this)); -}; - -/** - * EPub#parseRootFile() -> undefined - * - * Parses elements "metadata," "manifest," "spine" and TOC. - * Emits "end" if no TOC - **/ -EPub.prototype.parseRootFile = function (rootfile) { - - this.version = rootfile['@'].version || '2.0'; - - var i, len, keys, keyparts, key; - keys = Object.keys(rootfile); - for (i = 0, len = keys.length; i < len; i++) { - keyparts = keys[i].split(":"); - key = (keyparts.pop() || "").toLowerCase().trim(); - switch (key) { - case "metadata": - this.parseMetadata(rootfile[keys[i]]); - break; - case "manifest": - this.parseManifest(rootfile[keys[i]]); - break; - case "spine": - this.parseSpine(rootfile[keys[i]]); - break; - case "guide": - //this.parseGuide(rootfile[keys[i]]); - break; + + if (this.spine.toc) { + this.parseTOC(); + } else { + this.emit("end"); } - } - - if (this.spine.toc) { - this.parseTOC(); - } else { - this.emit("end"); - } -}; - -/** - * EPub#parseMetadata() -> undefined - * - * Parses "metadata" block (book metadata, title, author etc.) - **/ -EPub.prototype.parseMetadata = function (metadata) { - var i, j, len, keys, keyparts, key; - - keys = Object.keys(metadata); - for (i = 0, len = keys.length; i < len; i++) { - keyparts = keys[i].split(":"); - key = (keyparts.pop() || "").toLowerCase().trim(); - switch (key) { - case "publisher": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.publisher = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); - } else { - this.metadata.publisher = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); - } - break; - case "language": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.language = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").toLowerCase().trim(); - } else { - this.metadata.language = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").toLowerCase().trim(); - } - break; - case "title": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.title = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); - } else { - this.metadata.title = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); - } - break; - case "subject": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.subject = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); - } else { - this.metadata.subject = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + }; + + /** + * EPub#parseMetadata() -> undefined + * + * Parses "metadata" block (book metadata, title, author etc.) + **/ + parseMetadata(metadata) { + var i, j, len, keys, keyparts, key; + + keys = Object.keys(metadata); + for (i = 0, len = keys.length; i < len; i++) { + keyparts = keys[i].split(":"); + key = (keyparts.pop() || "").toLowerCase().trim(); + switch (key) { + case "publisher": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.publisher = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); + } else { + this.metadata.publisher = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + } + break; + case "language": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.language = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").toLowerCase().trim(); + } else { + this.metadata.language = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").toLowerCase().trim(); + } + break; + case "title": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.title = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); + } else { + this.metadata.title = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + } + break; + case "subject": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.subject = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); + } else { + this.metadata.subject = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + } + break; + case "description": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.description = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); + } else { + this.metadata.description = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + } + break; + case "creator": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.creator = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); + this.metadata.creatorFileAs = String(metadata[keys[i]][0] && metadata[keys[i]][0]['@'] && metadata[keys[i]][0]['@']["opf:file-as"] || this.metadata.creator).trim(); + } else { + this.metadata.creator = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + this.metadata.creatorFileAs = String(metadata[keys[i]]['@'] && metadata[keys[i]]['@']["opf:file-as"] || this.metadata.creator).trim(); + } + break; + case "date": + if (Array.isArray(metadata[keys[i]])) { + this.metadata.date = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); + } else { + this.metadata.date = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + } + break; + case "identifier": + if (metadata[keys[i]]["@"] && metadata[keys[i]]["@"]["opf:scheme"] == "ISBN") { + this.metadata.ISBN = String(metadata[keys[i]]["#"] || "").trim(); + } else if (metadata[keys[i]]["@"] && metadata[keys[i]]["@"].id && metadata[keys[i]]["@"].id.match(/uuid/i)) { + this.metadata.UUID = String(metadata[keys[i]]["#"] || "").replace('urn:uuid:', '').toUpperCase().trim(); + } else if (Array.isArray(metadata[keys[i]])) { + for (j = 0; j < metadata[keys[i]].length; j++) { + if (metadata[keys[i]][j]["@"]) { + if (metadata[keys[i]][j]["@"]["opf:scheme"] == "ISBN") { + this.metadata.ISBN = String(metadata[keys[i]][j]["#"] || "").trim(); + } else if (metadata[keys[i]][j]["@"].id && metadata[keys[i]][j]["@"].id.match(/uuid/i)) { + this.metadata.UUID = String(metadata[keys[i]][j]["#"] || "").replace('urn:uuid:', '').toUpperCase().trim(); + } + } + } + } + break; } - break; - case "description": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.description = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); - } else { - this.metadata.description = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + } + + var metas = metadata['meta'] || {}; + Object.keys(metas).forEach(function(key) { + var meta = metas[key]; + if (meta['@'] && meta['@'].name) { + var name = meta['@'].name; + this.metadata[name] = meta['@'].content; } - break; - case "creator": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.creator = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); - this.metadata.creatorFileAs = String(metadata[keys[i]][0] && metadata[keys[i]][0]['@'] && metadata[keys[i]][0]['@']["opf:file-as"] || this.metadata.creator).trim(); - } else { - this.metadata.creator = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); - this.metadata.creatorFileAs = String(metadata[keys[i]]['@'] && metadata[keys[i]]['@']["opf:file-as"] || this.metadata.creator).trim(); + if (meta['#'] && meta['@'].property) { + this.metadata[meta['@'].property] = meta['#']; } - break; - case "date": - if (Array.isArray(metadata[keys[i]])) { - this.metadata.date = String(metadata[keys[i]][0] && metadata[keys[i]][0]["#"] || metadata[keys[i]][0] || "").trim(); - } else { - this.metadata.date = String(metadata[keys[i]]["#"] || metadata[keys[i]] || "").trim(); + + if(meta.name && meta.name =="cover"){ + this.metadata[meta.name] = meta.content; } - break; - case "identifier": - if (metadata[keys[i]]["@"] && metadata[keys[i]]["@"]["opf:scheme"] == "ISBN") { - this.metadata.ISBN = String(metadata[keys[i]]["#"] || "").trim(); - } else if (metadata[keys[i]]["@"] && metadata[keys[i]]["@"].id && metadata[keys[i]]["@"].id.match(/uuid/i)) { - this.metadata.UUID = String(metadata[keys[i]]["#"] || "").replace('urn:uuid:', '').toUpperCase().trim(); - } else if (Array.isArray(metadata[keys[i]])) { - for (j = 0; j < metadata[keys[i]].length; j++) { - if (metadata[keys[i]][j]["@"]) { - if (metadata[keys[i]][j]["@"]["opf:scheme"] == "ISBN") { - this.metadata.ISBN = String(metadata[keys[i]][j]["#"] || "").trim(); - } else if (metadata[keys[i]][j]["@"].id && metadata[keys[i]][j]["@"].id.match(/uuid/i)) { - this.metadata.UUID = String(metadata[keys[i]][j]["#"] || "").replace('urn:uuid:', '').toUpperCase().trim(); - } + }, this); + }; + + /** + * EPub#parseManifest() -> undefined + * + * Parses "manifest" block (all items included, html files, images, styles) + **/ + parseManifest(manifest) { + var i, len, path = this.rootFile.split("/"), element, path_str; + path.pop(); + path_str = path.join("/"); + + if (manifest.item) { + for (i = 0, len = manifest.item.length; i < len; i++) { + if (manifest.item[i]['@']) { + element = manifest.item[i]['@']; + + if (element.href && element.href.substr(0, path_str.length) != path_str) { + element.href = path.concat([element.href]).join("/"); } + + this.manifest[manifest.item[i]['@'].id] = element; + } } - break; - } - } - - var metas = metadata['meta'] || {}; - Object.keys(metas).forEach(function(key) { - var meta = metas[key]; - if (meta['@'] && meta['@'].name) { - var name = meta['@'].name; - this.metadata[name] = meta['@'].content; } - if (meta['#'] && meta['@'].property) { - this.metadata[meta['@'].property] = meta['#']; - } - - if(meta.name && meta.name =="cover"){ - this.metadata[meta.name] = meta.content; + }; + + /** + * EPub#parseSpine() -> undefined + * + * Parses "spine" block (all html elements that are shown to the reader) + **/ + parseSpine(spine) { + var i, len, path = this.rootFile.split("/"), element; + path.pop(); + + if (spine['@'] && spine['@'].toc) { + this.spine.toc = this.manifest[spine['@'].toc] || false; } - }, this); -}; - -/** - * EPub#parseManifest() -> undefined - * - * Parses "manifest" block (all items included, html files, images, styles) - **/ -EPub.prototype.parseManifest = function (manifest) { - var i, len, path = this.rootFile.split("/"), element, path_str; - path.pop(); - path_str = path.join("/"); - - if (manifest.item) { - for (i = 0, len = manifest.item.length; i < len; i++) { - if (manifest.item[i]['@']) { - element = manifest.item[i]['@']; - - if (element.href && element.href.substr(0, path_str.length) != path_str) { - element.href = path.concat([element.href]).join("/"); - } - - this.manifest[manifest.item[i]['@'].id] = element; - + + if (spine.itemref) { + if(!Array.isArray(spine.itemref)){ + spine.itemref = [spine.itemref]; } - } - } -}; - -/** - * EPub#parseSpine() -> undefined - * - * Parses "spine" block (all html elements that are shown to the reader) - **/ -EPub.prototype.parseSpine = function (spine) { - var i, len, path = this.rootFile.split("/"), element; - path.pop(); - - if (spine['@'] && spine['@'].toc) { - this.spine.toc = this.manifest[spine['@'].toc] || false; - } - - if (spine.itemref) { - if(!Array.isArray(spine.itemref)){ - spine.itemref = [spine.itemref]; - } - for (i = 0, len = spine.itemref.length; i < len; i++) { - if (spine.itemref[i]['@']) { - if (element = this.manifest[spine.itemref[i]['@'].idref]) { - this.spine.contents.push(element); + for (i = 0, len = spine.itemref.length; i < len; i++) { + if (spine.itemref[i]['@']) { + if (element = this.manifest[spine.itemref[i]['@'].idref]) { + this.spine.contents.push(element); + } } } } - } - this.flow = this.spine.contents; -}; - -/** - * EPub#parseTOC() -> undefined - * - * Parses ncx file for table of contents (title, html file) - **/ -EPub.prototype.parseTOC = function () { - var i, len, path = this.spine.toc.href.split("/"), id_list = {}, keys; - path.pop(); - - keys = Object.keys(this.manifest); - for (i = 0, len = keys.length; i < len; i++) { - id_list[this.manifest[keys[i]].href] = keys[i]; - } - - this.zip.readFile(this.spine.toc.href, (function (err, data) { - if (err) { - this.emit("error", new Error("Reading archive failed")); - return; + this.flow = this.spine.contents; + }; + + /** + * EPub#parseTOC() -> undefined + * + * Parses ncx file for table of contents (title, html file) + **/ + parseTOC() { + var i, len, path = this.spine.toc.href.split("/"), id_list = {}, keys; + path.pop(); + + keys = Object.keys(this.manifest); + for (i = 0, len = keys.length; i < len; i++) { + id_list[this.manifest[keys[i]].href] = keys[i]; } - var xml = data.toString("utf-8"), - xmlparser = new xml2js.Parser(xml2jsOptions); - - xmlparser.on("end", (function (result) { - if (result.navMap && result.navMap.navPoint) { - this.toc = this.walkNavMap(result.navMap.navPoint, path, id_list); - } - - this.emit("end"); - }).bind(this)); - - xmlparser.on("error", (function (err) { - this.emit("error", new Error("Parsing container XML failed")); - return; - }).bind(this)); - - xmlparser.parseString(xml); - - }).bind(this)); -}; - -/** - * EPub#walkNavMap(branch, path, id_list,[, level]) -> Array - * - branch (Array | Object): NCX NavPoint object - * - path (Array): Base path - * - id_list (Object): map of file paths and id values - * - level (Number): deepness - * - * Walks the NavMap object through all levels and finds elements - * for TOC - **/ -EPub.prototype.walkNavMap = function (branch, path, id_list, level) { - level = level || 0; - - // don't go too far - if (level > 7) { - return []; - } - - var output = []; - - if (!Array.isArray(branch)) { - branch = [branch]; - } - - for (var i = 0; i < branch.length; i++) { - if (branch[i].navLabel) { - - var title = ''; - if (branch[i].navLabel && typeof branch[i].navLabel.text == 'string') { - title = branch[i].navLabel && branch[i].navLabel.text || branch[i].navLabel===branch[i].navLabel ? - (branch[i].navLabel && branch[i].navLabel.text || branch[i].navLabel || "").trim() : ''; - } - var order = Number(branch[i]["@"] && branch[i]["@"].playOrder || 0); - if (isNaN(order)) { - order = 0; - } - var href = ''; - if (branch[i].content && branch[i].content["@"] && typeof branch[i].content["@"].src == 'string') { - href = branch[i].content["@"].src.trim(); + + this.zip.readFile(this.spine.toc.href, (function (err, data) { + if (err) { + this.emit("error", new Error("Reading archive failed")); + return; } - - var element = { - level: level, - order: order, - title: title - }; - - if (href) { - href = path.concat([href]).join("/"); - element.href = href; - - if (id_list[element.href]) { - // link existing object - element = this.manifest[id_list[element.href]]; - element.title = title; - element.order = order; - element.level = level; - } else { - // use new one - element.href = href; - element.id = (branch[i]["@"] && branch[i]["@"].id || "").trim(); + var xml = data.toString("utf-8"), + xmlparser = new xml2js.Parser(xml2jsOptions); + + xmlparser.on("end", (function (result) { + if (result.navMap && result.navMap.navPoint) { + this.toc = this.walkNavMap(result.navMap.navPoint, path, id_list); } - - output.push(element); - } - } - if (branch[i].navPoint) { - output = output.concat(this.walkNavMap(branch[i].navPoint, path, id_list, level + 1)); + + this.emit("end"); + }).bind(this)); + + xmlparser.on("error", (function (err) { + this.emit("error", new Error("Parsing container XML failed")); + return; + }).bind(this)); + + xmlparser.parseString(xml); + + }).bind(this)); + }; + + /** + * EPub#walkNavMap(branch, path, id_list,[, level]) -> Array + * - branch (Array | Object): NCX NavPoint object + * - path (Array): Base path + * - id_list (Object): map of file paths and id values + * - level (Number): deepness + * + * Walks the NavMap object through all levels and finds elements + * for TOC + **/ + walkNavMap(branch, path, id_list, level) { + level = level || 0; + + // don't go too far + if (level > 7) { + return []; } - } - return output; -}; - -/** - * EPub#getChapter(id, callback) -> undefined - * - id (String): Manifest id value for a chapter - * - callback (Function): callback function - * - * Finds a chapter text for an id. Replaces image and link URL's, removes - *
etc. elements. Return only chapters with mime type application/xhtml+xml - **/ -EPub.prototype.getChapter = function (id, callback) { - this.getChapterRaw(id, (function (err, str) { - if (err) { - callback(err); - return; + + var output = []; + + if (!Array.isArray(branch)) { + branch = [branch]; } - - var i, len, path = this.rootFile.split("/"), keys = Object.keys(this.manifest); - path.pop(); - - // remove linebreaks (no multi line matches in JS regex!) - str = str.replace(/\r?\n/g, "\u0000"); - - // keep only contents - str.replace(/]*?>(.*)<\/body[^>]*?>/i, function (o, d) { - str = d.trim(); - }); - - // remove