mirror of
https://github.com/ciromattia/kcc
synced 2026-05-22 15:32:06 +00:00
234 lines
10 KiB
Python
Executable File
234 lines
10 KiB
Python
Executable File
#!/usr/bin/env python
|
|
#
|
|
# Copyright (c) 2012 Ciro Mattia Gonano <ciromattia@gmail.com>
|
|
#
|
|
# Permission to use, copy, modify, and/or distribute this software for
|
|
# any purpose with or without fee is hereby granted, provided that the
|
|
# above copyright notice and this permission notice appear in all
|
|
# copies.
|
|
#
|
|
# THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL
|
|
# WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED
|
|
# WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE
|
|
# AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
|
|
# DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA
|
|
# OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
|
|
# TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
|
|
# PERFORMANCE OF THIS SOFTWARE.
|
|
#
|
|
# Changelog
|
|
# 1.00 - Initial version
|
|
# 1.10 - Added support for CBZ/CBR files
|
|
# 1.11 - Added support for ZIP/RAR extensions
|
|
# 1.20 - Comic optimizations! Split pages not target-oriented (landscape
|
|
# with portrait target or portrait with landscape target), add palette
|
|
# and other image optimizations from Mangle.
|
|
# WARNING: PIL is required for all image mangling!
|
|
# 1.30 - Fixed an issue in OPF generation for device resolution
|
|
# Reworked options system (call with -h option to get the inline help)
|
|
# 1.40 - Added some options for controlling image optimization
|
|
# Further optimization (ImageOps, page numbering cut, autocontrast)
|
|
# 1.41 - Fixed a serious bug on resizing when img ratio was bigger than device one
|
|
#
|
|
# Todo:
|
|
# - Exit gracefully for CBR if neither rarfile.py nor an unrar
|
|
# executable are found
|
|
# - Improve error reporting
|
|
# - recurse into dirtree for multiple comics
|
|
|
|
# Reported by --version and by the start-up banner; keep it in sync with the
# newest entry of the changelog in the file header.
__version__ = '1.41'
|
|
|
|
import os
import sys
from optparse import OptionParser
from xml.sax.saxutils import escape

import image, cbxarchive, pdfjpgextract
|
|
|
|
class HTMLbuilder:
    """Write the XHTML page that wraps a single comic image.

    Instantiating the class does the work: for an image ``<name><ext>`` that
    getImageFileName() accepts, ``<dstdir>/<name>.html`` is written with an
    ``<img>`` tag pointing at the image.  For any other file nothing is
    written.
    """

    def getResult(self):
        """Return getImageFileName() for the file given to the constructor.

        The result is the ``(name, extension)`` pair of the image, or None
        when the file was rejected (in which case no page was written).
        """
        return getImageFileName(self.file)

    def __init__(self, dstdir, file):
        """Create the wrapper page for *file* inside *dstdir*.

        dstdir -- directory that receives the ``.html`` file
        file   -- image file name, written as-is (XML-escaped) into ``src``
        """
        self.file = file
        filename = getImageFileName(file)
        if filename is None:
            return
        # File names may contain '&', '<' or '"'; written verbatim they would
        # produce malformed XHTML, so escape them for text and attribute use.
        pagetitle = escape(filename[0])
        imgsrc = escape(file, {'"': '&quot;'})
        htmlfile = os.path.join(dstdir, filename[0] + '.html')
        # 'with' guarantees the handle is closed even if a write fails.
        with open(htmlfile, "w") as f:
            f.writelines(["<!DOCTYPE html SYSTEM \"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd\">\n",
                          "<html xmlns=\"http://www.w3.org/1999/xhtml\">\n",
                          "<head>\n",
                          "<title>", pagetitle, "</title>\n",
                          "<meta http-equiv=\"Content-Type\" content=\"text/html; charset=utf-8\"/>\n",
                          "</head>\n",
                          "<body>\n",
                          "<div><img src=\"", imgsrc, "\" /></div>\n",
                          "</body>\n",
                          "</html>"
                          ])
|
|
|
|
class NCXbuilder:
    """Write the NCX table-of-contents file ``content.ncx``.

    Instantiating the class writes the file.  The generated document only
    carries the book title; its ``<navMap>`` is left empty.
    """

    def __init__(self, dstdir, title):
        """Create ``<dstdir>/content.ncx`` for a book called *title*.

        dstdir -- directory that receives the file
        title  -- book title; XML-escaped before being written
        """
        ncxfile = os.path.join(dstdir, 'content.ncx')
        # 'with' guarantees the handle is closed even if a write fails.
        with open(ncxfile, "w") as f:
            f.writelines(["<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n",
                          "<!DOCTYPE ncx PUBLIC \"-//NISO//DTD ncx 2005-1//EN\" \"http://www.daisy.org/z3986/2005/ncx-2005-1.dtd\">\n",
                          "<ncx version=\"2005-1\" xml:lang=\"en-US\" xmlns=\"http://www.daisy.org/z3986/2005/ncx/\">\n",
                          "<head>\n</head>\n",
                          # A raw '&' or '<' in the title would break the XML.
                          "<docTitle><text>", escape(title), "</text></docTitle>\n",
                          "<navMap></navMap>\n</ncx>"
                          ])
|
|
|
|
class OPFBuilder:
    """Write the OPF package file ``content.opf``.

    Instantiating the class writes the file.  The package lists, for every
    entry of *filelist*, one XHTML page (``<name>.html``) and one image
    (``<name><ext>``), and puts the pages into the spine in list order.
    """

    def __init__(self, profile, dstdir, title, filelist):
        """Create ``<dstdir>/content.opf``.

        profile  -- key into image.ProfileData.Profiles
        dstdir   -- directory that receives the file
        title    -- book title; XML-escaped before being written
        filelist -- sequence of ``(name, extension)`` pairs, already in
                    reading order
        """
        opffile = os.path.join(dstdir, 'content.opf')
        # "original-resolution" is taken from the device profile table, not
        # from the images themselves.  Only the middle element of the profile
        # entry is needed here.
        _label, deviceres, _palette = image.ProfileData.Profiles[profile]
        imgres = str(deviceres[0]) + "x" + str(deviceres[1])
        # Extra entity so escaped values are safe inside double-quoted
        # attributes.
        quote = {'"': '&quot;'}

        lines = ["<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n",
                 "<package version=\"2.0\" unique-identifier=\"PrimaryID\" xmlns=\"http://www.idpf.org/2007/opf\">\n",
                 "<metadata xmlns:dc=\"http://purl.org/dc/elements/1.1/\" xmlns:opf=\"http://www.idpf.org/2007/opf\">\n",
                 "<dc:title>", escape(title), "</dc:title>\n",
                 "<dc:language>en-US</dc:language>\n",
                 "<meta name=\"book-type\" content=\"comic\"/>\n",
                 "<meta name=\"zero-gutter\" content=\"true\"/>\n",
                 "<meta name=\"zero-margin\" content=\"true\"/>\n",
                 "<meta name=\"fixed-layout\" content=\"true\"/>\n",
                 "<meta name=\"orientation-lock\" content=\"portrait\"/>\n",
                 "<meta name=\"original-resolution\" content=\"" + imgres + "\"/>\n",
                 "</metadata><manifest><item id=\"ncx\" href=\"content.ncx\" media-type=\"application/x-dtbncx+xml\"/>\n"]

        # Manifest: first every page, then every image.
        for filename in filelist:
            name = escape(filename[0], quote)
            lines.append("<item id=\"page_" + name + "\" href=\"" + name + ".html\" media-type=\"application/xhtml+xml\"/>\n")
        for filename in filelist:
            name = escape(filename[0], quote)
            ext = escape(filename[1], quote)
            # Compare case-insensitively: getImageFileName() accepts '.PNG'
            # too, and such a file must not be declared as JPEG.
            mt = 'image/png' if filename[1].lower() == '.png' else 'image/jpeg'
            lines.append("<item id=\"img_" + name + "\" href=\"" + name + ext + "\" media-type=\"" + mt + "\"/>\n")

        # Spine: the pages in reading order.
        lines.append("</manifest>\n<spine toc=\"ncx\">\n")
        for filename in filelist:
            lines.append("<itemref idref=\"page_" + escape(filename[0], quote) + "\" />\n")
        lines.append("</spine>\n<guide>\n</guide>\n</package>\n")

        # 'with' guarantees the handle is closed even if the write fails.
        with open(opffile, "w") as f:
            f.writelines(lines)
|
|
|
|
def getImageFileName(file):
    """Split an image file name into ``(name, extension)``.

    file -- file name, optionally with leading directory components

    Returns the result of os.path.splitext(file), or None when the file is
    hidden (its base name starts with a dot) or its extension is not one of
    .png, .jpg or .jpeg (compared case-insensitively).
    """
    filename = os.path.splitext(file)
    # Test the base name, not the whole path: "dir/.thumb.png" is hidden,
    # while "./page.png" is a perfectly ordinary file.
    hidden = os.path.basename(filename[0]).startswith('.')
    if hidden or filename[1].lower() not in ('.png', '.jpg', '.jpeg'):
        return None
    return filename
|
|
|
|
def isInFilelist(file, list):
    """Tell whether *file* is already represented in *list*.

    file -- file name; only the part before the extension is compared
    list -- iterable of sequences whose first element is a name without
            extension (e.g. the pairs returned by getImageFileName)

    Returns True as soon as one item's first element equals the
    extension-less name of *file*, False otherwise (including for an empty
    list).
    """
    basename = os.path.splitext(file)[0]
    # any() stops at the first match instead of scanning the whole list.
    return any(basename == item[0] for item in list)
|
|
|
|
def Copyright():
    """Print the one-line program banner (name, version and author)."""
    template = ('comic2ebook v%(__version__)s. '
                'Written 2012 by Ciro Mattia Gonano.')
    # The template only refers to the version, so supply just that key.
    print(template % {'__version__': __version__})
|
|
|
|
def Usage():
    """Print a short description of the program followed by the option help.

    Relies on the module-level ``parser`` that main() creates, so it can only
    be called after main() has built the option parser.
    """
    description = (
        "Generates HTML, NCX and OPF for a Comic ebook from a bunch of images",
        "Optimized for creating Mobipockets to be read into Kindle Paperwhite",
    )
    for line in description:
        print(line)
    parser.print_help()
|
|
|
|
def _buildOptionParser():
    """Return the OptionParser describing the command-line interface."""
    optparser = OptionParser(usage="Usage: %prog [options] comic_file|comic_folder",
                             version=__version__)
    optparser.add_option("-p", "--profile", action="store", dest="profile", default="KHD",
                         help="Device profile (choose one among K1, K2, K3, K4, KDX, KDXG or KHD) [default=KHD]")
    optparser.add_option("-t", "--title", action="store", dest="title", default="defaulttitle",
                         help="Comic title [default=filename]")
    optparser.add_option("-m", "--manga-style", action="store_true", dest="righttoleft", default=False,
                         help="Split pages 'manga style' (right-to-left reading) [default=False]")
    optparser.add_option("-v", "--verbose", action="store_true", dest="verbose", default=False,
                         help="Verbose output [default=False]")
    # The next flag and --cut-page-numbers are store_false switches: giving
    # them turns the feature OFF.  The help text says so explicitly.
    optparser.add_option("-i", "--image-processing", action="store_false", dest="imgproc", default=True,
                         help="Disable image preprocessing (page splitting and optimizations) "
                              "[default: preprocessing enabled]")
    optparser.add_option("--upscale-images", action="store_true", dest="upscale", default=False,
                         help="Resize images smaller than device's resolution [default=False]")
    optparser.add_option("--stretch-images", action="store_true", dest="stretch", default=False,
                         help="Stretch images to device's resolution [default=False]")
    optparser.add_option("--cut-page-numbers", action="store_false", dest="cutpagenumbers", default=True,
                         help="Do not try to cut page numbering on images "
                              "[default: page numbers are cut]")
    return optparser


def _prepareWorkDir(source):
    """Return the directory holding the images of the comic *source*.

    A ``.pdf`` is handed to pdfjpgextract, a file that cbxarchive recognises
    is handed to cbxarchive; in both cases the directory is whatever the
    extractor's getPath() reports.  Anything else is treated as a folder: it
    is backed up to ``<folder>_orig`` and then used in place.  A failing
    backup (e.g. the backup already exists) propagates as OSError.
    """
    if os.path.splitext(source)[1].lower() == '.pdf':
        pdf = pdfjpgextract.PdfJpgExtract(source)
        pdf.extract()
        return pdf.getPath()
    cbx = cbxarchive.CBxArchive(source)
    if cbx.isCbxFile():
        cbx.extract()
        return cbx.getPath()
    import shutil
    # Drop a trailing separator: "comic/" + "_orig" would place the backup
    # inside the folder being copied, and would also leave an empty default
    # title.
    source = os.path.normpath(source)
    shutil.copytree(source, source + "_orig")
    return source


def _progressDot():
    """Emit one progress dot and flush so it shows up immediately."""
    sys.stdout.write(". ")
    sys.stdout.flush()


def _processImages(options, workdir):
    """Split double pages, then optimize every image found in *workdir*."""
    print("Processing images...")
    try:
        if options.verbose:
            print("Splitting double pages...")
        for name in os.listdir(workdir):
            if getImageFileName(name) is not None:
                _progressDot()
                page = image.ComicPage(os.path.join(workdir, name), options.profile)
                page.splitPage(workdir, options.righttoleft)
        # List the directory again: the loop above calls splitPage() with the
        # directory, so new files may have appeared in it.
        for name in os.listdir(workdir):
            if getImageFileName(name) is None:
                continue
            if options.verbose:
                print("Optimizing " + name + " for " + options.profile)
            else:
                _progressDot()
            page = image.ComicPage(os.path.join(workdir, name), options.profile)
            page.optimizeImage()
            page.cropWhiteSpace(10.0)
            if options.cutpagenumbers:
                page.cutPageNumber()
            page.resizeImage(options.upscale, options.stretch)
            page.quantizeImage()
            page.saveToDir(workdir)
    except ImportError:
        print("Could not load PIL, not optimizing image")


def _createEbookStructure(options, workdir):
    """Write one HTML page per image plus content.ncx and content.opf."""
    print("Creating ePub structure...")
    filelist = []
    for name in os.listdir(workdir):
        # Skip non-images, and images whose extension-less name was already
        # taken (their HTML page would have the same file name).
        if getImageFileName(name) is None or isInFilelist(name, filelist):
            continue
        # put credits at the end
        if "credits" in name.lower():
            renamed = 'ZZZ999_' + name
            os.rename(os.path.join(workdir, name), os.path.join(workdir, renamed))
            name = renamed
        filename = HTMLbuilder(workdir, name).getResult()
        if filename is not None:
            filelist.append(filename)
    if options.title == 'defaulttitle':
        # normpath() keeps the title non-empty if the path ends in a separator
        options.title = os.path.basename(os.path.normpath(workdir))
    NCXbuilder(workdir, options.title)
    # ensure we're sorting files alphabetically
    filelist = sorted(filelist, key=lambda name: name[0].lower())
    OPFBuilder(options.profile, workdir, options.title, filelist)


def main(argv=None):
    """Convert one comic (PDF, comic archive or image folder) to ebook sources.

    argv -- list of command-line arguments without the program name; None
            makes optparse fall back to sys.argv[1:]

    Exactly one positional argument is required; otherwise the help text is
    printed and the function returns without doing anything.  Returns None.
    """
    # Usage() reads the parser through this module-level name.
    global parser
    parser = _buildOptionParser()
    options, args = parser.parse_args(argv)
    if len(args) != 1:
        parser.print_help()
        return
    workdir = _prepareWorkDir(args[0])
    if options.imgproc:
        _processImages(options, workdir)
    _createEbookStructure(options, workdir)
|
|
|
|
|
|
if __name__ == "__main__":
    # Script entry point: show the banner, run the conversion on the
    # command-line arguments (program name stripped), then exit with status 0.
    Copyright()
    arguments = sys.argv[1:]
    main(arguments)
    raise SystemExit(0)
|