# -*- coding: utf-8 -*- # # Copyright (c) 2012-2014 Ciro Mattia Gonano # Copyright (c) 2013-2019 Pawel Jastrzebski # # Permission to use, copy, modify, and/or distribute this software for # any purpose with or without fee is hereby granted, provided that the # above copyright notice and this permission notice appear in all # copies. # # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL # WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED # WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE # AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL # DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA # OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER # TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR # PERFORMANCE OF THIS SOFTWARE. # import os import pathlib import re import sys from argparse import ArgumentParser from time import strftime, gmtime from copy import copy from glob import glob, escape from re import sub from stat import S_IWRITE, S_IREAD, S_IEXEC from zipfile import ZipFile, ZIP_STORED, ZIP_DEFLATED from tempfile import mkdtemp, gettempdir, TemporaryFile from shutil import move, copytree, rmtree, copyfile from multiprocessing import Pool from uuid import uuid4 from natsort import os_sorted from slugify import slugify as slugify_ext from PIL import Image, ImageFile from subprocess import STDOUT, PIPE from psutil import virtual_memory, disk_usage from html import escape as hescape from .shared import md5Checksum, getImageFileName, walkSort, walkLevel, sanitizeTrace, subprocess_run from . import comic2panel from . import image from . import comicarchive from . import pdfjpgextract from . import dualmetafix from . import metadata from . import kindle from . import __version__ ImageFile.LOAD_TRUNCATED_IMAGES = True def main(argv=None): global options parser = makeParser() args = parser.parse_args(argv) options = copy(args) if not argv or options.input == []: parser.print_help() return 0 if sys.platform.startswith('win'): sources = set([source for option in options.input for source in glob(escape(option))]) else: sources = set(options.input) if len(sources) == 0: print('No matching files found.') return 1 for source in sources: source = source.rstrip('\\').rstrip('/') options = copy(args) options = checkOptions(options) print('Working on ' + source + '...') makeBook(source) return 0 def buildHTML(path, imgfile, imgfilepath): imgfilepath = md5Checksum(imgfilepath) filename = getImageFileName(imgfile) deviceres = options.profileData[1] if not options.noprocessing and "Rotated" in options.imgMetadata[imgfilepath]: rotatedPage = True else: rotatedPage = False if not options.noprocessing and "BlackBackground" in options.imgMetadata[imgfilepath]: additionalStyle = 'background-color:#000000;' else: additionalStyle = '' postfix = '' backref = 1 head = path while True: head, tail = os.path.split(head) if tail == 'Images': htmlpath = os.path.join(head, 'Text', postfix) break postfix = tail + "/" + postfix backref += 1 if not os.path.exists(htmlpath): os.makedirs(htmlpath) htmlfile = os.path.join(htmlpath, filename[0] + '.xhtml') imgsize = Image.open(os.path.join(head, "Images", postfix, imgfile)).size if options.hq: imgsizeframe = (int(imgsize[0] // 1.5), int(imgsize[1] // 1.5)) else: imgsizeframe = imgsize f = open(htmlfile, "w", encoding='UTF-8') f.writelines(["\n", "\n", "\n", "\n", "", hescape(filename[0]), "\n", "\n", "\n" "\n", "\n", "
\n", "\n
\n"]) if options.iskindle and options.panelview: if options.autoscale: size = (getPanelViewResolution(imgsize, deviceres)) else: if options.hq: size = imgsize else: size = (int(imgsize[0] * 1.5), int(imgsize[1] * 1.5)) if size[0] - deviceres[0] < deviceres[0] * 0.01: noHorizontalPV = True else: noHorizontalPV = False if size[1] - deviceres[1] < deviceres[1] * 0.01: noVerticalPV = True else: noVerticalPV = False x, y = getPanelViewSize(deviceres, size) boxStyles = {"PV-TL": "position:absolute;left:0;top:0;", "PV-TR": "position:absolute;right:0;top:0;", "PV-BL": "position:absolute;left:0;bottom:0;", "PV-BR": "position:absolute;right:0;bottom:0;", "PV-T": "position:absolute;top:0;left:" + x + "%;", "PV-B": "position:absolute;bottom:0;left:" + x + "%;", "PV-L": "position:absolute;left:0;top:" + y + "%;", "PV-R": "position:absolute;right:0;top:" + y + "%;"} f.write("
\n") if not noHorizontalPV and not noVerticalPV: if rotatedPage: if options.righttoleft: order = [1, 3, 2, 4] else: order = [2, 4, 1, 3] else: if options.righttoleft: order = [2, 1, 4, 3] else: order = [1, 2, 3, 4] boxes = ["PV-TL", "PV-TR", "PV-BL", "PV-BR"] elif noHorizontalPV and not noVerticalPV: if rotatedPage: if options.righttoleft: order = [1, 2] else: order = [2, 1] else: order = [1, 2] boxes = ["PV-T", "PV-B"] elif not noHorizontalPV and noVerticalPV: if rotatedPage: order = [1, 2] else: if options.righttoleft: order = [2, 1] else: order = [1, 2] boxes = ["PV-L", "PV-R"] else: order = [] boxes = [] for i in range(0, len(boxes)): f.writelines(["
\n", "\n", "
\n"]) f.write("
\n") for box in boxes: f.writelines(["
\n", "\n", "
\n"]) f.writelines(["\n", "\n"]) f.close() return path, imgfile def buildNCX(dstdir, title, chapters, chapternames): ncxfile = os.path.join(dstdir, 'OEBPS', 'toc.ncx') f = open(ncxfile, "w", encoding='UTF-8') f.writelines(["\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "", hescape(title), "\n", "\n"]) for chapter in chapters: folder = chapter[0].replace(os.path.join(dstdir, 'OEBPS'), '').lstrip('/').lstrip('\\\\') filename = getImageFileName(os.path.join(folder, chapter[1])) navID = folder.replace('/', '_').replace('\\', '_') if options.chapters: title = chapternames[chapter[1]] navID = filename[0].replace('/', '_').replace('\\', '_') elif os.path.basename(folder) != "Text": title = chapternames[os.path.basename(folder)] f.write("" + hescape(title) + "\n") f.write("\n") f.close() def buildNAV(dstdir, title, chapters, chapternames): navfile = os.path.join(dstdir, 'OEBPS', 'nav.xhtml') f = open(navfile, "w", encoding='UTF-8') f.writelines(["\n", "\n", "\n", "\n", "" + hescape(title) + "\n", "\n", "\n", "\n", "\n", "\n\n") f.close() def buildOPF(dstdir, title, filelist, cover=None): opffile = os.path.join(dstdir, 'OEBPS', 'content.opf') deviceres = options.profileData[1] if options.righttoleft: writingmode = "horizontal-rl" else: writingmode = "horizontal-lr" f = open(opffile, "w", encoding='UTF-8') f.writelines(["\n", "\n", "\n", "", hescape(title), "\n", "en-US\n", "urn:uuid:", options.uuid, "\n", "KindleComicConverter-" + __version__ + "\n"]) if len(options.summary) > 0: f.writelines(["", options.summary, "\n"]) for author in options.authors: f.writelines(["", author, "\n"]) f.writelines(["" + strftime("%Y-%m-%dT%H:%M:%SZ", gmtime()) + "\n", "\n"]) if options.iskindle and options.profile != 'Custom': f.writelines(["\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "landscape\n", "pre-paginated\n", "\n"]) if options.kfx: f.writelines(["\n"]) else: f.writelines(["\n"]) elif options.supportSyntheticSpread: f.writelines([ "landscape\n", "pre-paginated\n" ]) else: f.writelines(["portrait\n", "portrait\n", "pre-paginated\n"]) f.writelines(["\n\n\n", "\n"]) if cover is not None: filename = getImageFileName(cover.replace(os.path.join(dstdir, 'OEBPS'), '').lstrip('/').lstrip('\\\\')) if '.png' == filename[1]: mt = 'image/png' else: mt = 'image/jpeg' f.write("\n") reflist = [] for path in filelist: folder = path[0].replace(os.path.join(dstdir, 'OEBPS'), '').lstrip('/').lstrip('\\\\').replace("\\", "/") filename = getImageFileName(path[1]) uniqueid = os.path.join(folder, filename[0]).replace('/', '_').replace('\\', '_') reflist.append(uniqueid) f.write("\n") if '.png' == filename[1]: mt = 'image/png' else: mt = 'image/jpeg' f.write("\n") f.write("\n") def pageSpreadProperty(pageside): if options.iskindle: return "linear=\"yes\" properties=\"page-spread-%s\"" % pageside elif options.isKobo: return "properties=\"rendition:page-spread-%s\"" % pageside else: return "" if options.righttoleft: f.write("\n\n") pageside = "right" else: f.write("\n\n") pageside = "left" if options.iskindle or options.supportSyntheticSpread: for entry in reflist: if options.righttoleft: if entry.endswith("-a"): f.write( "\n" % (entry, pageSpreadProperty("center")) ) pageside = "right" elif entry.endswith("-b"): f.write( "\n" % (entry, pageSpreadProperty("right")) ) pageside = "right" elif entry.endswith("-c"): f.write( "\n" % (entry, pageSpreadProperty("left")) ) pageside = "right" else: f.write( "\n" % (entry, pageSpreadProperty(pageside)) ) if pageside == "right": pageside = "left" else: pageside = "right" else: if entry.endswith("-a"): f.write( "\n" % (entry, pageSpreadProperty("center")) ) pageside = "left" elif entry.endswith("-b"): f.write( "\n" % (entry, pageSpreadProperty("left")) ) pageside = "left" elif entry.endswith("-c"): f.write( "\n" % (entry, pageSpreadProperty("right")) ) pageside = "left" else: f.write( "\n" % (entry, pageSpreadProperty(pageside)) ) if pageside == "right": pageside = "left" else: pageside = "right" else: for entry in reflist: f.write("\n") f.write("\n\n") f.close() os.mkdir(os.path.join(dstdir, 'META-INF')) f = open(os.path.join(dstdir, 'META-INF', 'container.xml'), 'w', encoding='UTF-8') f.writelines(["\n", "\n", "\n", "\n", "\n", ""]) f.close() def buildEPUB(path, chapternames, tomenumber, ischunked): filelist = [] chapterlist = [] cover = None os.mkdir(os.path.join(path, 'OEBPS', 'Text')) f = open(os.path.join(path, 'OEBPS', 'Text', 'style.css'), 'w', encoding='UTF-8') f.writelines(["@page {\n", "margin: 0;\n", "}\n", "body {\n", "display: block;\n", "margin: 0;\n", "padding: 0;\n", "}\n"]) if options.iskindle and options.panelview: f.writelines(["#PV {\n", "position: absolute;\n", "width: 100%;\n", "height: 100%;\n", "top: 0;\n", "left: 0;\n", "}\n", "#PV-T {\n", "top: 0;\n", "width: 100%;\n", "height: 50%;\n", "}\n", "#PV-B {\n", "bottom: 0;\n", "width: 100%;\n", "height: 50%;\n", "}\n", "#PV-L {\n", "left: 0;\n", "width: 49.5%;\n", "height: 100%;\n", "float: left;\n", "}\n", "#PV-R {\n", "right: 0;\n", "width: 49.5%;\n", "height: 100%;\n", "float: right;\n", "}\n", "#PV-TL {\n", "top: 0;\n", "left: 0;\n", "width: 49.5%;\n", "height: 50%;\n", "float: left;\n", "}\n", "#PV-TR {\n", "top: 0;\n", "right: 0;\n", "width: 49.5%;\n", "height: 50%;\n", "float: right;\n", "}\n", "#PV-BL {\n", "bottom: 0;\n", "left: 0;\n", "width: 49.5%;\n", "height: 50%;\n", "float: left;\n", "}\n", "#PV-BR {\n", "bottom: 0;\n", "right: 0;\n", "width: 49.5%;\n", "height: 50%;\n", "float: right;\n", "}\n", ".PV-P {\n", "width: 100%;\n", "height: 100%;\n", "top: 0;\n", "position: absolute;\n", "display: none;\n", "}\n"]) f.close() for dirpath, dirnames, filenames in os.walk(os.path.join(path, 'OEBPS', 'Images')): chapter = False dirnames, filenames = walkSort(dirnames, filenames) for afile in filenames: if cover is None: cover = os.path.join(os.path.join(path, 'OEBPS', 'Images'), 'cover' + getImageFileName(afile)[1]) options.covers.append((image.Cover(os.path.join(dirpath, afile), cover, options, tomenumber), options.uuid)) if options.dedupecover: os.remove(os.path.join(dirpath, afile)) continue filelist.append(buildHTML(dirpath, afile, os.path.join(dirpath, afile))) if not chapter: chapterlist.append((dirpath.replace('Images', 'Text'), filelist[-1][1])) chapter = True # Overwrite chapternames if tree is flat and ComicInfo.xml has bookmarks if not chapternames and options.chapters and not ischunked: chapterlist = [] global_diff = 0 diff_delta = 0 # if split if options.splitter == 0: diff_delta = 1 # if rotate and split elif options.splitter == 2: diff_delta = 2 for aChapter in options.chapters: pageid = aChapter[0] if options.dedupecover: if pageid == 0: continue else: pageid -= 1 cur_diff = global_diff global_diff = 0 for x in range(0, pageid + cur_diff + 1): if '-kcc-b' in filelist[x][1]: pageid += diff_delta global_diff += diff_delta filename = filelist[pageid][1] chapterlist.append((filelist[pageid][0].replace('Images', 'Text'), filename)) chapternames[filename] = aChapter[1] buildNCX(path, options.title, chapterlist, chapternames) buildNAV(path, options.title, chapterlist, chapternames) buildOPF(path, options.title, filelist, cover) def imgDirectoryProcessing(path): global workerPool, workerOutput workerPool = Pool(maxtasksperchild=100) workerOutput = [] options.imgMetadata = {} options.imgOld = [] work = [] pagenumber = 0 for dirpath, _, filenames in os.walk(path): for afile in filenames: pagenumber += 1 work.append([afile, dirpath, options]) if GUI: GUI.progressBarTick.emit(str(pagenumber)) if len(work) > 0: for i in work: workerPool.apply_async(func=imgFileProcessing, args=(i,), callback=imgFileProcessingTick) workerPool.close() workerPool.join() if GUI and not GUI.conversionAlive: rmtree(os.path.join(path, '..', '..'), True) raise UserWarning("Conversion interrupted.") if len(workerOutput) > 0: rmtree(os.path.join(path, '..', '..'), True) raise RuntimeError("One of workers crashed. Cause: " + workerOutput[0][0], workerOutput[0][1]) for file in options.imgOld: if os.path.isfile(file): os.remove(file) else: rmtree(os.path.join(path, '..', '..'), True) raise UserWarning("Source directory is empty.") def imgFileProcessingTick(output): if isinstance(output, tuple): workerOutput.append(output) workerPool.terminate() else: for page in output: if page is not None: options.imgMetadata[page[0]] = page[1] options.imgOld.append(page[2]) if GUI: GUI.progressBarTick.emit('tick') if not GUI.conversionAlive: workerPool.terminate() def imgFileProcessing(work): try: afile = work[0] dirpath = work[1] opt = work[2] output = [] workImg = image.ComicPageParser((dirpath, afile), opt) for i in workImg.payload: img = image.ComicPage(opt, *i) if opt.cropping == 2 and not opt.webtoon: img.cropPageNumber(opt.croppingp, opt.croppingm) if opt.cropping > 0 and not opt.webtoon: img.cropMargin(opt.croppingp, opt.croppingm) img.autocontrastImage() img.resizeImage() if opt.forcepng and not opt.forcecolor: img.quantizeImage() output.append(img.saveToDir()) return output except Exception: return str(sys.exc_info()[1]), sanitizeTrace(sys.exc_info()[2]) def getWorkFolder(afile): if os.path.isdir(afile): if disk_usage(gettempdir())[2] < getDirectorySize(afile) * 2.5: raise UserWarning("Not enough disk space to perform conversion.") workdir = mkdtemp('', 'KCC-') try: os.rmdir(workdir) fullPath = os.path.join(workdir, 'OEBPS', 'Images') copytree(afile, fullPath) sanitizePermissions(fullPath) return workdir except Exception: rmtree(workdir, True) raise UserWarning("Failed to prepare a workspace.") elif os.path.isfile(afile): if disk_usage(gettempdir())[2] < os.path.getsize(afile) * 2.5: raise UserWarning("Not enough disk space to perform conversion.") if afile.lower().endswith('.pdf'): pdf = pdfjpgextract.PdfJpgExtract(afile) path, njpg = pdf.extract() if njpg == 0: rmtree(path, True) raise UserWarning("Failed to extract images from PDF file.") else: workdir = mkdtemp('', 'KCC-') try: cbx = comicarchive.ComicArchive(afile) path = cbx.extract(workdir) tdir = os.listdir(workdir) if 'ComicInfo.xml' in tdir: tdir.remove('ComicInfo.xml') except OSError as e: rmtree(workdir, True) raise UserWarning(e) else: raise UserWarning("Failed to open source file/directory.") sanitizePermissions(path) newpath = mkdtemp('', 'KCC-') copytree(path, os.path.join(newpath, 'OEBPS', 'Images')) rmtree(path, True) return newpath def getOutputFilename(srcpath, wantedname, ext, tomenumber): if srcpath[-1] == os.path.sep: srcpath = srcpath[:-1] if 'Ko' in options.profile and options.format == 'EPUB': ext = '.kepub.epub' if wantedname is not None: if wantedname.endswith(ext): filename = os.path.abspath(wantedname) elif os.path.isdir(srcpath): filename = os.path.join(os.path.abspath(options.output), os.path.basename(srcpath) + ext) else: filename = os.path.join(os.path.abspath(options.output), os.path.basename(os.path.splitext(srcpath)[0]) + ext) elif os.path.isdir(srcpath): filename = srcpath + tomenumber + ext else: if 'Ko' in options.profile and options.format == 'EPUB': src = pathlib.Path(srcpath) name = re.sub(r'\W+', '_', src.stem) + tomenumber + ext filename = src.with_name(name) else: filename = os.path.splitext(srcpath)[0] + tomenumber + ext if os.path.isfile(filename): counter = 0 basename = os.path.splitext(filename)[0] while os.path.isfile(basename + '_kcc' + str(counter) + ext): counter += 1 filename = basename + '_kcc' + str(counter) + ext return filename def getComicInfo(path, originalpath): xmlPath = os.path.join(path, 'ComicInfo.xml') options.chapters = [] options.summary = '' titleSuffix = '' if options.title == 'defaulttitle': defaultTitle = True if os.path.isdir(originalpath): options.title = os.path.basename(originalpath) else: options.title = os.path.splitext(os.path.basename(originalpath))[0] else: defaultTitle = False if options.author == 'defaultauthor': defaultAuthor = True options.authors = ['KCC'] else: defaultAuthor = False options.authors = [options.author] if os.path.exists(xmlPath): try: xml = metadata.MetadataParser(xmlPath) except Exception: os.remove(xmlPath) return if xml.data['Title']: options.title = hescape(xml.data['Title']) elif defaultTitle: if xml.data['Series']: options.title = hescape(xml.data['Series']) if xml.data['Volume']: titleSuffix += ' V' + xml.data['Volume'].zfill(2) if xml.data['Number']: titleSuffix += ' #' + xml.data['Number'].zfill(3) options.title += titleSuffix if defaultAuthor: options.authors = [] for field in ['Writers', 'Pencillers', 'Inkers', 'Colorists']: for person in xml.data[field]: options.authors.append(hescape(person)) if len(options.authors) > 0: options.authors = list(set(options.authors)) options.authors.sort() else: options.authors = ['KCC'] if xml.data['Bookmarks']: options.chapters = xml.data['Bookmarks'] if xml.data['Summary']: options.summary = hescape(xml.data['Summary']) os.remove(xmlPath) def getDirectorySize(start_path='.'): total_size = 0 for dirpath, _, filenames in os.walk(start_path): for f in filenames: fp = os.path.join(dirpath, f) total_size += os.path.getsize(fp) return total_size def getTopMargin(deviceres, size): y = int((deviceres[1] - size[1]) / 2) / deviceres[1] * 100 return str(round(y, 1)) def getPanelViewResolution(imagesize, deviceres): scale = float(deviceres[0]) / float(imagesize[0]) return int(deviceres[0]), int(scale * imagesize[1]) def getPanelViewSize(deviceres, size): x = int(deviceres[0] / 2 - size[0] / 2) / deviceres[0] * 100 y = int(deviceres[1] / 2 - size[1] / 2) / deviceres[1] * 100 return str(int(x)), str(int(y)) def sanitizeTree(filetree): chapterNames = {} for root, dirs, files in os.walk(filetree, False): for i, name in enumerate(os_sorted(files)): splitname = os.path.splitext(name) # file needs kcc at front AND back to avoid renaming issues slugified = f'kcc-{i:04}' for suffix in '-KCC', '-KCC-A', '-KCC-B', '-KCC-C': if splitname[0].endswith(suffix): slugified += suffix.lower() break newKey = os.path.join(root, slugified + splitname[1]) key = os.path.join(root, name) if key != newKey: os.replace(key, newKey) for name in dirs: tmpName = name slugified = slugify(name) while os.path.exists(os.path.join(root, slugified)) and name.upper() != slugified.upper(): slugified += "A" chapterNames[slugified] = tmpName newKey = os.path.join(root, slugified) key = os.path.join(root, name) if key != newKey: os.replace(key, newKey) return chapterNames def sanitizePermissions(filetree): for root, dirs, files in os.walk(filetree, False): for name in files: os.chmod(os.path.join(root, name), S_IWRITE | S_IREAD) for name in dirs: os.chmod(os.path.join(root, name), S_IWRITE | S_IREAD | S_IEXEC) def splitDirectory(path): level = -1 for root, _, files in os.walk(os.path.join(path, 'OEBPS', 'Images')): for f in files: if f.endswith('.jpg') or f.endswith('.jpeg') or f.endswith('.png') or f.endswith('.gif') or \ f.endswith('.webp'): newLevel = os.path.join(root, f).replace(os.path.join(path, 'OEBPS', 'Images'), '').count(os.sep) if level != -1 and level != newLevel: level = 0 break else: level = newLevel if level > 0: splitter = splitProcess(os.path.join(path, 'OEBPS', 'Images'), level) path = [path] for tome in splitter: path.append(tome) return path else: raise UserWarning('Unsupported directory structure.') def splitProcess(path, mode): output = [] currentSize = 0 currentTarget = path if options.targetsize: targetSize = options.targetsize * 1048576 elif options.webtoon: targetSize = 104857600 else: targetSize = 419430400 if options.batchsplit == 2 and mode == 2: mode = 3 if mode < 3: for root, dirs, files in walkLevel(path, 0): for name in files if mode == 1 else dirs: if mode == 1: size = os.path.getsize(os.path.join(root, name)) else: size = getDirectorySize(os.path.join(root, name)) if currentSize + size > targetSize: currentTarget, pathRoot = createNewTome() output.append(pathRoot) currentSize = size else: currentSize += size if path != currentTarget: move(os.path.join(root, name), os.path.join(currentTarget, name)) else: firstTome = True for root, dirs, _ in walkLevel(path, 0): for name in dirs: if not firstTome: currentTarget, pathRoot = createNewTome() output.append(pathRoot) move(os.path.join(root, name), os.path.join(currentTarget, name)) else: firstTome = False return output def detectCorruption(tmppath, orgpath): imageNumber = 0 imageSmaller = 0 alreadyProcessed = False for root, _, files in os.walk(tmppath, False): for name in files: if getImageFileName(name) is not None: if not alreadyProcessed and getImageFileName(name)[0].endswith('-kcc'): alreadyProcessed = True path = os.path.join(root, name) pathOrg = orgpath + path.split('OEBPS' + os.path.sep + 'Images')[1] if os.path.getsize(path) == 0: rmtree(os.path.join(tmppath, '..', '..'), True) raise RuntimeError('Image file %s is corrupted.' % pathOrg) try: img = Image.open(path) img.verify() img = Image.open(path) img.load() imageNumber += 1 if options.profileData[1][0] > img.size[0] and options.profileData[1][1] > img.size[1]: imageSmaller += 1 except Exception as err: rmtree(os.path.join(tmppath, '..', '..'), True) if 'decoder' in str(err) and 'not available' in str(err): raise RuntimeError('Pillow was compiled without JPG and/or PNG decoder.') else: raise RuntimeError('Image file %s is corrupted. Error: %s' % (pathOrg, str(err))) else: os.remove(os.path.join(root, name)) if alreadyProcessed: print("WARNING: Source files are probably created by KCC. The second conversion will decrease quality.") if GUI: GUI.addMessage.emit('Source files are probably created by KCC. The second conversion will decrease quality.' , 'warning', False) GUI.addMessage.emit('', '', False) if imageSmaller > imageNumber * 0.25 and not options.upscale and not options.stretch and options.profile != 'KS': print("WARNING: More than 25% of images are smaller than target device resolution. " "Consider enabling stretching or upscaling to improve readability.") if GUI: GUI.addMessage.emit('More than 25% of images are smaller than target device resolution.', 'warning', False) GUI.addMessage.emit('Consider enabling stretching or upscaling to improve readability.', 'warning', False) GUI.addMessage.emit('', '', False) def createNewTome(): tomePathRoot = mkdtemp('', 'KCC-') tomePath = os.path.join(tomePathRoot, 'OEBPS', 'Images') os.makedirs(tomePath) return tomePath, tomePathRoot def slugify(value): value = slugify_ext(value, regex_pattern=r'[^-a-z0-9_\.]+').strip('.') value = sub(r'0*([0-9]{4,})', r'\1', sub(r'([0-9]+)', r'0000\1', value, count=2)) return value def makeZIP(zipfilename, basedir, isepub=False): zipfilename = os.path.abspath(zipfilename) + '.zip' zipOutput = ZipFile(zipfilename, 'w', ZIP_DEFLATED) if isepub: zipOutput.writestr('mimetype', 'application/epub+zip', ZIP_STORED) for dirpath, _, filenames in os.walk(basedir): for name in filenames: path = os.path.normpath(os.path.join(dirpath, name)) aPath = os.path.normpath(os.path.join(dirpath.replace(basedir, ''), name)) if os.path.isfile(path): zipOutput.write(path, aPath) zipOutput.close() return zipfilename def makeParser(): psr = ArgumentParser(prog="kcc-c2e", usage="kcc-c2e [options] [input]", add_help=False) mandatory_options = psr.add_argument_group("MANDATORY") main_options = psr.add_argument_group("MAIN") processing_options = psr.add_argument_group("PROCESSING") output_options = psr.add_argument_group("OUTPUT SETTINGS") custom_profile_options = psr.add_argument_group("CUSTOM PROFILE") other_options = psr.add_argument_group("OTHER") mandatory_options.add_argument("input", action="extend", nargs="*", default=None, help="Full path to comic folder or file(s) to be processed.") main_options.add_argument("-p", "--profile", action="store", dest="profile", default="KV", help=f"Device profile (Available options: {', '.join(image.ProfileData.Profiles.keys())})" " [Default=KV]") main_options.add_argument("-m", "--manga-style", action="store_true", dest="righttoleft", default=False, help="Manga style (right-to-left reading and splitting)") main_options.add_argument("-q", "--hq", action="store_true", dest="hq", default=False, help="Try to increase the quality of magnification") main_options.add_argument("-2", "--two-panel", action="store_true", dest="autoscale", default=False, help="Display two not four panels in Panel View mode") main_options.add_argument("-w", "--webtoon", action="store_true", dest="webtoon", default=False, help="Webtoon processing mode"), main_options.add_argument("--ts", "--targetsize", type=int, dest="targetsize", default=None, help="the maximal size of output file in MB." " [Default=100MB for webtoon and 400MB for others]") output_options.add_argument("-o", "--output", action="store", dest="output", default=None, help="Output generated file to specified directory or file") output_options.add_argument("-t", "--title", action="store", dest="title", default="defaulttitle", help="Comic title [Default=filename or directory name]") output_options.add_argument("-a", "--author", action="store", dest="author", default="defaultauthor", help="Author name [Default=KCC]") output_options.add_argument("-f", "--format", action="store", dest="format", default="Auto", help="Output format (Available options: Auto, MOBI, EPUB, CBZ, KFX, MOBI+EPUB) " "[Default=Auto]") output_options.add_argument("-b", "--batchsplit", type=int, dest="batchsplit", default="0", help="Split output into multiple files. 0: Don't split 1: Automatic mode " "2: Consider every subdirectory as separate volume [Default=0]") output_options.add_argument("--dedupecover", action="store_true", dest="dedupecover", default=False, help="De-duplicate the cover as the first page in the book") processing_options.add_argument("-n", "--noprocessing", action="store_true", dest="noprocessing", default=False, help="Do not modify image and ignore any profil or processing option") processing_options.add_argument("-u", "--upscale", action="store_true", dest="upscale", default=False, help="Resize images smaller than device's resolution") processing_options.add_argument("-s", "--stretch", action="store_true", dest="stretch", default=False, help="Stretch images to device's resolution") processing_options.add_argument("-r", "--splitter", type=int, dest="splitter", default="0", help="Double page parsing mode. 0: Split 1: Rotate 2: Both [Default=0]") processing_options.add_argument("-g", "--gamma", type=float, dest="gamma", default="0.0", help="Apply gamma correction to linearize the image [Default=Auto]") processing_options.add_argument("-c", "--cropping", type=int, dest="cropping", default="2", help="Set cropping mode. 0: Disabled 1: Margins 2: Margins + page numbers [Default=2]") processing_options.add_argument("--cp", "--croppingpower", type=float, dest="croppingp", default="1.0", help="Set cropping power [Default=1.0]") processing_options.add_argument("--cm", "--croppingminimum", type=float, dest="croppingm", default="0.0", help="Set cropping minimum area ratio [Default=0.0]") processing_options.add_argument("--blackborders", action="store_true", dest="black_borders", default=False, help="Disable autodetection and force black borders") processing_options.add_argument("--whiteborders", action="store_true", dest="white_borders", default=False, help="Disable autodetection and force white borders") processing_options.add_argument("--forcecolor", action="store_true", dest="forcecolor", default=False, help="Don't convert images to grayscale") processing_options.add_argument("--forcepng", action="store_true", dest="forcepng", default=False, help="Create PNG files instead JPEG") processing_options.add_argument("--mozjpeg", action="store_true", dest="mozjpeg", default=False, help="Create JPEG files using mozJpeg") processing_options.add_argument("--maximizestrips", action="store_true", dest="maximizestrips", default=False, help="Turn 1x4 strips to 2x2 strips") processing_options.add_argument("-d", "--delete", action="store_true", dest="delete", default=False, help="Delete source file(s) or a directory. It's not recoverable.") custom_profile_options.add_argument("--customwidth", type=int, dest="customwidth", default=0, help="Replace screen width provided by device profile") custom_profile_options.add_argument("--customheight", type=int, dest="customheight", default=0, help="Replace screen height provided by device profile") other_options.add_argument("-h", "--help", action="help", help="Show this help message and exit") return psr def checkOptions(options): options.panelview = True options.iskindle = False options.isKobo = False options.bordersColor = None options.keep_epub = False if options.format == 'EPUB-200MB': options.targetsize = 195 options.format = 'EPUB' if options.batchsplit != 2: options.batchsplit = 1 if options.format == 'MOBI+EPUB': options.keep_epub = True options.format = 'MOBI' options.kfx = False options.supportSyntheticSpread = False if options.format == 'Auto': if options.profile in ['KDX']: options.format = 'CBZ' elif options.profile in image.ProfileData.ProfilesKindle.keys(): options.format = 'MOBI' else: options.format = 'EPUB' if options.profile in image.ProfileData.ProfilesKindle.keys(): options.iskindle = True else: options.isKobo = True # Other Kobo devices probably support synthetic spreads as well, but # they haven't been tested. if options.profile in ['KoF']: options.supportSyntheticSpread = True if options.white_borders: options.bordersColor = 'white' if options.black_borders: options.bordersColor = 'black' # Splitting MOBI is not optional if (options.format == 'MOBI' or options.format == 'KFX') and options.batchsplit != 2: options.batchsplit = 1 # Older Kindle models don't support Panel View. if options.profile == 'K1' or options.profile == 'K2' or options.profile == 'K34' or options.profile == 'KDX': options.panelview = False options.hq = False # Webtoon mode mandatory options if options.webtoon: options.panelview = False options.righttoleft = False options.upscale = True options.hq = False # Disable all Kindle features for other e-readers if options.profile == 'OTHER': options.panelview = False options.hq = False if 'Ko' in options.profile: options.panelview = False options.hq = False # CBZ files on Kindle DX/DXG support higher resolution if options.profile == 'KDX' and options.format == 'CBZ': options.customheight = 1200 # KFX output create EPUB that might be can be by jhowell KFX Output Calibre plugin if options.format == 'KFX': options.format = 'EPUB' options.kfx = True options.panelview = False # Override profile data if options.customwidth != 0 or options.customheight != 0: X = image.ProfileData.Profiles[options.profile][1][0] Y = image.ProfileData.Profiles[options.profile][1][1] if options.customwidth != 0: X = options.customwidth if options.customheight != 0: Y = options.customheight newProfile = ("Custom", (int(X), int(Y)), image.ProfileData.Palette16, image.ProfileData.Profiles[options.profile][3]) image.ProfileData.Profiles["Custom"] = newProfile options.profile = "Custom" options.profileData = image.ProfileData.Profiles[options.profile] return options def checkTools(source): source = source.upper() if source.endswith('.CB7') or source.endswith('.7Z') or source.endswith('.RAR') or source.endswith('.CBR') or \ source.endswith('.ZIP') or source.endswith('.CBZ'): try: subprocess_run(['7z'], stdout=PIPE, stderr=STDOUT) except FileNotFoundError: print('ERROR: 7z is missing!') sys.exit(1) if options.format == 'MOBI': try: subprocess_run(['kindlegen', '-locale', 'en'], stdout=PIPE, stderr=STDOUT) except FileNotFoundError: print('ERROR: KindleGen is missing!') sys.exit(1) def checkPre(source): # Make sure that all temporary files are gone for root, dirs, _ in walkLevel(gettempdir(), 0): for tempdir in dirs: if tempdir.startswith('KCC-'): rmtree(os.path.join(root, tempdir), True) # Make sure that target directory is writable if os.path.isdir(source): src = os.path.abspath(os.path.join(source, '..')) else: src = os.path.dirname(source) try: with TemporaryFile(prefix='KCC-', dir=src): pass except Exception: raise UserWarning("Target directory is not writable.") def makeBook(source, qtgui=None): global GUI GUI = qtgui if GUI: GUI.progressBarTick.emit('1') else: checkTools(source) checkPre(source) print("Preparing source images...") path = getWorkFolder(source) print("Checking images...") getComicInfo(os.path.join(path, "OEBPS", "Images"), source) detectCorruption(os.path.join(path, "OEBPS", "Images"), source) if options.webtoon: y = image.ProfileData.Profiles[options.profile][1][1] comic2panel.main(['-y ' + str(y), '-i', '-m', path], qtgui) if options.noprocessing: print("Do not process image, ignore any profile or processing option") else: print("Processing images...") if GUI: GUI.progressBarTick.emit('Processing images') imgDirectoryProcessing(os.path.join(path, "OEBPS", "Images")) if GUI: GUI.progressBarTick.emit('1') chapterNames = sanitizeTree(os.path.join(path, 'OEBPS', 'Images')) if options.batchsplit > 0: tomes = splitDirectory(path) else: tomes = [path] filepath = [] tomeNumber = 0 if GUI: if options.format == 'CBZ': GUI.progressBarTick.emit('Compressing CBZ files') else: GUI.progressBarTick.emit('Compressing EPUB files') GUI.progressBarTick.emit(str(len(tomes) + 1)) GUI.progressBarTick.emit('tick') options.baseTitle = options.title options.covers = [] for tome in tomes: options.uuid = str(uuid4()) if len(tomes) > 9: tomeNumber += 1 options.title = options.baseTitle + ' [' + str(tomeNumber).zfill(2) + '/' + str(len(tomes)).zfill(2) + ']' elif len(tomes) > 1: tomeNumber += 1 options.title = options.baseTitle + ' [' + str(tomeNumber) + '/' + str(len(tomes)) + ']' if options.format == 'CBZ': print("Creating CBZ file...") if len(tomes) > 1: filepath.append(getOutputFilename(source, options.output, '.cbz', ' ' + str(tomeNumber))) else: filepath.append(getOutputFilename(source, options.output, '.cbz', '')) makeZIP(tome + '_comic', os.path.join(tome, "OEBPS", "Images")) else: print("Creating EPUB file...") if len(tomes) > 1: buildEPUB(tome, chapterNames, tomeNumber, True) filepath.append(getOutputFilename(source, options.output, '.epub', ' ' + str(tomeNumber))) else: buildEPUB(tome, chapterNames, tomeNumber, False) filepath.append(getOutputFilename(source, options.output, '.epub', '')) makeZIP(tome + '_comic', tome, True) copyfile(tome + '_comic.zip', filepath[-1]) try: os.remove(tome + '_comic.zip') except FileNotFoundError: # newly temporary created file is not found. It might have been already deleted pass rmtree(tome, True) if GUI: GUI.progressBarTick.emit('tick') if not GUI and options.format == 'MOBI': print("Creating MOBI files...") work = [] for i in filepath: work.append([i]) output = makeMOBI(work, GUI) for errors in output: if errors[0] != 0: print('Error: KindleGen failed to create MOBI!') print(errors) return filepath k = kindle.Kindle(options.profile) if k.path and k.coverSupport: print("Kindle detected. Uploading covers...") for i in filepath: output = makeMOBIFix(i, options.covers[filepath.index(i)][1]) if not output[0]: print('Error: Failed to tweak KindleGen output!') return filepath else: os.remove(i.replace('.epub', '.mobi') + '_toclean') if k.path and k.coverSupport: options.covers[filepath.index(i)][0].saveToKindle(k, options.covers[filepath.index(i)][1]) if options.delete: if os.path.isfile(source): os.remove(source) elif os.path.isdir(source): rmtree(source) return filepath def makeMOBIFix(item, uuid): is_pdoc = options.profile in image.ProfileData.ProfilesKindlePDOC.keys() if not options.keep_epub: os.remove(item) mobiPath = item.replace('.epub', '.mobi') move(mobiPath, mobiPath + '_toclean') try: dualmetafix.DualMobiMetaFix(mobiPath + '_toclean', mobiPath, bytes(uuid, 'UTF-8'), is_pdoc) return [True] except Exception as err: return [False, format(err)] def makeMOBIWorkerTick(output): makeMOBIWorkerOutput.append(output) if output[0] != 0: makeMOBIWorkerPool.terminate() if GUI: GUI.progressBarTick.emit('tick') if not GUI.conversionAlive: makeMOBIWorkerPool.terminate() def makeMOBIWorker(item): item = item[0] kindlegenErrorCode = 0 kindlegenError = '' try: if os.path.getsize(item) < 629145600: output = subprocess_run(['kindlegen', '-dont_append_source', '-locale', 'en', item], stdout=PIPE, stderr=STDOUT, encoding='UTF-8') for line in output.stdout.splitlines(): # ERROR: Generic error if "Error(" in line: kindlegenErrorCode = 1 kindlegenError = line # ERROR: EPUB too big if ":E23026:" in line: kindlegenErrorCode = 23026 if kindlegenErrorCode > 0: break if ":I1036: Mobi file built successfully" in line: break else: # ERROR: EPUB too big kindlegenErrorCode = 23026 return [kindlegenErrorCode, kindlegenError, item] except Exception as err: # ERROR: KCC unknown generic error kindlegenErrorCode = 1 kindlegenError = format(err) return [kindlegenErrorCode, kindlegenError, item] def makeMOBI(work, qtgui=None): global GUI, makeMOBIWorkerPool, makeMOBIWorkerOutput GUI = qtgui makeMOBIWorkerOutput = [] availableMemory = virtual_memory().total / 1000000000 if availableMemory <= 2: threadNumber = 1 elif 2 < availableMemory <= 4: threadNumber = 2 elif 4 < availableMemory: threadNumber = 4 else: threadNumber = None makeMOBIWorkerPool = Pool(threadNumber, maxtasksperchild=10) for i in work: makeMOBIWorkerPool.apply_async(func=makeMOBIWorker, args=(i, ), callback=makeMOBIWorkerTick) makeMOBIWorkerPool.close() makeMOBIWorkerPool.join() return makeMOBIWorkerOutput