Переименования

This commit is contained in:
Book Pauk
2022-11-10 00:40:44 +07:00
parent 8ee1b98a12
commit ec6b72868b
4 changed files with 31 additions and 95 deletions

View File

@@ -1,101 +1,37 @@
const fs = require('fs-extra');
const iconv = require('iconv-lite');
const textUtils = require('./textUtils');
const XmlParser = require('../xml/XmlParser');
const utils = require('../utils');
// Fb2Parser: helper class for FB2 (FictionBook) data built on top of XmlParser.
//
// NOTE(review): this region looks like a rendered diff whose add/remove markers
// and indentation were lost, so lines of two versions of the class appear to be
// interleaved (e.g. checkEncoding() is never closed before constructor(), and
// the statements of getDescAndCover() alternate with other method definitions).
// As written it does not parse as JavaScript — confirm against the repository
// before relying on any of it.
class Fb2Parser {
// Returns `data` (a Buffer) adjusted so that its bytes and its XML declaration
// agree on utf-8: UTF-16 input is decoded, leading spaces are trimmed, and a
// non-utf-8 `encoding="..."` attribute in the XML declaration triggers a decode
// plus a rewrite of that attribute.
checkEncoding(data) {
// Fix up UTF-16 encoding
let encoding = textUtils.getEncoding(data);
if (encoding.indexOf('UTF-16') == 0) {
// Buffer.from(string) encodes as utf-8 by default, hence the label change below.
data = Buffer.from(iconv.decode(data, encoding));
encoding = 'utf-8';
}
// Fix up whitespace; all sorts of files turn up :(
// (32 is the byte value of an ASCII space; only a leading space triggers the trim.)
if (data[0] == 32) {
data = Buffer.from(data.toString().trim());
}
// Final encoding fix-up
let result = data;
// Locate the XML declaration, accepting either quote style around the version.
let left = data.indexOf('<?xml version="1.0"');
if (left < 0) {
left = data.indexOf('<?xml version=\'1.0\'');
}
if (left >= 0) {
const right = data.indexOf('?>', left);
if (right >= 0) {
// `head` is the full declaration text, from '<?xml' through '?>'.
const head = data.slice(left, right + 2).toString();
const m = head.match(/encoding=['"](.*?)['"]/);
if (m) {
let enc = m[1].toLowerCase();
if (enc != 'utf-8') {
// enc may not match the file's real encoding, so:
// the declared value is used only when the detected encoding contains
// 'ISO-8859'; otherwise the detected encoding is kept.
if (encoding.indexOf('ISO-8859') >= 0) {
encoding = enc;
}
result = iconv.decode(data, encoding);
// Replace the first occurrence of the matched encoding attribute with utf-8.
result = Buffer.from(result.toString().replace(m[0], `encoding="utf-8"`));
}
}
}
}
return result;
// Creates the XmlParser instance that the delegating methods below operate on.
constructor() {
this.xml = new XmlParser();
}
// Reads `bookFile`, passes it through utils.gunzipBuffer and checkEncoding, parses
// it, and returns {desc, cover, coverExt} (see the return statement further down).
async getDescAndCover(bookFile) {
let data = await fs.readFile(bookFile);
data = await utils.gunzipBuffer(data);
// Delegates serialization to the wrapped XmlParser.
toString(options) {
return this.xml.toString(options);
}
data = this.checkEncoding(data);
// Loads an FB2 string into the wrapped XmlParser; returns `this` for chaining.
fromString(fb2String) {
this.xml.fromString(fb2String);
return this;
}
const xml = new XmlParser();
// Delegates object conversion to the wrapped XmlParser.
toObject(options) {
return this.xml.toObject(options);
}
// pickNode returns false for routes that start with 'fictionbook/body';
// presumably this makes the parser skip the book body — confirm against XmlParser.
xml.fromString(data.toString(), {
lowerCase: true,
pickNode: route => route.indexOf('fictionbook/body') !== 0,
});
// Loads an FB2 object into the wrapped XmlParser; returns `this` for chaining.
fromObject(fb2Object) {
this.xml.fromObject(fb2Object);
return this;
}
const desc = xml.$$('description').toObject();
const coverImage = xml.navigator(desc).$('description/title-info/coverpage/image');
// Falls back to this.toObject() when no fb2Object is supplied.
// NOTE(review): the rest of this method's body is not distinguishable from the
// interleaved getDescAndCover() statements here — confirm against the repository.
bookInfo(fb2Object) {
if (!fb2Object)
fb2Object = this.toObject();
let cover = null;
let coverExt = '';
if (coverImage) {
const coverAttrs = coverImage.attrs();
const href = coverAttrs['l:href'];
let coverType = coverAttrs['content-type'];
// 'image/jpg' and 'application/octet-stream' are both treated as 'image/jpeg'.
coverType = (coverType == 'image/jpg' || coverType == 'application/octet-stream' ? 'image/jpeg' : coverType);
// Any type other than 'image/png' gets the '.jpg' extension.
coverExt = (coverType == 'image/png' ? '.png' : '.jpg');
//const result = {};
if (href) {
// Drop a leading '#' so the value can be compared with a <binary> id attribute.
const binaryId = (href[0] == '#' ? href.substring(1) : href);
}
// Find the required image
xml.$$('binary').eachSelf(node => {
let attrs = node.attrs();
if (!attrs)
return;
// presumably attrs() yields key/value entries (e.g. a Map) — verify against XmlParser
attrs = Object.fromEntries(attrs);
if (attrs.id === binaryId) {
const textNode = new XmlParser(node.value);
const base64 = textNode.$self('*TEXT').value;
// Decode the base64 text into a Buffer; an empty/missing value yields null.
cover = (base64 ? Buffer.from(base64, 'base64') : null);
}
});
}
}
return {desc, cover, coverExt};
// NOTE(review): no statements for this method are visible in this view.
bookInfoList(fb2Object) {
}
}