Улучшение парсинга html

This commit is contained in:
Book Pauk
2019-03-16 16:40:31 +07:00
parent e800dfe796
commit 983d9ee1b9
3 changed files with 9 additions and 0 deletions

View File

@@ -1,6 +1,7 @@
const fs = require('fs-extra');
const iconv = require('iconv-lite');
const chardet = require('chardet');
const he = require('he');
const textUtils = require('./textUtils');
const utils = require('../utils');
@@ -80,6 +81,10 @@ class ConvertBase {
return text.replace(/ |[\t\n\r]/g, ' ');
}
escapeEntities(text) {
return he.escape(text);
}
formatFb2(fb2) {
let out = '<?xml version="1.0" encoding="utf-8"?>';
out += '<FictionBook xmlns="http://www.gribuser.ru/xml/fictionbook/2.0" xmlns:l="http://www.w3.org/1999/xlink">';