WebWorker.js 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631
  1. const os = require('os');
  2. const path = require('path');
  3. const fs = require('fs-extra');
  4. const _ = require('lodash');
  5. const ZipReader = require('./ZipReader');
  6. const WorkerState = require('./WorkerState');//singleton
  7. const { JembaDb, JembaDbThread } = require('jembadb');
  8. const DbCreator = require('./DbCreator');
  9. const DbSearcher = require('./DbSearcher');
  10. const InpxHashCreator = require('./InpxHashCreator');
  11. const RemoteLib = require('./RemoteLib');//singleton
  12. const ayncExit = new (require('./AsyncExit'))();
  13. const log = new (require('./AppLogger'))().log;//singleton
  14. const utils = require('./utils');
  15. const genreTree = require('./genres');
  16. //server states
  17. const ssNormal = 'normal';
  18. const ssDbLoading = 'db_loading';
  19. const ssDbCreating = 'db_creating';
  20. const stateToText = {
  21. [ssNormal]: '',
  22. [ssDbLoading]: 'Загрузка поисковой базы',
  23. [ssDbCreating]: 'Создание поисковой базы',
  24. };
  25. const cleanDirPeriod = 60*60*1000;//каждый час
  26. //singleton
  27. let instance = null;
  28. class WebWorker {
  29. constructor(config) {
  30. if (!instance) {
  31. this.config = config;
  32. this.workerState = new WorkerState();
  33. this.remoteLib = null;
  34. if (config.remoteLib) {
  35. this.remoteLib = new RemoteLib(config);
  36. }
  37. this.inpxHashCreator = new InpxHashCreator(config);
  38. this.inpxFileHash = '';
  39. this.wState = this.workerState.getControl('server_state');
  40. this.myState = '';
  41. this.db = null;
  42. this.dbSearcher = null;
  43. ayncExit.add(this.closeDb.bind(this));
  44. this.loadOrCreateDb();//no await
  45. this.periodicLogServerStats();//no await
  46. const dirConfig = [
  47. {
  48. dir: config.filesDir,
  49. maxSize: config.maxFilesDirSize,
  50. },
  51. ];
  52. this.periodicCleanDir(dirConfig);//no await
  53. this.periodicCheckInpx();//no await
  54. instance = this;
  55. }
  56. return instance;
  57. }
  58. checkMyState() {
  59. if (this.myState != ssNormal)
  60. throw new Error('server_busy');
  61. }
  62. setMyState(newState, workerState = {}) {
  63. this.myState = newState;
  64. this.wState.set(Object.assign({}, workerState, {
  65. state: newState,
  66. serverMessage: stateToText[newState]
  67. }));
  68. }
  69. async closeDb() {
  70. if (this.db) {
  71. await this.db.unlock();
  72. this.db = null;
  73. }
  74. }
  75. async createDb(dbPath) {
  76. this.setMyState(ssDbCreating);
  77. log('Searcher DB create start');
  78. const config = this.config;
  79. if (await fs.pathExists(dbPath))
  80. throw new Error(`createDb.pathExists: ${dbPath}`);
  81. const db = new JembaDbThread();
  82. await db.lock({
  83. dbPath,
  84. create: true,
  85. softLock: true,
  86. tableDefaults: {
  87. cacheSize: config.dbCacheSize,
  88. },
  89. });
  90. try {
  91. const dbCreator = new DbCreator(config);
  92. await dbCreator.run(db, (state) => {
  93. this.setMyState(ssDbCreating, state);
  94. if (state.fileName)
  95. log(` load ${state.fileName}`);
  96. if (state.recsLoaded)
  97. log(` processed ${state.recsLoaded} records`);
  98. if (state.job)
  99. log(` ${state.job}`);
  100. });
  101. log('Searcher DB successfully created');
  102. } finally {
  103. await db.unlock();
  104. }
  105. }
  106. async loadOrCreateDb(recreate = false) {
  107. this.setMyState(ssDbLoading);
  108. try {
  109. const config = this.config;
  110. const dbPath = `${config.dataDir}/db`;
  111. this.inpxFileHash = await this.inpxHashCreator.getInpxFileHash();
  112. //проверим полный InxpHash (включая фильтр и версию БД)
  113. //для этого заглянем в конфиг внутри БД, если он есть
  114. if (!(config.recreateDb || recreate) && await fs.pathExists(dbPath)) {
  115. const newInpxHash = await this.inpxHashCreator.getHash();
  116. const tmpDb = new JembaDb();
  117. await tmpDb.lock({dbPath, softLock: true});
  118. try {
  119. await tmpDb.open({table: 'config'});
  120. const rows = await tmpDb.select({table: 'config', where: `@@id('inpxHash')`});
  121. if (!rows.length || newInpxHash !== rows[0].value)
  122. throw new Error('inpx file: changes found on start, recreating DB');
  123. } catch (e) {
  124. log(LM_WARN, e.message);
  125. recreate = true;
  126. } finally {
  127. await tmpDb.unlock();
  128. }
  129. }
  130. //удалим БД если нужно
  131. if (config.recreateDb || recreate)
  132. await fs.remove(dbPath);
  133. //пересоздаем БД из INPX если нужно
  134. if (!await fs.pathExists(dbPath)) {
  135. try {
  136. await this.createDb(dbPath);
  137. } catch (e) {
  138. //при ошибке создания БД удалим ее, чтобы не работать с поломанной базой при следующем запуске
  139. await fs.remove(dbPath);
  140. throw e;
  141. }
  142. utils.freeMemory();
  143. }
  144. //загружаем БД
  145. this.setMyState(ssDbLoading);
  146. log('Searcher DB loading');
  147. const db = new JembaDbThread();//в отдельном потоке
  148. await db.lock({
  149. dbPath,
  150. softLock: true,
  151. tableDefaults: {
  152. cacheSize: config.dbCacheSize,
  153. },
  154. });
  155. //открываем почти все таблицы
  156. await db.openAll({exclude: ['author', 'title_book']});
  157. //откроем таблицу 'author' с бОльшим размером кеша блоков, для ускорения выборки
  158. await db.open({table: 'author', cacheSize: (config.dbCacheSize > 100 ? config.dbCacheSize : 100)});
  159. if (config.extendedSearch)
  160. await db.open({table: 'title_book'});
  161. this.dbSearcher = new DbSearcher(config, db);
  162. db.wwCache = {};
  163. this.db = db;
  164. this.setMyState(ssNormal);
  165. log('Searcher DB ready');
  166. this.logServerStats();
  167. } catch (e) {
  168. log(LM_FATAL, e.message);
  169. ayncExit.exit(1);
  170. }
  171. }
  172. async recreateDb() {
  173. this.setMyState(ssDbCreating);
  174. if (this.dbSearcher) {
  175. await this.dbSearcher.close();
  176. this.dbSearcher = null;
  177. }
  178. await this.closeDb();
  179. await this.loadOrCreateDb(true);
  180. }
  181. async dbConfig() {
  182. this.checkMyState();
  183. const db = this.db;
  184. if (!db.wwCache.config) {
  185. const rows = await db.select({table: 'config'});
  186. const config = {};
  187. for (const row of rows) {
  188. config[row.id] = row.value;
  189. }
  190. db.wwCache.config = config;
  191. }
  192. return db.wwCache.config;
  193. }
  194. async authorSearch(query) {
  195. this.checkMyState();
  196. const config = await this.dbConfig();
  197. const result = await this.dbSearcher.authorSearch(query);
  198. return {
  199. author: result.result,
  200. totalFound: result.totalFound,
  201. inpxHash: (config.inpxHash ? config.inpxHash : ''),
  202. };
  203. }
  204. async seriesSearch(query) {
  205. this.checkMyState();
  206. const config = await this.dbConfig();
  207. const result = await this.dbSearcher.seriesSearch(query);
  208. return {
  209. series: result.result,
  210. totalFound: result.totalFound,
  211. inpxHash: (config.inpxHash ? config.inpxHash : ''),
  212. };
  213. }
  214. async titleSearch(query) {
  215. this.checkMyState();
  216. const config = await this.dbConfig();
  217. const result = await this.dbSearcher.titleSearch(query);
  218. return {
  219. title: result.result,
  220. totalFound: result.totalFound,
  221. inpxHash: (config.inpxHash ? config.inpxHash : ''),
  222. };
  223. }
  224. async getAuthorBookList(authorId) {
  225. this.checkMyState();
  226. return await this.dbSearcher.getAuthorBookList(authorId);
  227. }
  228. async getSeriesBookList(series) {
  229. this.checkMyState();
  230. return await this.dbSearcher.getSeriesBookList(series);
  231. }
  232. async getGenreTree() {
  233. this.checkMyState();
  234. const config = await this.dbConfig();
  235. let result;
  236. const db = this.db;
  237. if (!db.wwCache.genres) {
  238. const genres = _.cloneDeep(genreTree);
  239. const last = genres[genres.length - 1];
  240. const genreValues = new Set();
  241. for (const section of genres) {
  242. for (const g of section.value)
  243. genreValues.add(g.value);
  244. }
  245. //добавим к жанрам те, что нашлись при парсинге
  246. const genreParsed = new Set();
  247. let rows = await db.select({table: 'genre', map: `(r) => ({value: r.value})`});
  248. for (const row of rows) {
  249. genreParsed.add(row.value);
  250. if (!genreValues.has(row.value))
  251. last.value.push({name: row.value, value: row.value});
  252. }
  253. //уберем те, которые не нашлись при парсинге
  254. for (let j = 0; j < genres.length; j++) {
  255. const section = genres[j];
  256. for (let i = 0; i < section.value.length; i++) {
  257. const g = section.value[i];
  258. if (!genreParsed.has(g.value))
  259. section.value.splice(i--, 1);
  260. }
  261. if (!section.value.length)
  262. genres.splice(j--, 1);
  263. }
  264. // langs
  265. rows = await db.select({table: 'lang', map: `(r) => ({value: r.value})`});
  266. const langs = rows.map(r => r.value);
  267. result = {
  268. genreTree: genres,
  269. langList: langs,
  270. inpxHash: (config.inpxHash ? config.inpxHash : ''),
  271. };
  272. db.wwCache.genres = result;
  273. } else {
  274. result = db.wwCache.genres;
  275. }
  276. return result;
  277. }
  278. async extractBook(bookPath) {
  279. const outFile = `${this.config.tempDir}/${utils.randomHexString(30)}`;
  280. const folder = `${this.config.libDir}/${path.dirname(bookPath)}`;
  281. const file = path.basename(bookPath);
  282. const zipReader = new ZipReader();
  283. await zipReader.open(folder);
  284. try {
  285. await zipReader.extractToFile(file, outFile);
  286. return outFile;
  287. } finally {
  288. await zipReader.close();
  289. }
  290. }
  291. async restoreBook(bookPath, downFileName) {
  292. const db = this.db;
  293. let extractedFile = '';
  294. let hash = '';
  295. if (!this.remoteLib) {
  296. extractedFile = await this.extractBook(bookPath);
  297. hash = await utils.getFileHash(extractedFile, 'sha256', 'hex');
  298. } else {
  299. hash = await this.remoteLib.downloadBook(bookPath, downFileName);
  300. }
  301. const link = `${this.config.filesPathStatic}/${hash}`;
  302. const bookFile = `${this.config.filesDir}/${hash}`;
  303. const bookFileDesc = `${bookFile}.json`;
  304. if (!await fs.pathExists(bookFile) || !await fs.pathExists(bookFileDesc)) {
  305. await fs.ensureDir(path.dirname(bookFile));
  306. const tmpFile = `${this.config.tempDir}/${utils.randomHexString(30)}`;
  307. await utils.gzipFile(extractedFile, tmpFile, 4);
  308. await fs.remove(extractedFile);
  309. await fs.move(tmpFile, bookFile, {overwrite: true});
  310. await fs.writeFile(bookFileDesc, JSON.stringify({bookPath, downFileName}));
  311. } else {
  312. if (extractedFile)
  313. await fs.remove(extractedFile);
  314. await utils.touchFile(bookFile);
  315. await utils.touchFile(bookFileDesc);
  316. }
  317. await db.insert({
  318. table: 'file_hash',
  319. replace: true,
  320. rows: [
  321. {id: bookPath, hash},
  322. {id: hash, bookPath, downFileName}
  323. ]
  324. });
  325. return link;
  326. }
  327. async getBookLink(params) {
  328. this.checkMyState();
  329. const {bookPath, downFileName} = params;
  330. try {
  331. const db = this.db;
  332. let link = '';
  333. //найдем хеш
  334. const rows = await db.select({table: 'file_hash', where: `@@id(${db.esc(bookPath)})`});
  335. if (rows.length) {//хеш найден по bookPath
  336. const hash = rows[0].hash;
  337. const bookFileDesc = `${this.config.filesDir}/${hash}.json`;
  338. if (await fs.pathExists(bookFileDesc)) {
  339. link = `${this.config.filesPathStatic}/${hash}`;
  340. }
  341. }
  342. if (!link) {
  343. link = await this.restoreBook(bookPath, downFileName)
  344. }
  345. if (!link)
  346. throw new Error('404 Файл не найден');
  347. return {link};
  348. } catch(e) {
  349. log(LM_ERR, `getBookLink error: ${e.message}`);
  350. if (e.message.indexOf('ENOENT') >= 0)
  351. throw new Error('404 Файл не найден');
  352. throw e;
  353. }
  354. }
  355. /*
  356. async restoreBookFile(publicPath) {
  357. this.checkMyState();
  358. try {
  359. const db = this.db;
  360. const hash = path.basename(publicPath);
  361. //найдем bookPath и downFileName
  362. const rows = await db.select({table: 'file_hash', where: `@@id(${db.esc(hash)})`});
  363. if (rows.length) {//нашли по хешу
  364. const rec = rows[0];
  365. await this.restoreBook(rec.bookPath, rec.downFileName);
  366. return rec.downFileName;
  367. } else {//bookPath не найден
  368. throw new Error('404 Файл не найден');
  369. }
  370. } catch(e) {
  371. log(LM_ERR, `restoreBookFile error: ${e.message}`);
  372. if (e.message.indexOf('ENOENT') >= 0)
  373. throw new Error('404 Файл не найден');
  374. throw e;
  375. }
  376. }
  377. async getDownFileName(publicPath) {
  378. this.checkMyState();
  379. const db = this.db;
  380. const hash = path.basename(publicPath);
  381. //найдем downFileName
  382. const rows = await db.select({table: 'file_hash', where: `@@id(${db.esc(hash)})`});
  383. if (rows.length) {//downFileName найден по хешу
  384. return rows[0].downFileName;
  385. } else {//bookPath не найден
  386. throw new Error('404 Файл не найден');
  387. }
  388. }
  389. */
  390. async getInpxFile(params) {
  391. let data = null;
  392. if (params.inpxFileHash && this.inpxFileHash && params.inpxFileHash === this.inpxFileHash) {
  393. data = false;
  394. }
  395. if (data === null)
  396. data = await fs.readFile(this.config.inpxFile, 'base64');
  397. return {data};
  398. }
  399. logServerStats() {
  400. try {
  401. const memUsage = process.memoryUsage().rss/(1024*1024);//Mb
  402. let loadAvg = os.loadavg();
  403. loadAvg = loadAvg.map(v => v.toFixed(2));
  404. log(`Server info [ memUsage: ${memUsage.toFixed(2)}MB, loadAvg: (${loadAvg.join(', ')}) ]`);
  405. if (this.config.server.ready)
  406. log(`Server accessible at http://127.0.0.1:${this.config.server.port} (listening on ${this.config.server.host}:${this.config.server.port})`);
  407. } catch (e) {
  408. log(LM_ERR, e.message);
  409. }
  410. }
  411. async periodicLogServerStats() {
  412. while (1) {// eslint-disable-line
  413. this.logServerStats();
  414. await utils.sleep(60*1000);
  415. }
  416. }
  417. async cleanDir(config) {
  418. const {dir, maxSize} = config;
  419. const list = await fs.readdir(dir);
  420. let size = 0;
  421. let files = [];
  422. //формируем список
  423. for (const filename of list) {
  424. const filePath = `${dir}/${filename}`;
  425. const stat = await fs.stat(filePath);
  426. if (!stat.isDirectory()) {
  427. size += stat.size;
  428. files.push({name: filePath, stat});
  429. }
  430. }
  431. log(LM_WARN, `clean dir ${dir}, maxSize=${maxSize}, found ${files.length} files, total size=${size}`);
  432. files.sort((a, b) => a.stat.mtimeMs - b.stat.mtimeMs);
  433. let i = 0;
  434. //удаляем
  435. while (i < files.length && size > maxSize) {
  436. const file = files[i];
  437. const oldFile = file.name;
  438. await fs.remove(oldFile);
  439. size -= file.stat.size;
  440. i++;
  441. }
  442. log(LM_WARN, `removed ${i} files`);
  443. }
  444. async periodicCleanDir(dirConfig) {
  445. try {
  446. for (const config of dirConfig)
  447. await fs.ensureDir(config.dir);
  448. let lastCleanDirTime = 0;
  449. while (1) {// eslint-disable-line no-constant-condition
  450. //чистка папок
  451. if (Date.now() - lastCleanDirTime >= cleanDirPeriod) {
  452. for (const config of dirConfig) {
  453. try {
  454. await this.cleanDir(config);
  455. } catch(e) {
  456. log(LM_ERR, e.stack);
  457. }
  458. }
  459. lastCleanDirTime = Date.now();
  460. }
  461. await utils.sleep(60*1000);//интервал проверки 1 минута
  462. }
  463. } catch (e) {
  464. log(LM_FATAL, e.message);
  465. ayncExit.exit(1);
  466. }
  467. }
  468. async periodicCheckInpx() {
  469. const inpxCheckInterval = this.config.inpxCheckInterval;
  470. if (!inpxCheckInterval)
  471. return;
  472. while (1) {// eslint-disable-line no-constant-condition
  473. try {
  474. while (this.myState != ssNormal)
  475. await utils.sleep(1000);
  476. if (this.remoteLib) {
  477. await this.remoteLib.downloadInpxFile();
  478. }
  479. const newInpxHash = await this.inpxHashCreator.getHash();
  480. const dbConfig = await this.dbConfig();
  481. const currentInpxHash = (dbConfig.inpxHash ? dbConfig.inpxHash : '');
  482. if (newInpxHash !== currentInpxHash) {
  483. log('inpx file: changes found, recreating DB');
  484. await this.recreateDb();
  485. } else {
  486. log('inpx file: no changes');
  487. }
  488. } catch(e) {
  489. log(LM_ERR, `periodicCheckInpx: ${e.message}`);
  490. }
  491. await utils.sleep(inpxCheckInterval*60*1000);
  492. }
  493. }
  494. }
  495. module.exports = WebWorker;