fb2read.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430
  1. #include <QtGui>
  2. #include <QtDebug>
  3. #include "fb2read.h"
  4. //---------------------------------------------------------------------------
  5. // Fb2ReadThread
  6. //---------------------------------------------------------------------------
  7. Fb2ReadThread::Fb2ReadThread(QObject *parent, const QString &filename)
  8. : QThread(parent)
  9. , m_filename(filename)
  10. , m_abort(false)
  11. {
  12. }
  13. Fb2ReadThread::~Fb2ReadThread()
  14. {
  15. stop();
  16. wait();
  17. }
  18. void Fb2ReadThread::stop()
  19. {
  20. QMutexLocker locker(&mutex);
  21. Q_UNUSED(locker);
  22. m_abort = true;
  23. }
  24. void Fb2ReadThread::run()
  25. {
  26. if (parse()) emit html(m_filename, m_html);
  27. }
  28. void Fb2ReadThread::onFile(const QString &name, const QString &path)
  29. {
  30. emit file(name, path);
  31. }
  32. bool Fb2ReadThread::parse()
  33. {
  34. QFile file(m_filename);
  35. if (!file.open(QFile::ReadOnly | QFile::Text)) {
  36. qCritical() << QObject::tr("Cannot read file %1:\n%2.").arg(m_filename).arg(file.errorString());
  37. return false;
  38. }
  39. Fb2Handler handler(*this);
  40. QXmlSimpleReader reader;
  41. reader.setContentHandler(&handler);
  42. reader.setErrorHandler(&handler);
  43. QXmlInputSource source(&file);
  44. return reader.parse(source);
  45. }
  46. //---------------------------------------------------------------------------
  47. // Fb2HtmlWriter
  48. //---------------------------------------------------------------------------
  49. Fb2HtmlWriter::Fb2HtmlWriter(Fb2ReadThread &thread)
  50. : QXmlStreamWriter(thread.data())
  51. , m_thread(thread)
  52. {
  53. }
  54. QString Fb2HtmlWriter::addFile(const QString &name, const QByteArray &data)
  55. {
  56. QString path = getFile(name);
  57. QFile file(path);
  58. if (file.open(QIODevice::WriteOnly)) {
  59. file.write(data);
  60. m_thread.onFile(name, path);
  61. }
  62. return path;
  63. }
  64. QString Fb2HtmlWriter::getFile(const QString &name)
  65. {
  66. StringHash::const_iterator i = m_hash.find(name);
  67. if (i == m_hash.end()) {
  68. QTemporaryFile file;
  69. file.setAutoRemove(false);
  70. file.open();
  71. return m_hash.insert(name, file.fileName()).value();
  72. } else {
  73. return i.value();
  74. }
  75. }
  76. //---------------------------------------------------------------------------
  77. // Fb2Handler::BaseHandler
  78. //---------------------------------------------------------------------------
  // FB2_BEGIN_KEYHASH(x) defines Fb2Handler::x::toKeyword(), which looks a tag
  // name up in a function-local static KeywordHash and yields None for unknown
  // names, and then opens the body of the KeywordHash constructor.
  // FB2_END_KEYHASH closes that constructor body.
  // FB2_KEY(key, str) registers one tag name inside the constructor body.
  #define FB2_BEGIN_KEYHASH(x) \
  Fb2Handler::x::Keyword Fb2Handler::x::toKeyword(const QString &name) \
  { \
      static const KeywordHash table; \
      const KeywordHash::const_iterator it = table.find(name); \
      if (it == table.end()) return None; \
      return it.value(); \
  } \
  Fb2Handler::x::KeywordHash::KeywordHash() {
  #define FB2_END_KEYHASH }
  #define FB2_KEY(key,str) insert(str,key);
  89. static QString Value(const QXmlAttributes &attributes, const QString &name)
  90. {
  91. int count = attributes.count();
  92. for (int i = 0; i < count; i++ ) {
  93. if (attributes.localName(i).compare(name, Qt::CaseInsensitive) == 0) {
  94. return attributes.value(i);
  95. }
  96. }
  97. return QString();
  98. }
  99. Fb2Handler::BaseHandler::~BaseHandler()
  100. {
  101. if (m_handler) delete m_handler;
  102. }
  103. bool Fb2Handler::BaseHandler::doStart(const QString &name, const QXmlAttributes &attributes)
  104. {
  105. if (m_handler) return m_handler->doStart(name, attributes);
  106. m_handler = NewTag(name, attributes); if (m_handler) return true;
  107. // qCritical() << QObject::tr("Unknown XML child tag: <%1> <%2>").arg(m_name).arg(name);
  108. m_handler = new BaseHandler(name);
  109. return true;
  110. }
  111. bool Fb2Handler::BaseHandler::doText(const QString &text)
  112. {
  113. if (m_handler) m_handler->doText(text); else TxtTag(text);
  114. return true;
  115. }
  116. bool Fb2Handler::BaseHandler::doEnd(const QString &name, bool & exists)
  117. {
  118. if (m_handler) {
  119. bool found = exists || name == m_name;
  120. m_handler->doEnd(name, found);
  121. if (m_handler->m_closed) { delete m_handler; m_handler = NULL; }
  122. if (found) { exists = true; return true; }
  123. }
  124. bool found = name == m_name;
  125. if (!found) qCritical() << QObject::tr("Conglict XML tags: <%1> - </%2>").arg(m_name).arg(name);
  126. m_closed = found || exists;
  127. if (m_closed) EndTag(m_name);
  128. exists = found;
  129. return true;
  130. }
  131. //---------------------------------------------------------------------------
  132. // Fb2Handler::RootHandler
  133. //---------------------------------------------------------------------------
  134. FB2_BEGIN_KEYHASH(RootHandler)
  135. insert("stylesheet", Style);
  136. insert("description", Descr);
  137. insert("body", Body);
  138. insert("binary", Binary);
  139. FB2_END_KEYHASH
  140. Fb2Handler::RootHandler::RootHandler(Fb2HtmlWriter &writer, const QString &name)
  141. : BaseHandler(name)
  142. , m_writer(writer)
  143. {
  144. m_writer.writeStartElement("html");
  145. m_writer.writeStartElement("head");
  146. m_writer.writeStartElement("link");
  147. m_writer.writeAttribute("rel", "stylesheet");
  148. m_writer.writeAttribute("href", "qrc:/res/style.css");
  149. m_writer.writeEndElement();
  150. m_writer.writeEndElement();
  151. m_writer.writeStartElement("body");
  152. }
  153. Fb2Handler::RootHandler::~RootHandler()
  154. {
  155. m_writer.writeEndElement();
  156. m_writer.writeEndElement();
  157. }
  158. Fb2Handler::BaseHandler * Fb2Handler::RootHandler::NewTag(const QString &name, const QXmlAttributes &attributes)
  159. {
  160. switch (toKeyword(name)) {
  161. case Body : return new BodyHandler(m_writer, name, attributes, "div", name);
  162. case Descr : return new DescrHandler(m_writer, name);
  163. case Binary : return new BinaryHandler(m_writer, name, attributes);
  164. default: return NULL;
  165. }
  166. }
  167. //---------------------------------------------------------------------------
  168. // Fb2Handler::DescrHandler
  169. //---------------------------------------------------------------------------
  170. FB2_BEGIN_KEYHASH(DescrHandler)
  171. insert( "title-info" , Title );
  172. insert( "publish-info" , Publish );
  173. FB2_END_KEYHASH
  174. Fb2Handler::BaseHandler * Fb2Handler::DescrHandler::NewTag(const QString &name, const QXmlAttributes &attributes)
  175. {
  176. Q_UNUSED(attributes);
  177. switch (toKeyword(name)) {
  178. case Title : return new HeaderHandler(m_writer, name);
  179. case Publish : return new BaseHandler(name);
  180. default: return NULL;
  181. }
  182. }
  183. //---------------------------------------------------------------------------
  184. // Fb2Handler::HeaderHandler
  185. //---------------------------------------------------------------------------
  186. FB2_BEGIN_KEYHASH(HeaderHandler)
  187. insert( "book-title" , Title );
  188. insert( "author" , Author );
  189. insert( "sequence" , Sequence );
  190. insert( "genre" , Genre );
  191. insert( "lang" , Lang );
  192. insert( "annotation" , Annot );
  193. insert( "coverpage" , Cover );
  194. FB2_END_KEYHASH
  195. Fb2Handler::BaseHandler * Fb2Handler::HeaderHandler::NewTag(const QString &name, const QXmlAttributes &attributes)
  196. {
  197. Q_UNUSED(attributes);
  198. switch (toKeyword(name)) {
  199. case Title : return new BaseHandler(name);
  200. case Annot : return new BaseHandler(name);
  201. default: return NULL;
  202. }
  203. }
  204. //---------------------------------------------------------------------------
  205. // Fb2Handler::BodyHandler
  206. //---------------------------------------------------------------------------
  207. FB2_BEGIN_KEYHASH(BodyHandler)
  208. FB2_KEY( Section, "annotation" );
  209. FB2_KEY( Section, "author" );
  210. FB2_KEY( Section, "cite" );
  211. FB2_KEY( Section, "date" );
  212. FB2_KEY( Section, "epigraph" );
  213. FB2_KEY( Section, "poem" );
  214. FB2_KEY( Section, "section" );
  215. FB2_KEY( Section, "stanza" );
  216. FB2_KEY( Section, "subtitle" );
  217. FB2_KEY( Section, "title" );
  218. FB2_KEY( Anchor, "a" );
  219. FB2_KEY( Table, "table" );
  220. FB2_KEY( Image, "image" );
  221. FB2_KEY( Parag, "empty-line" );
  222. FB2_KEY( Parag, "p" );
  223. FB2_KEY( Parag, "v" );
  224. FB2_KEY( Style, "style" );
  225. FB2_KEY( Strong, "strong" );
  226. FB2_KEY( Emphas, "emphasis" );
  227. FB2_KEY( Strike, "strikethrough" );
  228. FB2_KEY( Sub, "sub" );
  229. FB2_KEY( Sup, "sup" );
  230. FB2_KEY( Code, "code" );
  231. FB2_END_KEYHASH
  232. Fb2Handler::BodyHandler::BodyHandler(Fb2HtmlWriter &writer, const QString &name, const QXmlAttributes &attributes, const QString &tag, const QString &style)
  233. : BaseHandler(name)
  234. , m_writer(writer)
  235. {
  236. m_writer.writeStartElement(tag);
  237. QString id = Value(attributes, "id");
  238. if (!id.isEmpty()) m_writer.writeAttribute("id", id);
  239. if (!style.isEmpty()) m_writer.writeAttribute("class", style);
  240. }
  241. Fb2Handler::BodyHandler::~BodyHandler()
  242. {
  243. m_writer.writeEndElement();
  244. }
  245. Fb2Handler::BaseHandler * Fb2Handler::BodyHandler::NewTag(const QString &name, const QXmlAttributes &attributes)
  246. {
  247. switch (toKeyword(name)) {
  248. case Section : return new BodyHandler(m_writer, name, attributes, "div", name);
  249. case Anchor : return new AnchorHandler(m_writer, name, attributes);
  250. case Image : return new ImageHandler(m_writer, name, attributes);
  251. case Parag : return new BodyHandler(m_writer, name, attributes, "p");
  252. case Strong : return new BodyHandler(m_writer, name, attributes, "b");
  253. case Emphas : return new BodyHandler(m_writer, name, attributes, "i");
  254. case Strike : return new BodyHandler(m_writer, name, attributes, "s");
  255. case Code : return new BodyHandler(m_writer, name, attributes, "tt");
  256. case Sub : return new BodyHandler(m_writer, name, attributes, "sub");
  257. case Sup : return new BodyHandler(m_writer, name, attributes, "sup");
  258. default: return NULL;
  259. }
  260. }
  261. void Fb2Handler::BodyHandler::TxtTag(const QString &text)
  262. {
  263. m_writer.writeCharacters(text);
  264. }
  265. //---------------------------------------------------------------------------
  266. // Fb2Handler::AnchorHandler
  267. //---------------------------------------------------------------------------
  268. Fb2Handler::AnchorHandler::AnchorHandler(Fb2HtmlWriter &writer, const QString &name, const QXmlAttributes &attributes)
  269. : BodyHandler(writer, name, attributes, "a")
  270. {
  271. QString href = Value(attributes, "href");
  272. writer.writeAttribute("href", href);
  273. }
  274. //---------------------------------------------------------------------------
  275. // Fb2Handler::ImageHandler
  276. //---------------------------------------------------------------------------
  277. Fb2Handler::ImageHandler::ImageHandler(Fb2HtmlWriter &writer, const QString &name, const QXmlAttributes &attributes)
  278. : BodyHandler(writer, name, attributes, "img")
  279. {
  280. QString href = Value(attributes, "href");
  281. while (href.left(1) == "#") href.remove(0, 1);
  282. QString path = writer.getFile(href);
  283. writer.writeAttribute("src", path);
  284. writer.writeAttribute("alt", href);
  285. }
  286. //---------------------------------------------------------------------------
  287. // Fb2Handler::BinaryHandler
  288. //---------------------------------------------------------------------------
  289. Fb2Handler::BinaryHandler::BinaryHandler(Fb2HtmlWriter &writer, const QString &name, const QXmlAttributes &attributes)
  290. : BaseHandler(name)
  291. , m_writer(writer)
  292. , m_file(Value(attributes, "id"))
  293. {
  294. }
  295. Fb2Handler::BinaryHandler::~BinaryHandler()
  296. {
  297. QByteArray in; in.append(m_text);
  298. if (!m_file.isEmpty()) m_writer.addFile(m_file, QByteArray::fromBase64(in));
  299. }
  300. void Fb2Handler::BinaryHandler::TxtTag(const QString &text)
  301. {
  302. m_text += text;
  303. }
  304. //---------------------------------------------------------------------------
  305. // Fb2Handler
  306. //---------------------------------------------------------------------------
  307. Fb2Handler::Fb2Handler(Fb2ReadThread &thread)
  308. : QXmlDefaultHandler()
  309. , m_writer(thread)
  310. , m_handler(NULL)
  311. {
  312. m_writer.setAutoFormatting(true);
  313. }
  314. Fb2Handler::~Fb2Handler()
  315. {
  316. if (m_handler) delete m_handler;
  317. }
  318. bool Fb2Handler::startElement(const QString & namespaceURI, const QString & localName, const QString &qName, const QXmlAttributes &attributes)
  319. {
  320. Q_UNUSED(namespaceURI);
  321. Q_UNUSED(localName);
  322. const QString name = qName.toLower();
  323. if (m_handler) return m_handler->doStart(name, attributes);
  324. qCritical() << name;
  325. if (name == "fictionbook") {
  326. m_handler = new RootHandler(m_writer, name);
  327. return true;
  328. } else {
  329. m_error = QObject::tr("The file is not an FB2 file.");
  330. return false;
  331. }
  332. }
  333. static bool isWhiteSpace(const QString &str)
  334. {
  335. return str.simplified().isEmpty();
  336. }
  337. bool Fb2Handler::characters(const QString &str)
  338. {
  339. QString s = str.simplified();
  340. if (s.isEmpty()) return true;
  341. if (isWhiteSpace(str.left(1))) s.prepend(" ");
  342. if (isWhiteSpace(str.right(1))) s.append(" ");
  343. return m_handler && m_handler->doText(s);
  344. }
  345. bool Fb2Handler::endElement(const QString & namespaceURI, const QString & localName, const QString &qName)
  346. {
  347. Q_UNUSED(namespaceURI);
  348. Q_UNUSED(localName);
  349. bool found = false;
  350. return m_handler && m_handler->doEnd(qName.toLower(), found);
  351. }
  352. bool Fb2Handler::fatalError(const QXmlParseException &exception)
  353. {
  354. qCritical() << QObject::tr("Parse error at line %1, column %2:\n%3")
  355. .arg(exception.lineNumber())
  356. .arg(exception.columnNumber())
  357. .arg(exception.message());
  358. return false;
  359. }
  360. QString Fb2Handler::errorString() const
  361. {
  362. return m_error;
  363. }
  // The keyword-table helper macros are local to this file; drop them here.
  #undef FB2_KEY
  #undef FB2_END_KEYHASH
  #undef FB2_BEGIN_KEYHASH