XML2SAXMetalinkProcessor.cc 5.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187
  1. /* <!-- copyright */
  2. /*
  3. * aria2 - The high speed download utility
  4. *
  5. * Copyright (C) 2006 Tatsuhiro Tsujikawa
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; either version 2 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. *
  21. * In addition, as a special exception, the copyright holders give
  22. * permission to link the code of portions of this program with the
  23. * OpenSSL library under certain conditions as described in each
  24. * individual source file, and distribute linked combinations
  25. * including the two.
  26. * You must obey the GNU General Public License in all respects
  27. * for all of the code used other than OpenSSL. If you modify
  28. * file(s) with this exception, you may extend this exception to your
  29. * version of the file(s), but you are not obligated to do so. If you
  30. * do not wish to do so, delete this exception statement from your
  31. * version. If you delete this exception statement from all source
  32. * files in the program, then also delete it here.
  33. */
  34. /* copyright --> */
  35. #include "XML2SAXMetalinkProcessor.h"
  36. #include "BinaryStream.h"
  37. #include "MetalinkParserStateMachine.h"
  38. #include "Metalinker.h"
  39. #include "MetalinkEntry.h"
  40. #include "util.h"
  41. #include "message.h"
  42. #include "DlAbortEx.h"
  43. namespace aria2 {
  44. class SessionData {
  45. public:
  46. SharedHandle<MetalinkParserStateMachine> _stm;
  47. std::deque<std::string> _charactersStack;
  48. SessionData(const SharedHandle<MetalinkParserStateMachine>& stm):_stm(stm) {}
  49. };
  50. static void mlStartElement(void* userData, const xmlChar* name, const xmlChar** attrs)
  51. {
  52. SessionData* sd = reinterpret_cast<SessionData*>(userData);
  53. std::map<std::string, std::string> attrmap;
  54. if(attrs) {
  55. const xmlChar** p = attrs;
  56. while(*p != 0) {
  57. std::string name = reinterpret_cast<const char*>(*p);
  58. ++p;
  59. if(*p == 0) {
  60. break;
  61. }
  62. std::string value = util::trim(reinterpret_cast<const char*>(*p));
  63. ++p;
  64. attrmap[name] = value;
  65. }
  66. }
  67. sd->_stm->beginElement(reinterpret_cast<const char*>(name), attrmap);
  68. if(sd->_stm->needsCharactersBuffering()) {
  69. sd->_charactersStack.push_front(std::string());
  70. }
  71. }
  72. static void mlEndElement(void* userData, const xmlChar* name)
  73. {
  74. SessionData* sd = reinterpret_cast<SessionData*>(userData);
  75. std::string characters;
  76. if(sd->_stm->needsCharactersBuffering()) {
  77. characters = util::trim(sd->_charactersStack.front());
  78. sd->_charactersStack.pop_front();
  79. }
  80. sd->_stm->endElement(reinterpret_cast<const char*>(name), characters);
  81. }
  82. static void mlCharacters(void* userData, const xmlChar* ch, int len)
  83. {
  84. SessionData* sd = reinterpret_cast<SessionData*>(userData);
  85. if(sd->_stm->needsCharactersBuffering()) {
  86. sd->_charactersStack.front() += std::string(&ch[0], &ch[len]);
  87. }
  88. }
  89. static xmlSAXHandler mySAXHandler =
  90. {
  91. 0, // internalSubsetSAXFunc
  92. 0, // isStandaloneSAXFunc
  93. 0, // hasInternalSubsetSAXFunc
  94. 0, // hasExternalSubsetSAXFunc
  95. 0, // resolveEntitySAXFunc
  96. 0, // getEntitySAXFunc
  97. 0, // entityDeclSAXFunc
  98. 0, // notationDeclSAXFunc
  99. 0, // attributeDeclSAXFunc
  100. 0, // elementDeclSAXFunc
  101. 0, // unparsedEntityDeclSAXFunc
  102. 0, // setDocumentLocatorSAXFunc
  103. 0, // startDocumentSAXFunc
  104. 0, // endDocumentSAXFunc
  105. &mlStartElement, // startElementSAXFunc
  106. &mlEndElement, // endElementSAXFunc
  107. 0, // referenceSAXFunc
  108. &mlCharacters, // charactersSAXFunc
  109. 0, // ignorableWhitespaceSAXFunc
  110. 0, // processingInstructionSAXFunc
  111. 0, // commentSAXFunc
  112. 0, // warningSAXFunc
  113. 0, // errorSAXFunc
  114. 0, // fatalErrorSAXFunc
  115. 0, // getParameterEntitySAXFunc
  116. 0, // cdataBlockSAXFunc
  117. 0, // externalSubsetSAXFunc
  118. 0, // unsigned int initialized
  119. 0, // void * _private
  120. 0, // startElementNsSAX2Func
  121. 0, // endElementNsSAX2Func
  122. 0, // xmlStructuredErrorFunc
  123. };
  124. SharedHandle<Metalinker>
  125. MetalinkProcessor::parseFile(const std::string& filename)
  126. {
  127. _stm.reset(new MetalinkParserStateMachine());
  128. SharedHandle<SessionData> sessionData(new SessionData(_stm));
  129. int retval = xmlSAXUserParseFile(&mySAXHandler, sessionData.get(),
  130. filename.c_str());
  131. if(retval != 0) {
  132. throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
  133. }
  134. return _stm->getResult();
  135. }
  136. SharedHandle<Metalinker>
  137. MetalinkProcessor::parseFromBinaryStream(const SharedHandle<BinaryStream>& binaryStream)
  138. {
  139. _stm.reset(new MetalinkParserStateMachine());
  140. size_t bufSize = 4096;
  141. unsigned char buf[bufSize];
  142. ssize_t res = binaryStream->readData(buf, 4, 0);
  143. if(res != 4) {
  144. throw DL_ABORT_EX("Too small data for parsing XML.");
  145. }
  146. SharedHandle<SessionData> sessionData(new SessionData(_stm));
  147. xmlParserCtxtPtr ctx = xmlCreatePushParserCtxt
  148. (&mySAXHandler, sessionData.get(),
  149. reinterpret_cast<const char*>(buf), res, 0);
  150. try {
  151. off_t readOffset = res;
  152. while(1) {
  153. ssize_t res = binaryStream->readData(buf, bufSize, readOffset);
  154. if(res == 0) {
  155. break;
  156. }
  157. if(xmlParseChunk(ctx, reinterpret_cast<const char*>(buf), res, 0) != 0) {
  158. throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
  159. }
  160. readOffset += res;
  161. }
  162. xmlParseChunk(ctx, reinterpret_cast<const char*>(buf), 0, 1);
  163. } catch(Exception& e) {
  164. xmlFreeParserCtxt(ctx);
  165. throw;
  166. }
  167. xmlFreeParserCtxt(ctx);
  168. if(!_stm->finished()) {
  169. throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
  170. }
  171. return _stm->getResult();
  172. }
  173. } // namespace aria2