XML2SAXMetalinkProcessor.cc 5.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185
  1. /* <!-- copyright */
  2. /*
  3. * aria2 - The high speed download utility
  4. *
  5. * Copyright (C) 2006 Tatsuhiro Tsujikawa
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; either version 2 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. *
  21. * In addition, as a special exception, the copyright holders give
  22. * permission to link the code of portions of this program with the
  23. * OpenSSL library under certain conditions as described in each
  24. * individual source file, and distribute linked combinations
  25. * including the two.
  26. * You must obey the GNU General Public License in all respects
  27. * for all of the code used other than OpenSSL. If you modify
  28. * file(s) with this exception, you may extend this exception to your
  29. * version of the file(s), but you are not obligated to do so. If you
  30. * do not wish to do so, delete this exception statement from your
  31. * version. If you delete this exception statement from all source
  32. * files in the program, then also delete it here.
  33. */
  34. /* copyright --> */
  35. #include "XML2SAXMetalinkProcessor.h"
  36. #include "BinaryStream.h"
  37. #include "MetalinkParserStateMachine.h"
  38. #include "Metalinker.h"
  39. #include "MetalinkEntry.h"
  40. #include "Util.h"
  41. #include "message.h"
  42. #include "DlAbortEx.h"
  43. namespace aria2 {
  44. class SessionData {
  45. public:
  46. SharedHandle<MetalinkParserStateMachine> _stm;
  47. std::deque<std::string> _charactersStack;
  48. SessionData(const SharedHandle<MetalinkParserStateMachine>& stm):_stm(stm) {}
  49. };
  50. static void mlStartElement(void* userData, const xmlChar* name, const xmlChar** attrs)
  51. {
  52. SessionData* sd = reinterpret_cast<SessionData*>(userData);
  53. std::map<std::string, std::string> attrmap;
  54. if(attrs) {
  55. const xmlChar** p = attrs;
  56. while(*p != 0) {
  57. std::string name = (const char*)*p++;
  58. if(*p == 0) {
  59. break;
  60. }
  61. std::string value = Util::trim((const char*)*p++);
  62. attrmap[name] = value;
  63. }
  64. }
  65. sd->_stm->beginElement((const char*)name, attrmap);
  66. if(sd->_stm->needsCharactersBuffering()) {
  67. sd->_charactersStack.push_front(std::string());
  68. }
  69. }
  70. static void mlEndElement(void* userData, const xmlChar* name)
  71. {
  72. SessionData* sd = reinterpret_cast<SessionData*>(userData);
  73. std::string characters;
  74. if(sd->_stm->needsCharactersBuffering()) {
  75. characters = Util::trim(sd->_charactersStack.front());
  76. sd->_charactersStack.pop_front();
  77. }
  78. sd->_stm->endElement((const char*)name, characters);
  79. }
  80. static void mlCharacters(void* userData, const xmlChar* ch, int len)
  81. {
  82. SessionData* sd = reinterpret_cast<SessionData*>(userData);
  83. if(sd->_stm->needsCharactersBuffering()) {
  84. sd->_charactersStack.front() += std::string(&ch[0], &ch[len]);
  85. }
  86. }
  87. static xmlSAXHandler mySAXHandler =
  88. {
  89. 0, // internalSubsetSAXFunc
  90. 0, // isStandaloneSAXFunc
  91. 0, // hasInternalSubsetSAXFunc
  92. 0, // hasExternalSubsetSAXFunc
  93. 0, // resolveEntitySAXFunc
  94. 0, // getEntitySAXFunc
  95. 0, // entityDeclSAXFunc
  96. 0, // notationDeclSAXFunc
  97. 0, // attributeDeclSAXFunc
  98. 0, // elementDeclSAXFunc
  99. 0, // unparsedEntityDeclSAXFunc
  100. 0, // setDocumentLocatorSAXFunc
  101. 0, // startDocumentSAXFunc
  102. 0, // endDocumentSAXFunc
  103. &mlStartElement, // startElementSAXFunc
  104. &mlEndElement, // endElementSAXFunc
  105. 0, // referenceSAXFunc
  106. &mlCharacters, // charactersSAXFunc
  107. 0, // ignorableWhitespaceSAXFunc
  108. 0, // processingInstructionSAXFunc
  109. 0, // commentSAXFunc
  110. 0, // warningSAXFunc
  111. 0, // errorSAXFunc
  112. 0, // fatalErrorSAXFunc
  113. 0, // getParameterEntitySAXFunc
  114. 0, // cdataBlockSAXFunc
  115. 0, // externalSubsetSAXFunc
  116. 0, // unsigned int initialized
  117. 0, // void * _private
  118. 0, // startElementNsSAX2Func
  119. 0, // endElementNsSAX2Func
  120. 0, // xmlStructuredErrorFunc
  121. };
  122. XML2SAXMetalinkProcessor::XML2SAXMetalinkProcessor() {}
  123. SharedHandle<Metalinker>
  124. XML2SAXMetalinkProcessor::parseFile(const std::string& filename)
  125. {
  126. _stm.reset(new MetalinkParserStateMachine());
  127. SharedHandle<SessionData> sessionData(new SessionData(_stm));
  128. int retval = xmlSAXUserParseFile(&mySAXHandler, sessionData.get(),
  129. filename.c_str());
  130. if(retval != 0) {
  131. throw DlAbortEx(MSG_CANNOT_PARSE_METALINK);
  132. }
  133. return _stm->getResult();
  134. }
  135. SharedHandle<Metalinker>
  136. XML2SAXMetalinkProcessor::parseFromBinaryStream(const SharedHandle<BinaryStream>& binaryStream)
  137. {
  138. _stm.reset(new MetalinkParserStateMachine());
  139. size_t bufSize = 4096;
  140. unsigned char buf[bufSize];
  141. ssize_t res = binaryStream->readData(buf, 4, 0);
  142. if(res != 4) {
  143. throw DlAbortEx("Too small data for parsing XML.");
  144. }
  145. SharedHandle<SessionData> sessionData(new SessionData(_stm));
  146. xmlParserCtxtPtr ctx = xmlCreatePushParserCtxt(&mySAXHandler, sessionData.get(), (const char*)buf, res, 0);
  147. try {
  148. off_t readOffset = res;
  149. while(1) {
  150. ssize_t res = binaryStream->readData(buf, bufSize, readOffset);
  151. if(res == 0) {
  152. break;
  153. }
  154. if(xmlParseChunk(ctx, (const char*)buf, res, 0) != 0) {
  155. throw DlAbortEx(MSG_CANNOT_PARSE_METALINK);
  156. }
  157. readOffset += res;
  158. }
  159. xmlParseChunk(ctx, (const char*)buf, 0, 1);
  160. } catch(Exception& e) {
  161. xmlFreeParserCtxt(ctx);
  162. throw;
  163. }
  164. xmlFreeParserCtxt(ctx);
  165. if(!_stm->finished()) {
  166. throw DlAbortEx(MSG_CANNOT_PARSE_METALINK);
  167. }
  168. return _stm->getResult();
  169. }
  170. } // namespace aria2