XML2SAXMetalinkProcessor.cc 5.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176
  1. /* <!-- copyright */
  2. /*
  3. * aria2 - The high speed download utility
  4. *
  5. * Copyright (C) 2006 Tatsuhiro Tsujikawa
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; either version 2 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. *
  21. * In addition, as a special exception, the copyright holders give
  22. * permission to link the code of portions of this program with the
  23. * OpenSSL library under certain conditions as described in each
  24. * individual source file, and distribute linked combinations
  25. * including the two.
  26. * You must obey the GNU General Public License in all respects
  27. * for all of the code used other than OpenSSL. If you modify
  28. * file(s) with this exception, you may extend this exception to your
  29. * version of the file(s), but you are not obligated to do so. If you
  30. * do not wish to do so, delete this exception statement from your
  31. * version. If you delete this exception statement from all source
  32. * files in the program, then also delete it here.
  33. */
  34. /* copyright --> */
  35. #include "XML2SAXMetalinkProcessor.h"
  36. #include "BinaryStream.h"
  37. #include "MetalinkParserStateMachine.h"
  38. #include "Metalinker.h"
  39. #include "MetalinkEntry.h"
  40. #include "Util.h"
  41. #include "message.h"
  42. #include "DlAbortEx.h"
  43. namespace aria2 {
  44. class SessionData {
  45. public:
  46. SharedHandle<MetalinkParserStateMachine> _stm;
  47. std::deque<std::string> _charactersStack;
  48. SessionData(const SharedHandle<MetalinkParserStateMachine>& stm):_stm(stm) {}
  49. };
  50. static void mlStartElement(void* userData, const xmlChar* name, const xmlChar** attrs)
  51. {
  52. ((SessionData*)userData)->_charactersStack.push_front(std::string());
  53. std::map<std::string, std::string> attrmap;
  54. if(attrs) {
  55. const xmlChar** p = attrs;
  56. while(*p != 0) {
  57. std::string name = (const char*)*p++;
  58. if(*p == 0) {
  59. break;
  60. }
  61. std::string value = Util::trim((const char*)*p++);
  62. attrmap[name] = value;
  63. }
  64. }
  65. ((SessionData*)userData)->_stm->beginElement((const char*)name, attrmap);
  66. }
  67. static void mlEndElement(void* userData, const xmlChar* name)
  68. {
  69. SessionData* sd = (SessionData*)userData;
  70. sd->_stm->endElement((const char*)name, Util::trim(sd->_charactersStack.front()));
  71. sd->_charactersStack.pop_front();
  72. }
  73. static void mlCharacters(void* userData, const xmlChar* ch, int len)
  74. {
  75. ((SessionData*)userData)->_charactersStack.front() += std::string(&ch[0], &ch[len]);
  76. }
  77. static xmlSAXHandler mySAXHandler =
  78. {
  79. 0, // internalSubsetSAXFunc
  80. 0, // isStandaloneSAXFunc
  81. 0, // hasInternalSubsetSAXFunc
  82. 0, // hasExternalSubsetSAXFunc
  83. 0, // resolveEntitySAXFunc
  84. 0, // getEntitySAXFunc
  85. 0, // entityDeclSAXFunc
  86. 0, // notationDeclSAXFunc
  87. 0, // attributeDeclSAXFunc
  88. 0, // elementDeclSAXFunc
  89. 0, // unparsedEntityDeclSAXFunc
  90. 0, // setDocumentLocatorSAXFunc
  91. 0, // startDocumentSAXFunc
  92. 0, // endDocumentSAXFunc
  93. &mlStartElement, // startElementSAXFunc
  94. &mlEndElement, // endElementSAXFunc
  95. 0, // referenceSAXFunc
  96. &mlCharacters, // charactersSAXFunc
  97. 0, // ignorableWhitespaceSAXFunc
  98. 0, // processingInstructionSAXFunc
  99. 0, // commentSAXFunc
  100. 0, // warningSAXFunc
  101. 0, // errorSAXFunc
  102. 0, // fatalErrorSAXFunc
  103. 0, // getParameterEntitySAXFunc
  104. 0, // cdataBlockSAXFunc
  105. 0, // externalSubsetSAXFunc
  106. 0, // unsigned int initialized
  107. 0, // void * _private
  108. 0, // startElementNsSAX2Func
  109. 0, // endElementNsSAX2Func
  110. 0, // xmlStructuredErrorFunc
  111. };
  112. XML2SAXMetalinkProcessor::XML2SAXMetalinkProcessor() {}
  113. SharedHandle<Metalinker>
  114. XML2SAXMetalinkProcessor::parseFile(const std::string& filename)
  115. {
  116. _stm.reset(new MetalinkParserStateMachine());
  117. SharedHandle<SessionData> sessionData(new SessionData(_stm));
  118. int retval = xmlSAXUserParseFile(&mySAXHandler, sessionData.get(),
  119. filename.c_str());
  120. if(retval != 0) {
  121. throw new DlAbortEx(MSG_CANNOT_PARSE_METALINK);
  122. }
  123. return _stm->getResult();
  124. }
  125. SharedHandle<Metalinker>
  126. XML2SAXMetalinkProcessor::parseFromBinaryStream(const SharedHandle<BinaryStream>& binaryStream)
  127. {
  128. _stm.reset(new MetalinkParserStateMachine());
  129. size_t bufSize = 4096;
  130. unsigned char buf[bufSize];
  131. ssize_t res = binaryStream->readData(buf, 4, 0);
  132. if(res != 4) {
  133. throw new DlAbortEx("Too small data for parsing XML.");
  134. }
  135. SharedHandle<SessionData> sessionData(new SessionData(_stm));
  136. xmlParserCtxtPtr ctx = xmlCreatePushParserCtxt(&mySAXHandler, sessionData.get(), (const char*)buf, res, 0);
  137. try {
  138. off_t readOffset = res;
  139. while(1) {
  140. ssize_t res = binaryStream->readData(buf, bufSize, readOffset);
  141. if(res == 0) {
  142. break;
  143. }
  144. if(xmlParseChunk(ctx, (const char*)buf, res, 0) != 0) {
  145. throw new DlAbortEx(MSG_CANNOT_PARSE_METALINK);
  146. }
  147. readOffset += res;
  148. }
  149. xmlParseChunk(ctx, (const char*)buf, 0, 1);
  150. } catch(Exception* e) {
  151. xmlFreeParserCtxt(ctx);
  152. throw e;
  153. }
  154. xmlFreeParserCtxt(ctx);
  155. if(!_stm->finished()) {
  156. throw new DlAbortEx(MSG_CANNOT_PARSE_METALINK);
  157. }
  158. return _stm->getResult();
  159. }
  160. } // namespace aria2