util.h 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388
  1. /* <!-- copyright */
  2. /*
  3. * aria2 - The high speed download utility
  4. *
  5. * Copyright (C) 2006 Tatsuhiro Tsujikawa
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; either version 2 of the License, or
  10. * (at your option) any later version.
  11. *
  12. * This program is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. * GNU General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU General Public License
  18. * along with this program; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. *
  21. * In addition, as a special exception, the copyright holders give
  22. * permission to link the code of portions of this program with the
  23. * OpenSSL library under certain conditions as described in each
  24. * individual source file, and distribute linked combinations
  25. * including the two.
  26. * You must obey the GNU General Public License in all respects
  27. * for all of the code used other than OpenSSL. If you modify
  28. * file(s) with this exception, you may extend this exception to your
  29. * version of the file(s), but you are not obligated to do so. If you
  30. * do not wish to do so, delete this exception statement from your
  31. * version. If you delete this exception statement from all source
  32. * files in the program, then also delete it here.
  33. */
  34. /* copyright --> */
  35. #ifndef _D_UTIL_H_
  36. #define _D_UTIL_H_
  37. #include "common.h"
  38. #include <sys/time.h>
  39. #include <string>
  40. #include <utility>
  41. #include <deque>
  42. #include <iosfwd>
  43. #include <ostream>
  44. #include <numeric>
  45. #include <map>
  46. #include <iomanip>
  47. #include <algorithm>
  48. #include <vector>
  49. #include "SharedHandle.h"
  50. #include "IntSequence.h"
  51. #include "a2time.h"
  52. #include "a2netcompat.h"
  53. #include "a2functional.h"
  54. namespace aria2 {
  55. class Randomizer;
  56. class BitfieldMan;
  57. class BinaryStream;
  58. class FileEntry;
  // Parses the C string X as a base-10 signed 64-bit integer with strtoll().
  // The end-pointer argument is null, so the caller cannot tell where
  // parsing stopped.
  #define STRTOLL(X)  strtoll(X, reinterpret_cast<char**>(0), 10)

  // Unsigned counterpart of STRTOLL, built on strtoull().
  #define STRTOULL(X)  strtoull(X, reinterpret_cast<char**>(0), 10)

  // Index of the piece that contains byte OFFSET.
  #define START_INDEX(OFFSET, PIECE_LENGTH)  ((OFFSET)/(PIECE_LENGTH))

  // Index of the piece that contains the last byte of the LENGTH bytes
  // starting at OFFSET (byte OFFSET+LENGTH-1).
  #define END_INDEX(OFFSET, LENGTH, PIECE_LENGTH)  (((OFFSET)+(LENGTH)-1)/(PIECE_LENGTH))

  // Despite its name this evaluates to X/Y rounded UP: 1 is added to the
  // quotient whenever X%Y is non-zero. X and Y are each evaluated twice,
  // so do not pass expressions with side effects.
  #define DIV_FLOOR(X,Y)  ((X)/(Y)+((X)%(Y)? 1:0))
  #ifdef WORDS_BIGENDIAN

  // Big-endian build: both 64-bit conversions return their argument
  // unchanged.
  inline uint64_t ntoh64(uint64_t x)
  {
    return x;
  }

  inline uint64_t hton64(uint64_t x)
  {
    return x;
  }

  #else // !WORDS_BIGENDIAN

  // Passes each 32-bit half of x through ntohl() and exchanges the two
  // halves: the converted low half becomes the high half of the result.
  inline uint64_t byteswap64(uint64_t x)
  {
    const uint64_t convertedLow = ntohl(x & 0x00000000ffffffff);
    const uint64_t convertedHigh = ntohl(x >> 32);
    return (convertedLow << 32) | convertedHigh;
  }

  // Network-to-host conversion of a 64-bit value; delegates to byteswap64().
  inline uint64_t ntoh64(uint64_t x)
  {
    return byteswap64(x);
  }

  // Host-to-network conversion of a 64-bit value; delegates to byteswap64().
  inline uint64_t hton64(uint64_t x)
  {
    return byteswap64(x);
  }

  #endif // !WORDS_BIGENDIAN
  76. namespace util {
  // Two-part split of src; the result is delivered through hp.
  // NOTE(review): presumably hp.first / hp.second receive the text before
  // and after delim. Which occurrence of delim is used, and what hp holds
  // when delim is absent, is decided by the definition (not visible in
  // this header) -- confirm before relying on either.
  void split(std::pair<std::string, std::string>& hp, const std::string& src,
             char delim);

  // Variant that returns the pair by value. delims is a string; presumably
  // it is treated as a set of accepted delimiter characters -- TODO confirm.
  std::pair<std::string, std::string> split(const std::string& src,
                                            const std::string& delims);
  // Formats the non-negative integer value as a base-10 string. When comma
  // is true a ',' is placed between every group of three digits, counted
  // from the least significant digit (1234567 -> "1,234,567").
  //
  // The digits are produced least significant first and the buffer is
  // reversed at the end.
  template<typename T>
  std::string uitos(T value, bool comma = false)
  {
    if(value == 0) {
      return std::string("0");
    }
    std::string digits;
    for(unsigned int nth = 1; value; ++nth, value /= 10) {
      const char ch = value%10+'0';
      // The 4th, 7th, 10th, ... digit opens a new group of three.
      const bool opensGroup = nth > 3 && nth%3 == 1;
      if(comma && opensGroup) {
        digits += ',';
      }
      digits += ch;
    }
    std::reverse(digits.begin(), digits.end());
    return digits;
  }
  // Formats the integer value as a base-10 string, prefixed with '-' when
  // value is negative. When comma is true a ',' is placed between every
  // group of three digits (-1234567 -> "-1,234,567").
  //
  // The digits are taken from value itself rather than from -value:
  // negating the most negative value of a signed type overflows, which is
  // undefined behavior. For a negative value the remainder value%10 lies
  // in [-9, 0], so only the single digit is negated, which is always safe.
  template<typename T>
  std::string itos(T value, bool comma = false)
  {
    if(value == 0) {
      return std::string("0");
    }
    const bool negative = value < 0;
    std::string str;
    unsigned int count = 0;
    while(value) {
      ++count;
      int digit = static_cast<int>(value%10);
      if(digit < 0) {
        digit = -digit;
      }
      if(comma && count > 3 && count%3 == 1) {
        str += ',';
      }
      str += static_cast<char>('0'+digit);
      value /= 10;
    }
    // The buffer is built in reverse, so the sign goes last.
    if(negative) {
      str += '-';
    }
    std::reverse(str.begin(), str.end());
    return str;
  }
  /**
   * Returns tv1 - tv2 in micro-seconds, treating tv1 as the newer of
   * the two instants. When tv1 is older than tv2 the result is 0.
   */
  int64_t difftv(struct timeval tv1, struct timeval tv2);

  // NOTE(review): undocumented in this header; presumably the same
  // difference expressed in whole seconds -- confirm against the
  // definition.
  int32_t difftvsec(struct timeval tv1, struct timeval tv2);
  // Character set used by trim() and trimSelf() when the caller does not
  // supply one. Defined elsewhere; its contents are not visible here.
  extern const std::string DEFAULT_TRIM_CHARSET;

  // NOTE(review): presumably returns a copy of src with the characters of
  // trimCharset stripped from its ends -- confirm against the definition.
  std::string trim(const std::string& src,
                   const std::string& trimCharset = DEFAULT_TRIM_CHARSET);

  // Variant operating on str itself (str is taken by non-const reference).
  void trimSelf(std::string& str,
                const std::string& trimCharset = DEFAULT_TRIM_CHARSET);

  // NOTE(review): presumably prefix / suffix tests of target against
  // part; behavior for an empty part is not visible here -- confirm.
  bool startsWith(const std::string& target, const std::string& part);

  bool endsWith(const std::string& target, const std::string& part);

  // NOTE(review): presumably returns target with oldstr replaced by
  // newstr -- confirm whether every occurrence is replaced.
  std::string replace(const std::string& target,
                      const std::string& oldstr,
                      const std::string& newstr);
  // Percent-encoding helpers; the definitions live outside this header.
  // NOTE(review): judging by the names, urlencode() follows RFC 3986 and
  // torrentUrlencode() follows BitTorrent tracker conventions. Which
  // characters each one leaves unescaped is not visible here -- confirm.
  std::string urlencode(const unsigned char* target, size_t len);

  std::string urlencode(const std::string& target);

  // NOTE(review): presumably membership tests for the RFC 3986 reserved
  // and unreserved character sets -- confirm.
  bool inRFC3986ReservedChars(const char c);

  bool inRFC3986UnreservedChars(const char c);

  // NOTE(review): presumably the inverse of urlencode() -- confirm how
  // malformed escape sequences are handled.
  std::string urldecode(const std::string& target);

  std::string torrentUrlencode(const unsigned char* target, size_t len);

  std::string torrentUrlencode(const std::string& target);
  // Hexadecimal encoders for a byte buffer (unsigned or plain char) of
  // len bytes and for a whole string.
  // NOTE(review): the letter case of the produced digits is decided by
  // the definition, which is not visible here.
  std::string toHex(const unsigned char* src, size_t len);

  std::string toHex(const char* src, size_t len);

  std::string toHex(const std::string& src);

  // Converts the hexadecimal ASCII string src into packed binary form and
  // returns it. An empty string is returned when src is not well formed.
  std::string fromHex(const std::string& src);
  145. FILE* openFile(const std::string& filename, const std::string& mode);
  146. bool isPowerOf(int num, int base);
  147. std::string secfmt(time_t sec);
  148. int32_t parseInt(const std::string& s, int32_t base = 10);
  149. uint32_t parseUInt(const std::string& s, int base = 10);
  150. bool parseUIntNoThrow(uint32_t& result, const std::string& s, int base = 10);
  151. int64_t parseLLInt(const std::string& s, int32_t base = 10);
  152. uint64_t parseULLInt(const std::string& s, int base = 10);
  153. IntSequence parseIntRange(const std::string& src);
  154. // Parses string which specifies the range of piece index for higher
  155. // priority and appends those indexes into result. The input string
  156. // src can contain 2 keywords "head" and "tail". To include both
  157. // keywords, they must be separated by comma. "head" means the pieces
  158. // where the first byte of each file sits. "tail" means the pieces
  159. // where the last byte of each file sits. These keywords can take one
  160. // parameter, SIZE. For example, if "head=SIZE" is specified, pieces
  161. // in the range of first SIZE bytes of each file get higher
  162. // priority. SIZE can include K or M(1K = 1024, 1M = 1024K).
  163. // If SIZE is omitted, SIZE=defaultSize is used.
  164. //
  165. // sample: head=512K,tail=512K
  166. void parsePrioritizePieceRange
  167. (std::vector<size_t>& result, const std::string& src,
  168. const std::vector<SharedHandle<FileEntry> >& fileEntries,
  169. size_t pieceLength,
  170. uint64_t defaultSize = 1048576 /* 1MiB */);
  171. // Converts ISO/IEC 8859-1 string src to utf-8.
  172. std::string iso8859ToUtf8(const std::string& src);
  173. std::string getContentDispositionFilename(const std::string& header);
  174. std::string randomAlpha(size_t length,
  175. const SharedHandle<Randomizer>& randomizer);
  176. std::string toUpper(const std::string& src);
  177. std::string toLower(const std::string& src);
  178. bool isNumericHost(const std::string& name);
  179. void setGlobalSignalHandler(int signal, void (*handler)(int), int flags);
  180. std::string getHomeDir();
  181. int64_t getRealSize(const std::string& sizeWithUnit);
  182. std::string abbrevSize(int64_t size);
  183. template<typename InputIterator>
  184. void toStream
  185. (InputIterator first, InputIterator last, std::ostream& os)
  186. {
  187. os << _("Files:") << "\n";
  188. os << "idx|path/length" << "\n";
  189. os << "===+===========================================================================" << "\n";
  190. int32_t count = 1;
  191. for(; first != last; ++first, ++count) {
  192. os << std::setw(3) << count << "|" << (*first)->getPath() << "\n";
  193. os << " |" << util::abbrevSize((*first)->getLength()) << "B ("
  194. << util::uitos((*first)->getLength(), true) << ")\n";
  195. os << "---+---------------------------------------------------------------------------" << "\n";
  196. }
  197. }
  // NOTE(review): presumably suspend the caller for the given number of
  // seconds / microseconds -- confirm the behavior on interruption.
  void sleep(long seconds);

  void usleep(long microseconds);

  // NOTE(review): presumably character-class checks over the whole
  // string; the result for an empty string is not visible here --
  // confirm.
  bool isNumber(const std::string& what);

  bool isLowercase(const std::string& what);

  bool isUppercase(const std::string& what);

  /**
   * Interprets alphabets as a base 26 integer in which 'a' (or 'A')
   * stands for 0, and returns that integer.
   * The input is assumed to consist of the letters a-z only. Upper case
   * is accepted as well, but then every letter must be upper case.
   * Returns 0 if the value overflows.
   */
  unsigned int alphaToNum(const std::string& alphabets);
  211. void mkdirs(const std::string& dirpath);
  212. void convertBitfield(BitfieldMan* dest, const BitfieldMan* src);
  213. // binaryStream has to be opened before calling this function.
  214. std::string toString(const SharedHandle<BinaryStream>& binaryStream);
  215. #ifdef HAVE_POSIX_MEMALIGN
  216. void* allocateAlignedMemory(size_t alignment, size_t size);
  217. #endif // HAVE_POSIX_MEMALIGN
  218. std::pair<std::string, uint16_t>
  219. getNumericNameInfo(const struct sockaddr* sockaddr, socklen_t len);
  220. std::string htmlEscape(const std::string& src);
  221. // Joins path element specified in [first, last). If ".." is found,
  222. // it eats the previous element if it exists. If "." is found, it
  223. // is just ignored and it is not appeared in the result.
  224. template<typename InputIterator>
  225. std::string joinPath(InputIterator first, InputIterator last)
  226. {
  227. std::deque<std::string> elements;
  228. for(;first != last; ++first) {
  229. if(*first == "..") {
  230. if(!elements.empty()) {
  231. elements.pop_back();
  232. }
  233. } else if(*first == ".") {
  234. // do nothing
  235. } else {
  236. elements.push_back(*first);
  237. }
  238. }
  239. return strjoin(elements.begin(), elements.end(), "/");
  240. }
  // Parses a line in INDEX=PATH format and returns it as an (index, path)
  // map entry. INDEX must be an unsigned integer.
  std::map<size_t, std::string>::value_type parseIndexPath(
      const std::string& line);

  // NOTE(review): presumably reads INDEX=PATH lines from i and collects
  // them into a map -- confirm how malformed lines are treated.
  std::map<size_t, std::string> createIndexPathMap(std::istream& i);
  246. /**
  247. * Take a string src which is a delimited list and add its elements
  248. * into result. result is stored in out.
  249. */
  250. template<typename OutputIterator>
  251. OutputIterator split(const std::string& src, OutputIterator out,
  252. const std::string& delims, bool doTrim = false,
  253. bool allowEmpty = false)
  254. {
  255. std::string::size_type p = 0;
  256. while(1) {
  257. std::string::size_type np = src.find_first_of(delims, p);
  258. if(np == std::string::npos) {
  259. std::string term = src.substr(p);
  260. if(doTrim) {
  261. term = util::trim(term);
  262. }
  263. if(allowEmpty || !term.empty()) {
  264. *out = term;
  265. ++out;
  266. }
  267. break;
  268. }
  269. std::string term = src.substr(p, np-p);
  270. if(doTrim) {
  271. term = util::trim(term);
  272. }
  273. p = np+1;
  274. if(allowEmpty || !term.empty()) {
  275. *out = term;
  276. ++out;
  277. }
  278. }
  279. return out;
  280. }
  // NOTE(review): presumably fills the length bytes starting at data with
  // random values -- the source of randomness is not visible here.
  void generateRandomData(unsigned char* data, size_t length);

  // Saves data to the file named filename. An existing file is
  // overwritten when overwrite is true; otherwise this function does
  // nothing. Returns true if the data was saved successfully, false
  // otherwise.
  bool saveAs(const std::string& filename, const std::string& data,
              bool overwrite=false);
  // Prepends dir to relPath. An empty dir is treated as ".".
  //
  //   dir = "/dir", relPath = "foo" => "/dir/foo"
  //   dir = "",     relPath = "foo" => "./foo"
  //   dir = "/",    relPath = "foo" => "/foo"
  std::string applyDir(const std::string& dir,
                       const std::string& relPath);

  // In HTTP/FTP the file name is the file component of the URI; in HTTP
  // it may also be a value of the Content-Disposition header. Such names
  // are likely percent encoded. If one contains, for example, %2F, the
  // decoded basename contains a directory component, which should be
  // avoided. This function exists to fix these issues. It expects src to
  // be a basename that is no longer percent encoded. Currently it
  // replaces '/' and '\' with '_'.
  std::string fixTaintedBasename(const std::string& src);
  // Generates a 20 byte random key and stores it at the address pointed
  // to by key. The caller must provide at least 20 bytes of storage
  // there.
  void generateRandomKey(unsigned char* key);

  // Returns true if the given numeric IPv4 address ipv4addr is in the
  // Private Address Space.
  bool inPrivateAddress(const std::string& ipv4addr);
  307. } // namespace util
  308. } // namespace aria2
  309. #endif // _D_UTIL_H_