12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049 |
- /* <!-- copyright */
- /*
- * aria2 - The high speed download utility
- *
- * Copyright (C) 2006 Tatsuhiro Tsujikawa
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- *
- * In addition, as a special exception, the copyright holders give
- * permission to link the code of portions of this program with the
- * OpenSSL library under certain conditions as described in each
- * individual source file, and distribute linked combinations
- * including the two.
- * You must obey the GNU General Public License in all respects
- * for all of the code used other than OpenSSL. If you modify
- * file(s) with this exception, you may extend this exception to your
- * version of the file(s), but you are not obligated to do so. If you
- * do not wish to do so, delete this exception statement from your
- * version. If you delete this exception statement from all source
- * files in the program, then also delete it here.
- */
- /* copyright --> */
- #include "util.h"
- #ifdef __sun
- // For opensolaris, just include signal.h which includes sys/signal.h
- #ifdef HAVE_SIGNAL_H
- # include <signal.h>
- #endif // HAVE_SIGNAL_H
- #else // !__sun
- #ifdef HAVE_SYS_SIGNAL_H
- # include <sys/signal.h>
- #endif // HAVE_SYS_SIGNAL_H
- #ifdef HAVE_SIGNAL_H
- # include <signal.h>
- #endif // HAVE_SIGNAL_H
- #endif // !__sun
- #include <sys/types.h>
- #ifdef HAVE_PWD_H
- # include <pwd.h>
- #endif // HAVE_PWD_H
- #include <cerrno>
- #include <cassert>
- #include <cstring>
- #include <cstdio>
- #include <cstdlib>
- #include <sstream>
- #include <ostream>
- #include <algorithm>
- #include <fstream>
- #include <iomanip>
- #include "SimpleRandomizer.h"
- #include "File.h"
- #include "Randomizer.h"
- #include "a2netcompat.h"
- #include "BitfieldMan.h"
- #include "DefaultDiskWriter.h"
- #include "FatalException.h"
- #include "FileEntry.h"
- #include "A2STR.h"
- #include "array_fun.h"
- #include "bitfield.h"
- #include "DownloadHandlerConstants.h"
- #include "RequestGroup.h"
- #include "LogFactory.h"
- #include "Logger.h"
- #include "Option.h"
- #include "DownloadContext.h"
- #include "BufferedFile.h"
- #include "SocketCore.h"
- #include "Lock.h"
- #include "MessageDigest.h"
- #include "message_digest_helper.h"
- // For libc6 which doesn't define ULLONG_MAX properly because of broken limits.h
- #ifndef ULLONG_MAX
- # define ULLONG_MAX 18446744073709551615ULL
- #endif // ULLONG_MAX
- namespace aria2 {
- #ifdef __MINGW32__
- namespace {
- int utf8ToWChar(wchar_t* out, size_t outLength, const char* src)
- {
- return MultiByteToWideChar(CP_UTF8, 0, src, -1, out, outLength);
- }
- } // namespace
- namespace {
- int wCharToUtf8(char* out, size_t outLength, const wchar_t* src)
- {
- return WideCharToMultiByte(CP_UTF8, 0, src, -1, out, outLength,
- nullptr, nullptr);
- }
- } // namespace
- std::wstring utf8ToWChar(const char* src)
- {
- int len = utf8ToWChar(nullptr, 0, src);
- if(len <= 0) {
- abort();
- }
- auto buf = make_unique<wchar_t[]>((size_t)len);
- len = utf8ToWChar(buf.get(), len, src);
- if(len <= 0) {
- abort();
- } else {
- return buf.get();
- }
- }
// Convenience overload: converts the contents of |src| (up to its
// first NUL, since the C-string overload is used) to wide characters.
std::wstring utf8ToWChar(const std::string& src)
{
  const char* const utf8 = src.c_str();
  return utf8ToWChar(utf8);
}
- std::string wCharToUtf8(const std::wstring& wsrc)
- {
- int len = wCharToUtf8(nullptr, 0, wsrc.c_str());
- if(len <= 0) {
- abort();
- }
- auto buf = make_unique<char[]>((size_t)len);
- len = wCharToUtf8(buf.get(), len, wsrc.c_str());
- if(len <= 0) {
- abort();
- } else {
- return buf.get();
- }
- }
// Returns a copy of |src| in which every backslash has been replaced
// by a forward slash. All other characters are left as they are.
std::string toForwardSlash(const std::string &src) {
  std::string converted(src);
  for(std::string::iterator it = converted.begin(); it != converted.end();
      ++it) {
    if(*it == '\\') {
      *it = '/';
    }
  }
  return converted;
}
- #endif // __MINGW32__
- namespace util {
// Character set made of CR, LF, TAB and space.
// NOTE(review): presumably the default |chars| argument of strip();
// the default itself is declared outside this file section -- confirm
// against util.h.
- const char DEFAULT_STRIP_CHARSET[] = "\r\n\t ";
- std::string strip(const std::string& str, const char* chars)
- {
- std::pair<std::string::const_iterator,
- std::string::const_iterator> p =
- stripIter(str.begin(), str.end(), chars);
- return std::string(p.first, p.second);
- }
- std::string itos(int64_t value, bool comma)
- {
- bool flag = false;
- std::string str;
- if(value < 0) {
- if(value == INT64_MIN) {
- if(comma) {
- str = "-9,223,372,036,854,775,808";
- } else {
- str = "-9223372036854775808";
- }
- return str;
- }
- flag = true;
- value = -value;
- }
- str = uitos(value, comma);
- if(flag) {
- str.insert(str.begin(), '-');
- }
- return str;
- }
// Returns tv1 - tv2 in microseconds, or 0 when tv1 is earlier than
// tv2 (the result is never negative).
int64_t difftv(struct timeval tv1, struct timeval tv2) {
  const bool sameSecond = tv1.tv_sec == tv2.tv_sec;
  const bool earlier =
    tv1.tv_sec < tv2.tv_sec || (sameSecond && tv1.tv_usec < tv2.tv_usec);
  if(earlier) {
    return 0;
  }
  // Widen before scaling so the multiplication is done in 64 bits.
  const int64_t wholeSeconds = (int64_t)(tv1.tv_sec - tv2.tv_sec);
  return wholeSeconds * 1000000 + tv1.tv_usec - tv2.tv_usec;
}
// Returns the difference of the whole-second parts of tv1 and tv2
// (microseconds are ignored), or 0 when tv1's second is earlier.
int32_t difftvsec(struct timeval tv1, struct timeval tv2) {
  if(tv2.tv_sec > tv1.tv_sec) {
    return 0;
  }
  const auto elapsed = tv1.tv_sec - tv2.tv_sec;
  return elapsed;
}
// Returns a copy of |target| with every non-overlapping occurrence of
// |oldstr| (scanning left to right) replaced by |newstr|. If |target|
// or |oldstr| is empty, |target| is returned unchanged.
std::string replace(const std::string& target, const std::string& oldstr, const std::string& newstr) {
  if(target.empty() || oldstr.empty()) {
    return target;
  }
  std::string out;
  std::string::size_type cursor = 0;
  for(std::string::size_type hit = target.find(oldstr);
      hit != std::string::npos;
      hit = target.find(oldstr, cursor)) {
    // Copy the untouched text in front of the match, then the
    // replacement, and continue right after the match.
    out.append(target, cursor, hit - cursor);
    out.append(newstr);
    cursor = hit + oldstr.size();
  }
  out.append(target, cursor, std::string::npos);
  return out;
}
// Returns true if |c| is an ASCII letter ('A'-'Z' or 'a'-'z').
// Locale independent.
bool isAlpha(const char c)
{
  const bool upper = c >= 'A' && c <= 'Z';
  const bool lower = c >= 'a' && c <= 'z';
  return upper || lower;
}
// Returns true if |c| is an ASCII decimal digit ('0'-'9').
// Locale independent.
bool isDigit(const char c)
{
  // Anything below '0' wraps to a large unsigned value and so fails
  // the single comparison as well.
  return static_cast<unsigned int>(c - '0') <= 9u;
}
- bool isHexDigit(const char c)
- {
- return isDigit(c) || ('A' <= c && c <= 'F') || ('a' <= c && c <= 'f');
- }
- bool isHexDigit(const std::string& s)
- {
- for (const auto& c : s) {
- if(!isHexDigit(c)) {
- return false;
- }
- }
- return true;
- }
// Returns true if |c| is one of the RFC 3986 "reserved" characters
// (gen-delims and sub-delims):
//   : / ? # [ ] @ ! $ & ' ( ) * + , ; =
bool inRFC3986ReservedChars(const char c)
{
  switch(c) {
  case ':': case '/': case '?': case '#': case '[': case ']': case '@':
  case '!': case '$': case '&': case '\'': case '(': case ')':
  case '*': case '+': case ',': case ';': case '=':
    return true;
  default:
    return false;
  }
}
- bool inRFC3986UnreservedChars(const char c)
- {
- static const char unreserved[] = { '-', '.', '_', '~' };
- return isAlpha(c) || isDigit(c) ||
- std::find(std::begin(unreserved), std::end(unreserved), c)
- != std::end(unreserved);
- }
- bool inRFC2978MIMECharset(const char c)
- {
- static const char chars[] = {
- '!', '#', '$', '%', '&',
- '\'', '+', '-', '^', '_',
- '`', '{', '}', '~'
- };
- return isAlpha(c) || isDigit(c) ||
- std::find(std::begin(chars), std::end(chars), c) != std::end(chars);
- }
- bool inRFC2616HttpToken(const char c)
- {
- static const char chars[] = {
- '!', '#', '$', '%', '&', '\'', '*', '+', '-', '.',
- '^', '_', '`', '|', '~'
- };
- return isAlpha(c) || isDigit(c) ||
- std::find(std::begin(chars), std::end(chars), c) != std::end(chars);
- }
- bool inRFC5987AttrChar(const char c)
- {
- return inRFC2616HttpToken(c) && c != '*' && c != '\'' && c != '%';
- }
// Returns true if |c| is a graphic ISO/IEC 8859-1 character, that is
// 0x20-0x7e or 0xa0-0xff. The control ranges 0x00-0x1f and 0x7f-0x9f
// yield false.
bool isIso8859p1(unsigned char c)
{
  if(c >= 0xa0u) {
    return true;
  }
  return c >= 0x20u && c <= 0x7eu;
}
// Returns true if |c| is linear white space: a space or a horizontal
// tab.
bool isLws(const char c)
{
  switch(c) {
  case ' ':
  case '\t':
    return true;
  default:
    return false;
  }
}
// Returns true if |c| is a carriage return or a line feed.
bool isCRLF(const char c)
{
  switch(c) {
  case '\r':
  case '\n':
    return true;
  default:
    return false;
  }
}
- namespace {
- bool isUtf8Tail(unsigned char ch)
- {
- return in(ch, 0x80u, 0xbfu);
- }
- bool inPercentEncodeMini(const unsigned char c)
- {
- return c > 0x20 && c < 0x7fu &&
- // Chromium escapes following characters. Firefox4 escapes more.
- c != '"' && c != '<' && c != '>';
- }
- } // namespace
- bool isUtf8(const std::string& str)
- {
- for(std::string::const_iterator s = str.begin(), eos = str.end(); s != eos;
- ++s) {
- unsigned char firstChar = *s;
- // See ABNF in http://tools.ietf.org/search/rfc3629#section-4
- if(in(firstChar, 0x20u, 0x7eu) ||
- firstChar == 0x08u || // \b
- firstChar == 0x09u || // \t
- firstChar == 0x0au || // \n
- firstChar == 0x0cu || // \f
- firstChar == 0x0du // \r
- ) {
- // UTF8-1 (without ctrl chars)
- } else if(in(firstChar, 0xc2u, 0xdfu)) {
- // UTF8-2
- if(++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xe0u == firstChar) {
- // UTF8-3
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0xa0u, 0xbfu) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(in(firstChar, 0xe1u, 0xecu) || in(firstChar, 0xeeu, 0xefu)) {
- // UTF8-3
- if(++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xedu == firstChar) {
- // UTF8-3
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0x80u, 0x9fu) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xf0u == firstChar) {
- // UTF8-4
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0x90u, 0xbfu) ||
- ++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(in(firstChar, 0xf1u, 0xf3u)) {
- // UTF8-4
- if(++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xf4u == firstChar) {
- // UTF8-4
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0x80u, 0x8fu) ||
- ++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else {
- return false;
- }
- }
- return true;
- }
- std::string percentEncode(const unsigned char* target, size_t len)
- {
- std::string dest;
- for(size_t i = 0; i < len; ++i) {
- if(inRFC3986UnreservedChars(target[i])) {
- dest += target[i];
- } else {
- dest.append(fmt("%%%02X", target[i]));
- }
- }
- return dest;
- }
- std::string percentEncode(const std::string& target)
- {
- if (std::find_if_not(target.begin(), target.end(),
- inRFC3986UnreservedChars) == target.end()) {
- return target;
- }
- return percentEncode(reinterpret_cast<const unsigned char*>(target.c_str()),
- target.size());
- }
- std::string percentEncodeMini(const std::string& src)
- {
- if (std::find_if_not(src.begin(), src.end(), inPercentEncodeMini) ==
- src.end()) {
- return src;
- }
- std::string result;
- for (auto c: src) {
- if(!inPercentEncodeMini(c)) {
- result += fmt("%%%02X", static_cast<unsigned char>(c));
- } else {
- result += c;
- }
- }
- return result;
- }
- std::string torrentPercentEncode(const unsigned char* target, size_t len) {
- std::string dest;
- for(size_t i = 0; i < len; ++i) {
- if(isAlpha(target[i]) || isDigit(target[i])) {
- dest += target[i];
- } else {
- dest.append(fmt("%%%02X", target[i]));
- }
- }
- return dest;
- }
- std::string torrentPercentEncode(const std::string& target)
- {
- return torrentPercentEncode
- (reinterpret_cast<const unsigned char*>(target.c_str()), target.size());
- }
- std::string percentDecode
- (std::string::const_iterator first, std::string::const_iterator last)
- {
- std::string result;
- for(; first != last; ++first) {
- if(*first == '%') {
- if(first+1 != last && first+2 != last &&
- isHexDigit(*(first+1)) && isHexDigit(*(first+2))) {
- result += hexCharToUInt(*(first+1))*16+hexCharToUInt(*(first+2));
- first += 2;
- } else {
- result += *first;
- }
- } else {
- result += *first;
- }
- }
- return result;
- }
// Returns the lower-case hexadecimal representation of the |len| bytes
// starting at |src|: two characters per byte, high nibble first.
std::string toHex(const unsigned char* src, size_t len) {
  static const char digits[] = "0123456789abcdef";
  std::string out;
  out.reserve(len*2);
  for(size_t i = 0; i < len; ++i) {
    const unsigned char byte = src[i];
    out += digits[byte >> 4];
    out += digits[byte & 0x0fu];
  }
  return out;
}
- std::string toHex(const char* src, size_t len)
- {
- return toHex(reinterpret_cast<const unsigned char*>(src), len);
- }
- std::string toHex(const std::string& src)
- {
- return toHex(reinterpret_cast<const unsigned char*>(src.c_str()), src.size());
- }
// Returns the numeric value (0-15) of the hexadecimal digit |ch|,
// accepting both letter cases. Any other character yields 255.
unsigned int hexCharToUInt(unsigned char ch)
{
  if(ch >= '0' && ch <= '9') {
    return ch - '0';
  }
  if(ch >= 'a' && ch <= 'f') {
    return ch - 'a' + 10;
  }
  if(ch >= 'A' && ch <= 'F') {
    return ch - 'A' + 10;
  }
  return 255;
}
- std::string secfmt(time_t sec) {
- time_t tsec = sec;
- std::string str;
- if(sec >= 3600) {
- str = fmt("%" PRId64 "h", static_cast<int64_t>(sec/3600));
- sec %= 3600;
- }
- if(sec >= 60) {
- str += fmt("%dm", static_cast<int>(sec/60));
- sec %= 60;
- }
- if(sec || tsec == 0) {
- str += fmt("%ds", static_cast<int>(sec));
- }
- return str;
- }
namespace {
// Parses the integer in |s| using the strtol-like function |f| and
// stores the converted value in |res|.
//
// |f| must have the signature of strtol/strtoll: it receives the
// C string, an end-pointer out-parameter and |base|, and reports range
// errors via errno == ERANGE.
//
// Returns true only when:
//  * |s| is not empty,
//  * |f| consumed at least one character (a string holding no number
//    at all, e.g. only white space, is rejected rather than parsed as
//    0),
//  * no range error was reported, and
//  * everything after the number is white space.
//
// |res| is assigned the result of |f| even when false is returned.
template<typename T, typename F>
bool parseLong(T& res, F f, const std::string& s, int base)
{
  if(s.empty()) {
    return false;
  }
  const char* const begin = s.c_str();
  char* endptr = nullptr;
  errno = 0;
  res = f(begin, &endptr, base);
  if(errno == ERANGE) {
    return false;
  }
  if(endptr == begin) {
    // strtol-family functions leave the end pointer at the start when
    // no conversion could be performed.
    return false;
  }
  if(*endptr != '\0') {
    for(const char* i = endptr, *eoi = begin+s.size(); i < eoi; ++i) {
      // isspace() is only defined for values representable as unsigned
      // char (or EOF), so a plain char must be converted first.
      if(!isspace(static_cast<unsigned char>(*i))) {
        return false;
      }
    }
  }
  return true;
}
} // namespace
- bool parseIntNoThrow(int32_t& res, const std::string& s, int base)
- {
- long int t;
- if(parseLong(t, strtol, s, base) &&
- t >= std::numeric_limits<int32_t>::min() &&
- t <= std::numeric_limits<int32_t>::max()) {
- res = t;
- return true;
- } else {
- return false;
- }
- }
- bool parseUIntNoThrow(uint32_t& res, const std::string& s, int base)
- {
- long int t;
- if(parseLong(t, strtol, s, base) &&
- t >= 0 &&
- t <= std::numeric_limits<int32_t>::max()) {
- res = t;
- return true;
- } else {
- return false;
- }
- }
- bool parseLLIntNoThrow(int64_t& res, const std::string& s, int base)
- {
- long long int t;
- if(parseLong(t, strtoll, s, base) &&
- t >= std::numeric_limits<int64_t>::min() &&
- t <= std::numeric_limits<int64_t>::max()) {
- res = t;
- return true;
- } else {
- return false;
- }
- }
- SegList<int> parseIntSegments(const std::string& src)
- {
- SegList<int> sgl;
- for(std::string::const_iterator i = src.begin(), eoi = src.end(); i != eoi;) {
- std::string::const_iterator j = std::find(i, eoi, ',');
- if(j == i) {
- ++i;
- continue;
- }
- std::string::const_iterator p = std::find(i, j, '-');
- if(p == j) {
- int a;
- if(parseIntNoThrow(a, std::string(i, j))) {
- sgl.add(a, a+1);
- } else {
- throw DL_ABORT_EX(fmt("Bad range %s", std::string(i, j).c_str()));
- }
- } else if(p == i || p+1 == j) {
- throw DL_ABORT_EX(fmt(MSG_INCOMPLETE_RANGE, std::string(i, j).c_str()));
- } else {
- int a, b;
- if(parseIntNoThrow(a, std::string(i, p)) &&
- parseIntNoThrow(b, (std::string(p+1, j)))) {
- sgl.add(a, b+1);
- } else {
- throw DL_ABORT_EX(fmt("Bad range %s", std::string(i, j).c_str()));
- }
- }
- if(j == eoi) {
- break;
- }
- i = j+1;
- }
- return sgl;
- }
- namespace {
- void computeHeadPieces
- (std::vector<size_t>& indexes,
- const std::vector<std::shared_ptr<FileEntry> >& fileEntries,
- size_t pieceLength,
- int64_t head)
- {
- if(head == 0) {
- return;
- }
- for (const auto& fi: fileEntries) {
- if(fi->getLength() == 0) {
- continue;
- }
- const size_t lastIndex = (fi->getOffset() +
- std::min(head, fi->getLength()) - 1
- ) / pieceLength;
- for(size_t idx = fi->getOffset() / pieceLength; idx <= lastIndex; ++idx) {
- indexes.push_back(idx);
- }
- }
- }
- } // namespace
- namespace {
- void computeTailPieces
- (std::vector<size_t>& indexes,
- const std::vector<std::shared_ptr<FileEntry> >& fileEntries,
- size_t pieceLength,
- int64_t tail)
- {
- if(tail == 0) {
- return;
- }
- for (const auto& fi: fileEntries) {
- if(fi->getLength() == 0) {
- continue;
- }
- int64_t endOffset = fi->getLastOffset();
- size_t fromIndex = (endOffset - 1 - (std::min(tail, fi->getLength()) - 1)) /
- pieceLength;
- const size_t toIndex = (endOffset - 1) / pieceLength;
- while (fromIndex <= toIndex) {
- indexes.push_back(fromIndex++);
- }
- }
- }
- } // namespace
- void parsePrioritizePieceRange
- (std::vector<size_t>& result, const std::string& src,
- const std::vector<std::shared_ptr<FileEntry> >& fileEntries,
- size_t pieceLength,
- int64_t defaultSize)
- {
- std::vector<size_t> indexes;
- std::vector<Scip> parts;
- splitIter(src.begin(), src.end(), std::back_inserter(parts), ',', true);
- for (const auto& i: parts) {
- if(util::streq(i.first, i.second, "head")) {
- computeHeadPieces(indexes, fileEntries, pieceLength, defaultSize);
- }
- else if(util::startsWith(i.first, i.second, "head=")) {
- std::string sizestr(i.first + 5, i.second);
- computeHeadPieces(indexes, fileEntries, pieceLength,
- std::max((int64_t)0, getRealSize(sizestr)));
- }
- else if(util::streq(i.first, i.second, "tail")) {
- computeTailPieces(indexes, fileEntries, pieceLength, defaultSize);
- }
- else if(util::startsWith(i.first, i.second, "tail=")) {
- std::string sizestr(i.first + 5, i.second);
- computeTailPieces(indexes, fileEntries, pieceLength,
- std::max((int64_t)0, getRealSize(sizestr)));
- }
- else {
- throw DL_ABORT_EX(fmt("Unrecognized token %s",
- std::string(i.first, i.second).c_str()));
- }
- }
- std::sort(indexes.begin(), indexes.end());
- indexes.erase(std::unique(indexes.begin(), indexes.end()), indexes.end());
- result.insert(result.end(), indexes.begin(), indexes.end());
- }
// Converts the |len| bytes of the ISO/IEC 8859-1 string |src| to
// UTF-8. Bytes below 0x80 are copied unchanged; bytes 0xa0-0xff are
// expanded to the two-byte sequence 0xc2/0xc3 + continuation byte. If
// a byte in the range 0x80-0x9f is found, an empty string is returned.
std::string iso8859p1ToUtf8(const char* src, size_t len)
{
  std::string utf8;
  for(size_t i = 0; i < len; ++i) {
    const unsigned char c = src[i];
    if(c < 0x80u) {
      utf8 += c;
      continue;
    }
    if(c <= 0x9fu) {
      return "";
    }
    // 0xa0-0xbf map to U+00A0-U+00BF (lead 0xc2), 0xc0-0xff map to
    // U+00C0-U+00FF (lead 0xc3); clearing bit 6 gives the tail byte.
    utf8 += (c <= 0xbfu) ? 0xc2u : 0xc3u;
    utf8 += c&(~0x40u);
  }
  return utf8;
}
- std::string iso8859p1ToUtf8(const std::string& src)
- {
- return iso8859p1ToUtf8(src.c_str(), src.size());
- }
- /* Start of utf8 dfa */
- /* Copyright (c) 2008-2010 Bjoern Hoehrmann <bjoern@hoehrmann.de>
- * See http://bjoern.hoehrmann.de/utf-8/decoder/dfa/ for details.
- *
- * Copyright (c) 2008-2009 Bjoern Hoehrmann <bjoern@hoehrmann.de>
- *
- * Permission is hereby granted, free of charge, to any person
- * obtaining a copy of this software and associated documentation
- * files (the "Software"), to deal in the Software without
- * restriction, including without limitation the rights to use, copy,
- * modify, merge, publish, distribute, sublicense, and/or sell copies
- * of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be
- * included in all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
- * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
- * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
- * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- */
- #define UTF8_ACCEPT 0 // DFA state: a complete code point has been decoded (also the start state)
- #define UTF8_REJECT 12 // DFA state: the byte sequence is not valid UTF-8
- static const uint8_t utf8d[] = {
- /*
- * The first part of the table (256 entries, indexed by the byte
- * value) maps each byte to a character class. Using classes keeps
- * the transition table small, and the class number is also used by
- * utf8dfa() as a shift count to mask the payload bits of a leading
- * byte.
- */
- 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
- 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
- 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
- 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
- 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
- 7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7, 7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
- 8,8,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
- 10,3,3,3,3,3,3,3,3,3,3,3,3,4,3,3, 11,6,6,6,5,8,8,8,8,8,8,8,8,8,8,8,
- /*
- * The second part is a transition table that maps a combination
- * of a state of the automaton and a character class to a state.
- * It starts at index 256 and is addressed as
- * utf8d[256 + state + class]; state values are multiples of 12,
- * i.e. each state owns one row of 12 class columns.
- */
- 0,12,24,36,60,96,84,12,12,12,48,72, 12,12,12,12,12,12,12,12,12,12,12,12,
- 12, 0,12,12,12,12,12, 0,12, 0,12,12, 12,24,12,12,12,12,12,24,12,24,12,12,
- 12,12,12,12,12,12,12,24,12,12,12,12, 12,24,12,12,12,12,12,12,12,24,12,12,
- 12,12,12,12,12,12,12,36,12,36,12,12, 12,36,12,12,12,12,12,36,12,36,12,12,
- 12,36,12,12,12,12,12,12,12,12,12,12,
- };
- static uint32_t
- utf8dfa(uint32_t* state, uint32_t* codep, uint32_t byte) {
- uint32_t type = utf8d[byte];
- *codep = (*state != UTF8_ACCEPT) ?
- (byte & 0x3fu) | (*codep << 6) :
- (0xff >> type) & (byte);
- *state = utf8d[256 + *state + type];
- return *state;
- }
- /* End of utf8 dfa */
- typedef enum { // States of the parse_content_disposition() state machine.
- CD_BEFORE_DISPOSITION_TYPE, // initial state: skipping LWS before the disposition type token
- CD_AFTER_DISPOSITION_TYPE, // LWS seen after the disposition type; only LWS or ';' may follow
- CD_DISPOSITION_TYPE, // inside the disposition type token
- CD_BEFORE_DISPOSITION_PARM_NAME, // after ';': skipping LWS before a parameter name
- CD_AFTER_DISPOSITION_PARM_NAME, // LWS seen after the parameter name; waiting for '='
- CD_DISPOSITION_PARM_NAME, // inside a parameter name token
- CD_BEFORE_VALUE, // after '=': skipping LWS before a token or quoted-string value
- CD_AFTER_VALUE, // value finished; only LWS or ';' may follow
- CD_QUOTED_STRING, // inside a double-quoted value (backslash escapes the next char)
- CD_TOKEN, // inside an unquoted token value
- CD_BEFORE_EXT_VALUE, // after '=' of a "name*" parameter: skipping LWS before the charset
- CD_CHARSET, // inside the charset part of an ext-value, terminated by '\''
- CD_LANGUAGE, // inside the language part of an ext-value, terminated by '\''
- CD_VALUE_CHARS, // inside the value-chars part of an ext-value
- CD_VALUE_CHARS_PCT_ENCODED1, // entered after '%' in value-chars
- CD_VALUE_CHARS_PCT_ENCODED2 // NOTE(review): presumably expects the second hex digit of a %XX escape -- confirm in the parser
- } content_disposition_parse_state;
- typedef enum { // Bit flags recording which filename parameters have been parsed.
- CD_FILENAME_FOUND = 1, // set once the value of a "filename" parameter has been read
- CD_EXT_FILENAME_FOUND = 1 << 1 // set once the ext-value of a "filename*" parameter has been read
- } content_disposition_parse_flag;
- typedef enum { // Charset announced in an ext-value, as classified by the parser.
- CD_ENC_UNKNOWN, // any charset other than the two below
- CD_ENC_UTF8, // "utf-8" (case-insensitive); value bytes are validated with the UTF-8 DFA
- CD_ENC_ISO_8859_1 // "iso-8859-1" (case-insensitive)
- } content_disposition_charset;
- ssize_t parse_content_disposition(char *dest, size_t destlen,
- const char **charsetp, size_t *charsetlenp,
- const char *in, size_t len)
- {
- const char *p = in, *eop = in + len, *mark_first = nullptr, *mark_last = nullptr;
- int state = CD_BEFORE_DISPOSITION_TYPE;
- int in_file_parm = 0;
- int flags = 0;
- int quoted_seen = 0;
- int charset = 0;
- /* To suppress warnings */
- char *dp = dest;
- size_t dlen = destlen;
- uint32_t dfa_state = 0;
- uint32_t dfa_code = 0;
- uint8_t pctval = 0;
- *charsetp = nullptr;
- *charsetlenp = 0;
- for(; p != eop; ++p) {
- switch(state) {
- case CD_BEFORE_DISPOSITION_TYPE:
- if(inRFC2616HttpToken(*p)) {
- state = CD_DISPOSITION_TYPE;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_AFTER_DISPOSITION_TYPE:
- case CD_DISPOSITION_TYPE:
- if(*p == ';') {
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else if(isLws(*p)) {
- state = CD_AFTER_DISPOSITION_TYPE;
- } else if(state == CD_AFTER_DISPOSITION_TYPE ||
- !inRFC2616HttpToken(*p)) {
- return -1;
- }
- break;
- case CD_BEFORE_DISPOSITION_PARM_NAME:
- if(inRFC2616HttpToken(*p)) {
- mark_first = p;
- state = CD_DISPOSITION_PARM_NAME;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_AFTER_DISPOSITION_PARM_NAME:
- case CD_DISPOSITION_PARM_NAME:
- if(*p == '=') {
- if(state == CD_DISPOSITION_PARM_NAME) {
- mark_last = p;
- }
- in_file_parm = 0;
- if(strieq(mark_first, mark_last, "filename*")) {
- if((flags & CD_EXT_FILENAME_FOUND) == 0) {
- in_file_parm = 1;
- } else {
- return -1;
- }
- state = CD_BEFORE_EXT_VALUE;
- } else if(strieq(mark_first, mark_last, "filename")) {
- if(flags & CD_FILENAME_FOUND) {
- return -1;
- }
- if((flags & CD_EXT_FILENAME_FOUND) == 0) {
- in_file_parm = 1;
- }
- state = CD_BEFORE_VALUE;
- } else {
- /* ext-token must be characters in token, followed by "*" */
- if(mark_first != mark_last-1 && *(mark_last-1) == '*') {
- state = CD_BEFORE_EXT_VALUE;
- } else {
- state = CD_BEFORE_VALUE;
- }
- }
- if(in_file_parm) {
- dp = dest;
- dlen = destlen;
- }
- } else if(isLws(*p)) {
- mark_last = p;
- state = CD_AFTER_DISPOSITION_PARM_NAME;
- } else if(state == CD_AFTER_DISPOSITION_PARM_NAME ||
- !inRFC2616HttpToken(*p)) {
- return -1;
- }
- break;
- case CD_BEFORE_VALUE:
- if(*p == '"') {
- quoted_seen = 0;
- state = CD_QUOTED_STRING;
- } else if(inRFC2616HttpToken(*p)) {
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- state = CD_TOKEN;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_AFTER_VALUE:
- if(*p == ';') {
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_QUOTED_STRING:
- if(*p == '\\' && quoted_seen == 0) {
- quoted_seen = 1;
- } else if(*p == '"' && quoted_seen == 0) {
- if(in_file_parm) {
- flags |= CD_FILENAME_FOUND;
- }
- state = CD_AFTER_VALUE;
- } else {
- /* TEXT which is OCTET except CTLs, but including LWS. We only
- accept ISO-8859-1 chars. */
- quoted_seen = 0;
- if(!isIso8859p1(*p)) {
- return -1;
- }
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- }
- break;
- case CD_TOKEN:
- if(inRFC2616HttpToken(*p)) {
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- } else if(*p == ';') {
- if(in_file_parm) {
- flags |= CD_FILENAME_FOUND;
- }
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else if(isLws(*p)) {
- if(in_file_parm) {
- flags |= CD_FILENAME_FOUND;
- }
- state = CD_AFTER_VALUE;
- } else {
- return -1;
- }
- break;
- case CD_BEFORE_EXT_VALUE:
- if(*p == '\'') {
- /* Empty charset is not allowed */
- return -1;
- } else if(inRFC2978MIMECharset(*p)) {
- mark_first = p;
- state = CD_CHARSET;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_CHARSET:
- if(*p == '\'') {
- mark_last = p;
- *charsetp = mark_first;
- *charsetlenp = mark_last - mark_first;
- if(strieq(mark_first, mark_last, "utf-8")) {
- charset = CD_ENC_UTF8;
- dfa_state = UTF8_ACCEPT;
- dfa_code = 0;
- } else if(strieq(mark_first, mark_last, "iso-8859-1")) {
- charset = CD_ENC_ISO_8859_1;
- } else {
- charset = CD_ENC_UNKNOWN;
- }
- state = CD_LANGUAGE;
- } else if(!inRFC2978MIMECharset(*p)) {
- return -1;
- }
- break;
- case CD_LANGUAGE:
- if(*p == '\'') {
- if(in_file_parm) {
- dp = dest;
- dlen = destlen;
- }
- state = CD_VALUE_CHARS;
- } else if(*p != '-' && !isAlpha(*p) && !isDigit(*p)) {
- return -1;
- }
- break;
- case CD_VALUE_CHARS:
- if(inRFC5987AttrChar(*p)) {
- if(charset == CD_ENC_UTF8) {
- if(utf8dfa(&dfa_state, &dfa_code, *p) == UTF8_REJECT) {
- return -1;
- }
- }
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- } else if(*p == '%') {
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- }
- }
- pctval = 0;
- state = CD_VALUE_CHARS_PCT_ENCODED1;
- } else if(*p == ';' || isLws(*p)) {
- if(charset == CD_ENC_UTF8 && dfa_state != UTF8_ACCEPT) {
- return -1;
- }
- if(in_file_parm) {
- flags |= CD_EXT_FILENAME_FOUND;
- }
- if(*p == ';') {
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else {
- state = CD_AFTER_VALUE;
- }
- } else if(!inRFC5987AttrChar(*p)) {
- return -1;
- }
- break;
- case CD_VALUE_CHARS_PCT_ENCODED1:
- if(isHexDigit(*p)) {
- pctval |= hexCharToUInt(*p) << 4;
- state = CD_VALUE_CHARS_PCT_ENCODED2;
- } else {
- return -1;
- }
- break;
- case CD_VALUE_CHARS_PCT_ENCODED2:
- if(isHexDigit(*p)) {
- pctval |= hexCharToUInt(*p);
- if(charset == CD_ENC_UTF8) {
- if(utf8dfa(&dfa_state, &dfa_code, pctval) == UTF8_REJECT) {
- return -1;
- }
- } else if(charset == CD_ENC_ISO_8859_1) {
- if(!isIso8859p1(pctval)) {
- return -1;
- }
- }
- if(in_file_parm) {
- *dp++ = pctval;
- --dlen;
- }
- state = CD_VALUE_CHARS;
- } else {
- return -1;
- }
- break;
- }
- }
- switch(state) {
- case CD_BEFORE_DISPOSITION_TYPE:
- case CD_AFTER_DISPOSITION_TYPE:
- case CD_DISPOSITION_TYPE:
- case CD_AFTER_VALUE:
- case CD_TOKEN:
- return destlen-dlen;
- case CD_VALUE_CHARS:
- if(charset == CD_ENC_UTF8 && dfa_state != UTF8_ACCEPT) {
- return -1;
- }
- return destlen - dlen;
- default:
- return -1;
- }
- }
- std::string getContentDispositionFilename(const std::string& header)
- {
- std::array<char, 1_k> cdval;
- size_t cdvallen = cdval.size();
- const char* charset;
- size_t charsetlen;
- ssize_t rv = parse_content_disposition(cdval.data(), cdvallen,
- &charset, &charsetlen,
- header.c_str(), header.size());
- if(rv == -1) {
- return "";
- }
- std::string res;
- if(!charset || strieq(charset, charset+charsetlen, "iso-8859-1")) {
- res = iso8859p1ToUtf8(cdval.data(), rv);
- } else {
- res.assign(cdval.data(), rv);
- }
- if(!detectDirTraversal(res) &&
- res.find_first_of("/\\") == std::string::npos) {
- return res;
- }
- return "";
- }
- std::string toUpper(std::string src)
- {
- uppercase(src);
- return src;
- }
- std::string toLower(std::string src) {
- lowercase(src);
- return src;
- }
- void uppercase(std::string& s)
- {
- std::transform(s.begin(), s.end(), s.begin(), toUpperChar);
- }
- void lowercase(std::string& s)
- {
- std::transform(s.begin(), s.end(), s.begin(), toLowerChar);
- }
// Maps 'a'..'z' to 'A'..'Z'; every other character is returned as is.
// The comparison is done on plain char values, independent of locale.
char toUpperChar(char c)
{
  const bool isLower = 'a' <= c && c <= 'z';
  if(!isLower) {
    return c;
  }
  c += 'A' - 'a';
  return c;
}
// Maps 'A'..'Z' to 'a'..'z'; every other character is returned as is.
// The comparison is done on plain char values, independent of locale.
char toLowerChar(char c)
{
  const bool isUpper = 'A' <= c && c <= 'Z';
  if(!isUpper) {
    return c;
  }
  c += 'a' - 'A';
  return c;
}
// Returns true if |name| is accepted by getaddrinfo() as a numeric host
// address.  AI_NUMERICHOST is set in the hints and the address family is
// left unspecified.
bool isNumericHost(const std::string& name)
{
  struct addrinfo hints;
  memset(&hints, 0, sizeof(hints));
  hints.ai_flags = AI_NUMERICHOST;
  hints.ai_family = AF_UNSPEC;

  struct addrinfo* result;
  const int rc = getaddrinfo(name.c_str(), nullptr, &hints, &result);
  if(rc != 0) {
    return false;
  }
  // Only the success of the call matters; release the result list.
  freeaddrinfo(result);
  return true;
}
#if _WIN32
namespace {
// Handlers registered through setGlobalSignalHandler(); win_signal_lock
// guards reads and writes of both pointers.
static Lock win_signal_lock;
static signal_handler_t win_int_handler = nullptr;
static signal_handler_t win_term_handler = nullptr;

// Stand-in used when the caller asks for SIG_IGN: does nothing.
static void win_ign_handler(int) {}

// Console control callback.  CTRL_C/CTRL_BREAK are dispatched to the
// SIGINT handler, LOGOFF/CLOSE/SHUTDOWN to the SIGTERM handler.  Returns
// TRUE when a handler was invoked, FALSE otherwise (including for any
// other control type).
static BOOL WINAPI HandlerRoutine(DWORD ctrlType)
{
  void(*callback)(int) = nullptr;
  int signo = 0;
  switch(ctrlType) {
  case CTRL_C_EVENT:
  case CTRL_BREAK_EVENT: {
    // Handler will be called on a new/different thread.
    LockGuard guard(win_signal_lock);
    callback = win_int_handler;
    signo = SIGINT;
    break;
  }
  case CTRL_LOGOFF_EVENT:
  case CTRL_CLOSE_EVENT:
  case CTRL_SHUTDOWN_EVENT: {
    // Handler will be called on a new/different thread.
    LockGuard guard(win_signal_lock);
    callback = win_term_handler;
    signo = SIGTERM;
    break;
  }
  default:
    return FALSE;
  }
  // The lock is released before the handler runs.
  if(!callback) {
    return FALSE;
  }
  callback(signo);
  return TRUE;
}
} // namespace
#endif
- void setGlobalSignalHandler(int sig, sigset_t* mask, signal_handler_t handler,
- int flags) {
- #if _WIN32
- if (sig == SIGINT || sig == SIGTERM) {
- // Handler will be called on a new/different thread.
- LockGuard lg(win_signal_lock);
- if (handler == SIG_DFL) {
- handler = nullptr;
- }
- else if (handler == SIG_IGN) {
- handler = win_ign_handler;
- }
- // Not yet in use: add console handler.
- if (handler && !win_int_handler && !win_term_handler) {
- ::SetConsoleCtrlHandler(HandlerRoutine, TRUE);
- }
- if (sig == SIGINT) {
- win_int_handler = handler;
- }
- else {
- win_term_handler = handler;
- }
- // No handlers set: remove.
- if (!win_int_handler && !win_term_handler) {
- ::SetConsoleCtrlHandler(HandlerRoutine, FALSE);
- }
- return;
- }
- #endif
- #ifdef HAVE_SIGACTION
- struct sigaction sigact;
- sigact.sa_handler = handler;
- sigact.sa_flags = flags;
- sigact.sa_mask = *mask;
- sigaction(sig, &sigact, nullptr);
- #else
- signal(sig, handler);
- #endif // HAVE_SIGACTION
- }
- #ifndef __MINGW32__
- std::string getHomeDir()
- {
- const char* p = getenv("HOME");
- if (p) {
- return p;
- }
- #ifdef HAVE_PWD_H
- auto pw = getpwuid(geteuid());
- if (pw && pw->pw_dir) {
- return pw->pw_dir;
- }
- #endif // HAVE_PWD_H
- return A2STR::NIL;
- }
- #else // __MINGW32__
- std::string getHomeDir()
- {
- auto p = _wgetenv(L"HOME");
- if (p) {
- return toForwardSlash(wCharToUtf8(p));
- }
- p = _wgetenv(L"USERPROFILE");
- if (p) {
- return toForwardSlash(wCharToUtf8(p));
- }
- p = _wgetenv(L"HOMEDRIVE");
- if (p) {
- std::wstring homeDir = p;
- p = _wgetenv(L"HOMEPATH");
- if (p) {
- homeDir += p;
- return toForwardSlash(wCharToUtf8(homeDir));
- }
- }
- return A2STR::NIL;
- }
- #endif // __MINGW32__
// Returns the value of the environment variable named
// |environmentVariable| when it is set and starts with '/'; otherwise
// returns |fallbackDirectory|.
std::string getXDGDir(const std::string& environmentVariable,
                      const std::string& fallbackDirectory)
{
  const char* value = getenv(environmentVariable.c_str());
  const bool usable = value && value[0] == '/';
  if(!usable) {
    return fallbackDirectory;
  }
  return std::string(value);
}
- std::string getConfigFile() {
- std::string filename = getHomeDir() + "/.aria2/aria2.conf";
- if (!File(filename).exists()) {
- filename = getXDGDir("XDG_CONFIG_HOME", getHomeDir()+"/.config") +
- "/aria2/aria2.conf";
- }
- return filename;
- }
- std::string getDHTFile(bool ipv6) {
- std::string filename = getHomeDir() + (ipv6 ? "/.aria2/dht6.dat" : "/.aria2/dht.dat");
- if (!File(filename).exists()) {
- filename = getXDGDir("XDG_CACHE_HOME", getHomeDir()+"/.cache") +
- (ipv6 ? "/aria2/dht6.dat" : "/aria2/dht.dat");
- }
- return filename;
- }
- int64_t getRealSize(const std::string& sizeWithUnit)
- {
- std::string::size_type p = sizeWithUnit.find_first_of("KMkm");
- std::string size;
- int32_t mult = 1;
- if(p == std::string::npos) {
- size = sizeWithUnit;
- } else {
- switch(sizeWithUnit[p]) {
- case 'K':
- case 'k':
- mult = 1_k;
- break;
- case 'M':
- case 'm':
- mult = 1_m;
- break;
- }
- size.assign(sizeWithUnit.begin(), sizeWithUnit.begin()+p);
- }
- int64_t v;
- if(!parseLLIntNoThrow(v, size) || v < 0) {
- throw DL_ABORT_EX(fmt("Bad or negative value detected: %s",
- sizeWithUnit.c_str()));
- }
- if(INT64_MAX/mult < v) {
- throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE,
- "overflow/underflow"));
- }
- return v*mult;
- }
- std::string abbrevSize(int64_t size)
- {
- static const char* UNITS[] = { "", "Ki", "Mi", "Gi" };
- int64_t t = size;
- size_t uidx = 0;
- int r = 0;
- while(t >= static_cast<int64_t>(1_k) &&
- uidx + 1 < sizeof(UNITS) / sizeof(UNITS[0])) {
- lldiv_t d = lldiv(t, 1_k);
- t = d.quot;
- r = d.rem;
- ++uidx;
- }
- if(uidx+1 < sizeof(UNITS)/sizeof(UNITS[0]) && t >= 922) {
- ++uidx;
- r = t;
- t = 0;
- }
- std::string res;
- res += itos(t, true);
- if(t < 10 && uidx > 0) {
- res += ".";
- res += itos(r * 10 / 1_k);
- }
- res += UNITS[uidx];
- return res;
- }
- void sleep(long seconds) {
- #if defined(HAVE_WINSOCK2_H)
- ::Sleep(seconds * 1000);
- #elif HAVE_SLEEP
- ::sleep(seconds);
- #elif defined(HAVE_USLEEP)
- ::usleep(seconds * 1000000);
- #else
- # error no sleep function is available (nanosleep?)
- #endif
- }
- void usleep(long microseconds) {
- #ifdef HAVE_USLEEP
- ::usleep(microseconds);
- #elif defined(HAVE_WINSOCK2_H)
- LARGE_INTEGER current, freq, end;
- static enum {GET_FREQUENCY, GET_MICROSECONDS, SKIP_MICROSECONDS} state = GET_FREQUENCY;
- if (state == GET_FREQUENCY) {
- if (QueryPerformanceFrequency(&freq))
- state = GET_MICROSECONDS;
- else
- state = SKIP_MICROSECONDS;
- }
- long msec = microseconds / 1000;
- microseconds %= 1000;
- if (state == GET_MICROSECONDS && microseconds) {
- QueryPerformanceCounter(&end);
- end.QuadPart += (freq.QuadPart * microseconds) / 1000000;
- while (QueryPerformanceCounter(¤t) && (current.QuadPart <= end.QuadPart))
- /* noop */ ;
- }
- if (msec)
- Sleep(msec);
- #else
- #error no usleep function is available (nanosleep?)
- #endif
- }
- void mkdirs(const std::string& dirpath)
- {
- File dir(dirpath);
- if(!dir.mkdirs()) {
- int errNum = errno;
- if(!dir.isDir()) {
- throw DL_ABORT_EX3(errNum, fmt(EX_MAKE_DIR, dir.getPath().c_str(),
- safeStrerror(errNum).c_str()),
- error_code::DIR_CREATE_ERROR);
- }
- }
- }
- void convertBitfield(BitfieldMan* dest, const BitfieldMan* src)
- {
- size_t numBlock = dest->countBlock();
- for(size_t index = 0; index < numBlock; ++index) {
- if(src->isBitSetOffsetRange((int64_t)index*dest->getBlockLength(),
- dest->getBlockLength())) {
- dest->setBit(index);
- }
- }
- }
- std::string toString(const std::shared_ptr<BinaryStream>& binaryStream)
- {
- std::stringstream strm;
- char data[2048];
- while(1) {
- int32_t dataLength = binaryStream->readData
- (reinterpret_cast<unsigned char*>(data), sizeof(data), strm.tellp());
- strm.write(data, dataLength);
- if(dataLength == 0) {
- break;
- }
- }
- return strm.str();
- }
#ifdef HAVE_POSIX_MEMALIGN
/**
 * Allocates |size| bytes aligned to |alignment| with posix_memalign()
 * and returns the buffer.  Throws (via FATAL_EXCEPTION) carrying the
 * error text when the allocation fails.
 *
 * In linux 2.6, alignment and size should be a multiple of 512.
 */
void* allocateAlignedMemory(size_t alignment, size_t size)
{
  void* buffer;
  const int rc = posix_memalign(&buffer, alignment, size);
  if(rc == 0) {
    return buffer;
  }
  throw FATAL_EXCEPTION(fmt("Error in posix_memalign: %s",
                            util::safeStrerror(rc).c_str()));
}
#endif // HAVE_POSIX_MEMALIGN
- std::pair<std::string, uint16_t>
- getNumericNameInfo(const struct sockaddr* sockaddr, socklen_t len)
- {
- char host[NI_MAXHOST];
- char service[NI_MAXSERV];
- int s = getnameinfo(sockaddr, len, host, NI_MAXHOST, service, NI_MAXSERV,
- NI_NUMERICHOST|NI_NUMERICSERV);
- if(s != 0) {
- throw DL_ABORT_EX(fmt("Failed to get hostname and port. cause: %s",
- gai_strerror(s)));
- }
- return std::pair<std::string, uint16_t>(host, atoi(service)); // TODO
- }
// Returns a copy of |src| in which the HTML-significant characters are
// replaced by character references:
//
//   '<' -> "&lt;"   '>' -> "&gt;"   '&' -> "&amp;"
//   '\'' -> "&#39;"   '"' -> "&quot;"
//
// All other characters are copied through unchanged.
std::string htmlEscape(const std::string& src)
{
  std::string dest;
  dest.reserve(src.size());
  // |j| marks the start of the pending run of characters that need no
  // escaping; the run is flushed whenever an escaped character is hit.
  auto j = std::begin(src);
  for(auto i = std::begin(src); i != std::end(src); ++i) {
    const char* repl;
    switch(*i) {
    case '<':
      repl = "&lt;";
      break;
    case '>':
      repl = "&gt;";
      break;
    case '&':
      repl = "&amp;";
      break;
    case '\'':
      repl = "&#39;";
      break;
    case '"':
      repl = "&quot;";
      break;
    default:
      continue;
    }
    dest.append(j, i);
    j = i + 1;
    dest += repl;
  }
  dest.append(j, std::end(src));
  return dest;
}
- std::pair<size_t, std::string>
- parseIndexPath(const std::string& line)
- {
- auto p = divide(std::begin(line), std::end(line), '=');
- uint32_t index;
- if(!parseUIntNoThrow(index, std::string(p.first.first, p.first.second))) {
- throw DL_ABORT_EX("Bad path index");
- }
- if(p.second.first == p.second.second) {
- throw DL_ABORT_EX(fmt("Path with index=%u is empty.", index));
- }
- return std::make_pair(index, std::string(p.second.first, p.second.second));
- }
- std::vector<std::pair<size_t, std::string> > createIndexPaths(std::istream& i)
- {
- std::vector<std::pair<size_t, std::string> > indexPaths;
- std::string line;
- while(getline(i, line)) {
- indexPaths.push_back(parseIndexPath(line));
- }
- return indexPaths;
- }
- void generateRandomData(unsigned char* data, size_t length)
- {
- const auto& rd = SimpleRandomizer::getInstance();
- return rd->getRandomBytes(data, length);
- }
- bool saveAs
- (const std::string& filename, const std::string& data, bool overwrite)
- {
- if(!overwrite && File(filename).exists()) {
- return false;
- }
- std::string tempFilename = filename;
- tempFilename += "__temp";
- {
- BufferedFile fp(tempFilename.c_str(), BufferedFile::WRITE);
- if(!fp) {
- return false;
- }
- if(fp.write(data.data(), data.size()) != data.size()) {
- return false;
- }
- if(fp.close() == EOF) {
- return false;
- }
- }
- return File(tempFilename).renameTo(filename);
- }
// Joins |dir| and |relPath| with a '/' separator.  An empty |dir| yields
// "./<relPath>"; a |dir| of exactly "/" yields "/<relPath>" without a
// doubled separator.  On MinGW builds every backslash in the result is
// turned into a forward slash.
std::string applyDir(const std::string& dir, const std::string& relPath)
{
  std::string joined;
  if(dir.empty()) {
    joined = "./";
  }
  else {
    joined = dir;
    if(dir != "/") {
      joined += "/";
    }
  }
  joined += relPath;
#ifdef __MINGW32__
  for(auto& ch : joined) {
    if(ch == '\\') {
      ch = '/';
    }
  }
#endif // __MINGW32__
  return joined;
}
- std::string fixTaintedBasename(const std::string& src)
- {
- return escapePath(replace(src, "/", "%2F"));
- }
- void generateRandomKey(unsigned char* key)
- {
- unsigned char bytes[40];
- generateRandomData(bytes, sizeof(bytes));
- message_digest::digest(key, 20, MessageDigest::sha1().get(), bytes,
- sizeof(bytes));
- }
- // Returns true is given numeric ipv4addr is in Private Address Space.
- //
- // From Section.3 RFC1918
- // 10.0.0.0 - 10.255.255.255 (10/8 prefix)
- // 172.16.0.0 - 172.31.255.255 (172.16/12 prefix)
- // 192.168.0.0 - 192.168.255.255 (192.168/16 prefix)
- bool inPrivateAddress(const std::string& ipv4addr)
- {
- if(util::startsWith(ipv4addr, "10.") ||
- util::startsWith(ipv4addr, "192.168.")) {
- return true;
- }
- if(util::startsWith(ipv4addr, "172.")) {
- for(int i = 16; i <= 31; ++i) {
- std::string t(fmt("%d.", i));
- if(util::startsWith(ipv4addr.begin()+4, ipv4addr.end(),
- t.begin(), t.end())) {
- return true;
- }
- }
- }
- return false;
- }
- bool detectDirTraversal(const std::string& s)
- {
- if(s.empty()) {
- return false;
- }
- for (auto c : s) {
- unsigned char ch = c;
- if (in(ch, 0x00u, 0x1fu) || ch == 0x7fu) {
- return true;
- }
- }
- return s == "." || s == ".." || s[0] == '/' ||
- util::startsWith(s, "./") ||
- util::startsWith(s, "../") ||
- s.find("/../") != std::string::npos ||
- s.find("/./") != std::string::npos ||
- s[s.size()-1] == '/' ||
- util::endsWith(s, "/.") ||
- util::endsWith(s, "/..");
- }
- std::string escapePath(const std::string& s)
- {
- // We don't escape '/' because we use it as a path separator.
- #ifdef __MINGW32__
- static const char WIN_INVALID_PATH_CHARS[] =
- { '"', '*', ':', '<', '>', '?', '\\', '|' };
- #endif // __MINGW32__
- std::string d;
- for(auto cc: s) {
- unsigned char c = cc;
- if(in(c, 0x00u, 0x1fu) || c == 0x7fu
- #ifdef __MINGW32__
- || std::find(std::begin(WIN_INVALID_PATH_CHARS),
- std::end(WIN_INVALID_PATH_CHARS),
- c) != std::end(WIN_INVALID_PATH_CHARS)
- #endif // __MINGW32__
- ){
- d += fmt("%%%02X", c);
- } else {
- d += c;
- }
- }
- return d;
- }
- bool inSameCidrBlock
- (const std::string& ip1, const std::string& ip2, size_t bits)
- {
- unsigned char s1[16], s2[16];
- size_t len1, len2;
- if((len1 = net::getBinAddr(s1, ip1)) == 0 ||
- (len2 = net::getBinAddr(s2, ip2)) == 0 ||
- len1 != len2) {
- return false;
- }
- if(bits == 0) {
- return true;
- }
- if(bits > 8*len1) {
- bits = 8*len1;
- }
- int last = (bits-1)/8;
- for(int i = 0; i < last; ++i) {
- if(s1[i] != s2[i]) {
- return false;
- }
- }
- unsigned char mask = bitfield::lastByteMask(bits);
- return (s1[last] & mask) == (s2[last] & mask);
- }
- namespace {
- void executeHook
- (const std::string& command,
- a2_gid_t gid,
- size_t numFiles,
- const std::string& firstFilename)
- {
- const std::string gidStr = GroupId::toHex(gid);
- const std::string numFilesStr = util::uitos(numFiles);
- #ifndef __MINGW32__
- A2_LOG_INFO(fmt("Executing user command: %s %s %s %s",
- command.c_str(),
- gidStr.c_str(),
- numFilesStr.c_str(),
- firstFilename.c_str()));
- pid_t cpid = fork();
- if (cpid == 0) {
- // child!
- execlp(command.c_str(),
- command.c_str(),
- gidStr.c_str(),
- numFilesStr.c_str(),
- firstFilename.c_str(),
- reinterpret_cast<char*>(0));
- perror(("Could not execute user command: "+command).c_str());
- _exit(EXIT_FAILURE);
- return;
- }
- if(cpid == -1) {
- A2_LOG_ERROR("fork() failed. Cannot execute user command.");
- }
- return;
- #else // __MINGW32__
- PROCESS_INFORMATION pi;
- STARTUPINFOW si;
- memset(&si, 0, sizeof (si));
- si.cb = sizeof(STARTUPINFO);
- memset(&pi, 0, sizeof (pi));
- bool batch = util::iendsWith(command, ".bat");
- std::string cmdline;
- std::string cmdexe;
- // XXX batch handling, in particular quoting, correct?
- if(batch) {
- const char* p = getenv("windir");
- if(p) {
- cmdexe = p;
- cmdexe += "\\system32\\cmd.exe";
- } else {
- A2_LOG_INFO("Failed to get windir environment variable."
- " Executing batch file will fail.");
- // TODO Might be useless.
- cmdexe = "cmd.exe";
- }
- cmdline += "/C \"";
- }
- cmdline += "\"";
- cmdline += command;
- cmdline += "\"";
- cmdline += " ";
- cmdline += gidStr;
- cmdline += " ";
- cmdline += numFilesStr;
- cmdline += " \"";
- cmdline += firstFilename;
- cmdline += "\"";
- if(batch) {
- cmdline += "\"";
- }
- int cmdlineLen = utf8ToWChar(nullptr, 0, cmdline.c_str());
- assert(cmdlineLen > 0);
- auto wcharCmdline = make_unique<wchar_t[]>(cmdlineLen);
- cmdlineLen = utf8ToWChar(wcharCmdline.get(), cmdlineLen, cmdline.c_str());
- assert(cmdlineLen > 0);
- A2_LOG_INFO(fmt("Executing user command: %s", cmdline.c_str()));
- DWORD rc = CreateProcessW(batch ? utf8ToWChar(cmdexe).c_str() : nullptr,
- wcharCmdline.get(),
- nullptr,
- nullptr,
- true,
- 0,
- nullptr,
- 0,
- &si,
- &pi);
- if(!rc) {
- A2_LOG_ERROR("CreateProcess() failed. Cannot execute user command.");
- }
- return;
- #endif
- }
- } // namespace
- void executeHookByOptName
- (const std::shared_ptr<RequestGroup>& group, const Option* option,
- PrefPtr pref)
- {
- executeHookByOptName(group.get(), option, pref);
- }
- void executeHookByOptName
- (const RequestGroup* group, const Option* option, PrefPtr pref)
- {
- const std::string& cmd = option->get(pref);
- if(!cmd.empty()) {
- const std::shared_ptr<DownloadContext> dctx = group->getDownloadContext();
- std::string firstFilename;
- size_t numFiles = 0;
- if(!group->inMemoryDownload()) {
- std::shared_ptr<FileEntry> file = dctx->getFirstRequestedFileEntry();
- if(file) {
- firstFilename = file->getPath();
- }
- numFiles = dctx->countRequestedFileEntry();
- }
- executeHook(cmd, group->getGID(), numFiles, firstFilename);
- }
- }
- std::string createSafePath
- (const std::string& dir, const std::string& filename)
- {
- return util::applyDir(dir, util::isUtf8(filename) ?
- util::fixTaintedBasename(filename) :
- util::escapePath(util::percentEncode(filename))
- );
- }
- std::string createSafePath(const std::string& filename)
- {
- return util::isUtf8(filename) ?
- util::fixTaintedBasename(filename) :
- util::escapePath(util::percentEncode(filename));
- }
- std::string encodeNonUtf8(const std::string& s)
- {
- return util::isUtf8(s)?s:util::percentEncode(s);
- }
- std::string makeString(const char* str)
- {
- if(!str) {
- return A2STR::NIL;
- }
- return str;
- }
- std::string safeStrerror(int errNum)
- {
- return makeString(strerror(errNum));
- }
- bool noProxyDomainMatch
- (const std::string& hostname,
- const std::string& domain)
- {
- if(!domain.empty() && domain[0] == '.' && !util::isNumericHost(hostname)) {
- return util::endsWith(hostname, domain);
- }
- return hostname == domain;
- }
- bool tlsHostnameMatch(const std::string& pattern, const std::string& hostname)
- {
- std::string::const_iterator ptWildcard = std::find(pattern.begin(),
- pattern.end(),
- '*');
- if(ptWildcard == pattern.end()) {
- return strieq(pattern.begin(), pattern.end(),
- hostname.begin(), hostname.end());
- }
- std::string::const_iterator ptLeftLabelEnd = std::find(pattern.begin(),
- pattern.end(),
- '.');
- bool wildcardEnabled = true;
- // Do case-insensitive match. At least 2 dots are required to enable
- // wildcard match. Also wildcard must be in the left-most label.
- // Don't attempt to match a presented identifier where the wildcard
- // character is embedded within an A-label.
- if(ptLeftLabelEnd == pattern.end() ||
- std::find(ptLeftLabelEnd+1, pattern.end(), '.') == pattern.end() ||
- ptLeftLabelEnd < ptWildcard ||
- istartsWith(pattern, "xn--")) {
- wildcardEnabled = false;
- }
- if(!wildcardEnabled) {
- return strieq(pattern.begin(), pattern.end(),
- hostname.begin(), hostname.end());
- }
- std::string::const_iterator hnLeftLabelEnd = std::find(hostname.begin(),
- hostname.end(),
- '.');
- if(!strieq(ptLeftLabelEnd, pattern.end(), hnLeftLabelEnd, hostname.end())) {
- return false;
- }
- // Perform wildcard match. Here '*' must match at least one
- // character.
- if(hnLeftLabelEnd - hostname.begin() < ptLeftLabelEnd - pattern.begin()) {
- return false;
- }
- return istartsWith(hostname.begin(), hnLeftLabelEnd, pattern.begin(),
- ptWildcard) &&
- iendsWith(hostname.begin(), hnLeftLabelEnd, ptWildcard + 1,
- ptLeftLabelEnd);
- }
- bool strieq(const std::string& a, const char* b)
- {
- return strieq(a.begin(), a.end(), b);
- }
- bool strieq(const std::string& a, const std::string& b)
- {
- return strieq(a.begin(), a.end(), b.begin(), b.end());
- }
- bool startsWith(const std::string& a, const char* b)
- {
- return startsWith(a.begin(), a.end(), b);
- }
- bool startsWith(const std::string& a, const std::string& b)
- {
- return startsWith(a.begin(), a.end(), b.begin(), b.end());
- }
- bool istartsWith(const std::string& a, const char* b)
- {
- return istartsWith(a.begin(), a.end(), b);
- }
- bool endsWith(const std::string& a, const char* b)
- {
- return endsWith(a.begin(), a.end(), b, b+strlen(b));
- }
- bool endsWith(const std::string& a, const std::string& b)
- {
- return endsWith(a.begin(), a.end(), b.begin(), b.end());
- }
- bool iendsWith(const std::string& a, const char* b)
- {
- return iendsWith(a.begin(), a.end(), b, b+strlen(b));
- }
- bool iendsWith(const std::string& a, const std::string& b)
- {
- return iendsWith(a.begin(), a.end(), b.begin(), b.end());
- }
// Strict-weak-ordering predicate for C strings: true when strcmp()
// orders |a| before |b|.
bool strless(const char* a, const char* b)
{
  const int order = strcmp(a, b);
  return order < 0;
}
#ifdef ENABLE_SSL
// Maps the option string |ver| to a TLSVersion value.  A string that
// matches none of the known version constants maps to TLS_PROTO_TLS10.
TLSVersion toTLSVersion(const std::string& ver)
{
  TLSVersion proto = TLS_PROTO_TLS10;
  if(ver == A2_V_SSL3) {
    proto = TLS_PROTO_SSL3;
  }
  else if(ver == A2_V_TLS10) {
    proto = TLS_PROTO_TLS10;
  }
  else if(ver == A2_V_TLS11) {
    proto = TLS_PROTO_TLS11;
  }
  else if(ver == A2_V_TLS12) {
    proto = TLS_PROTO_TLS12;
  }
  return proto;
}
#endif // ENABLE_SSL
- } // namespace util
- } // namespace aria2
|