12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
7177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005 |
- /* <!-- copyright */
- /*
- * aria2 - The high speed download utility
- *
- * Copyright (C) 2006 Tatsuhiro Tsujikawa
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- *
- * In addition, as a special exception, the copyright holders give
- * permission to link the code of portions of this program with the
- * OpenSSL library under certain conditions as described in each
- * individual source file, and distribute linked combinations
- * including the two.
- * You must obey the GNU General Public License in all respects
- * for all of the code used other than OpenSSL. If you modify
- * file(s) with this exception, you may extend this exception to your
- * version of the file(s), but you are not obligated to do so. If you
- * do not wish to do so, delete this exception statement from your
- * version. If you delete this exception statement from all source
- * files in the program, then also delete it here.
- */
- /* copyright --> */
- #include "util.h"
- #ifdef __sun
- // For opensolaris, just include signal.h which includes sys/signal.h
- #ifdef HAVE_SIGNAL_H
- # include <signal.h>
- #endif // HAVE_SIGNAL_H
- #else // !__sun
- #ifdef HAVE_SYS_SIGNAL_H
- # include <sys/signal.h>
- #endif // HAVE_SYS_SIGNAL_H
- #ifdef HAVE_SIGNAL_H
- # include <signal.h>
- #endif // HAVE_SIGNAL_H
- #endif // !__sun
- #include <sys/types.h>
- #ifdef HAVE_PWD_H
- # include <pwd.h>
- #endif // HAVE_PWD_H
- #include <cerrno>
- #include <cassert>
- #include <cstring>
- #include <cstdio>
- #include <cstdlib>
- #include <sstream>
- #include <ostream>
- #include <algorithm>
- #include <fstream>
- #include <iomanip>
- #include "SimpleRandomizer.h"
- #include "File.h"
- #include "Randomizer.h"
- #include "a2netcompat.h"
- #include "BitfieldMan.h"
- #include "DefaultDiskWriter.h"
- #include "FatalException.h"
- #include "FileEntry.h"
- #include "A2STR.h"
- #include "array_fun.h"
- #include "bitfield.h"
- #include "DownloadHandlerConstants.h"
- #include "RequestGroup.h"
- #include "LogFactory.h"
- #include "Logger.h"
- #include "Option.h"
- #include "DownloadContext.h"
- #include "BufferedFile.h"
- #include "SocketCore.h"
- #include "Lock.h"
- #include "MessageDigest.h"
- #include "message_digest_helper.h"
- // For libc6 which doesn't define ULLONG_MAX properly because of broken limits.h
- #ifndef ULLONG_MAX
- # define ULLONG_MAX 18446744073709551615ULL
- #endif // ULLONG_MAX
- namespace aria2 {
- #ifdef __MINGW32__
- namespace {
- int utf8ToWChar(wchar_t* out, size_t outLength, const char* src)
- {
- return MultiByteToWideChar(CP_UTF8, 0, src, -1, out, outLength);
- }
- } // namespace
- namespace {
- int wCharToUtf8(char* out, size_t outLength, const wchar_t* src)
- {
- return WideCharToMultiByte(CP_UTF8, 0, src, -1, out, outLength,
- nullptr, nullptr);
- }
- } // namespace
- std::wstring utf8ToWChar(const char* src)
- {
- int len = utf8ToWChar(nullptr, 0, src);
- if(len <= 0) {
- abort();
- }
- auto buf = make_unique<wchar_t[]>((size_t)len);
- len = utf8ToWChar(buf.get(), len, src);
- if(len <= 0) {
- abort();
- } else {
- return buf.get();
- }
- }
// Convenience overload: converts the UTF-8 std::string |src| by
// forwarding its C string to utf8ToWChar(const char*).
std::wstring utf8ToWChar(const std::string& src)
{
  const char* const raw = src.c_str();
  return utf8ToWChar(raw);
}
- std::string wCharToUtf8(const std::wstring& wsrc)
- {
- int len = wCharToUtf8(nullptr, 0, wsrc.c_str());
- if(len <= 0) {
- abort();
- }
- auto buf = make_unique<char[]>((size_t)len);
- len = wCharToUtf8(buf.get(), len, wsrc.c_str());
- if(len <= 0) {
- abort();
- } else {
- return buf.get();
- }
- }
- #endif // __MINGW32__
- namespace util {
// Whitespace set CR, LF, TAB and space, NUL-terminated.
// NOTE(review): presumably the default |chars| argument of strip();
// the default itself is declared outside this file -- confirm.
const char DEFAULT_STRIP_CHARSET[] = { '\r', '\n', '\t', ' ', '\0' };
- std::string strip(const std::string& str, const char* chars)
- {
- std::pair<std::string::const_iterator,
- std::string::const_iterator> p =
- stripIter(str.begin(), str.end(), chars);
- return std::string(p.first, p.second);
- }
- std::string itos(int64_t value, bool comma)
- {
- bool flag = false;
- std::string str;
- if(value < 0) {
- if(value == INT64_MIN) {
- if(comma) {
- str = "-9,223,372,036,854,775,808";
- } else {
- str = "-9223372036854775808";
- }
- return str;
- }
- flag = true;
- value = -value;
- }
- str = uitos(value, comma);
- if(flag) {
- str.insert(str.begin(), '-');
- }
- return str;
- }
// Returns tv1 - tv2 in microseconds, or 0 when tv1 is earlier than
// tv2.
int64_t difftv(struct timeval tv1, struct timeval tv2) {
  const bool tv1Earlier =
    tv1.tv_sec < tv2.tv_sec ||
    (tv1.tv_sec == tv2.tv_sec && tv1.tv_usec < tv2.tv_usec);
  if(tv1Earlier) {
    return 0;
  }
  const int64_t wholeSeconds = static_cast<int64_t>(tv1.tv_sec-tv2.tv_sec);
  return wholeSeconds*1000000+tv1.tv_usec-tv2.tv_usec;
}
// Returns the difference of the seconds fields (tv1 - tv2), ignoring
// microseconds, or 0 when tv1.tv_sec is smaller than tv2.tv_sec.
int32_t difftvsec(struct timeval tv1, struct timeval tv2) {
  return tv1.tv_sec < tv2.tv_sec ? 0 : tv1.tv_sec-tv2.tv_sec;
}
// Returns a copy of |target| in which every non-overlapping
// occurrence of |oldstr|, scanned left to right, is replaced by
// |newstr|. If |target| or |oldstr| is empty, |target| is returned
// unchanged.
std::string replace(const std::string& target, const std::string& oldstr, const std::string& newstr) {
  if(target.empty() || oldstr.empty()) {
    return target;
  }
  std::string out;
  std::string::size_type cursor = 0;
  for(std::string::size_type hit = target.find(oldstr);
      hit != std::string::npos;
      hit = target.find(oldstr, cursor)) {
    // Copy the untouched text before the match, then the replacement.
    out.append(target, cursor, hit-cursor);
    out.append(newstr);
    cursor = hit+oldstr.size();
  }
  // Copy whatever follows the last match.
  out.append(target, cursor, std::string::npos);
  return out;
}
// Returns true if |c| is an ASCII letter (A-Z or a-z).
bool isAlpha(const char c)
{
  const bool upper = c >= 'A' && c <= 'Z';
  const bool lower = c >= 'a' && c <= 'z';
  return upper || lower;
}
// Returns true if |c| is an ASCII decimal digit (0-9).
bool isDigit(const char c)
{
  return c >= '0' && c <= '9';
}
- bool isHexDigit(const char c)
- {
- return isDigit(c) || ('A' <= c && c <= 'F') || ('a' <= c && c <= 'f');
- }
- bool isHexDigit(const std::string& s)
- {
- for (const auto& c : s) {
- if(!isHexDigit(c)) {
- return false;
- }
- }
- return true;
- }
// Returns true if |c| is one of the RFC 3986 reserved characters
// (gen-delims and sub-delims) listed below.
bool inRFC3986ReservedChars(const char c)
{
  switch(c) {
  // gen-delims
  case ':': case '/': case '?': case '#': case '[': case ']': case '@':
  // sub-delims
  case '!': case '$': case '&': case '\'': case '(': case ')':
  case '*': case '+': case ',': case ';': case '=':
    return true;
  default:
    return false;
  }
}
- bool inRFC3986UnreservedChars(const char c)
- {
- static const char unreserved[] = { '-', '.', '_', '~' };
- return isAlpha(c) || isDigit(c) ||
- std::find(std::begin(unreserved), std::end(unreserved), c)
- != std::end(unreserved);
- }
- bool inRFC2978MIMECharset(const char c)
- {
- static const char chars[] = {
- '!', '#', '$', '%', '&',
- '\'', '+', '-', '^', '_',
- '`', '{', '}', '~'
- };
- return isAlpha(c) || isDigit(c) ||
- std::find(std::begin(chars), std::end(chars), c) != std::end(chars);
- }
- bool inRFC2616HttpToken(const char c)
- {
- static const char chars[] = {
- '!', '#', '$', '%', '&', '\'', '*', '+', '-', '.',
- '^', '_', '`', '|', '~'
- };
- return isAlpha(c) || isDigit(c) ||
- std::find(std::begin(chars), std::end(chars), c) != std::end(chars);
- }
- bool inRFC5987AttrChar(const char c)
- {
- return inRFC2616HttpToken(c) && c != '*' && c != '\'' && c != '%';
- }
// Returns true if |c| is accepted as an ISO/IEC 8859-1 character:
// 0x20-0x7e or 0xa0-0xff. Bytes below 0x20 and in 0x7f-0x9f are
// rejected.
bool isIso8859p1(unsigned char c)
{
  if(c >= 0xa0u) {
    return true;
  }
  return c >= 0x20u && c <= 0x7eu;
}
// Returns true if |c| is a space or a horizontal tab.
bool isLws(const char c)
{
  switch(c) {
  case ' ':
  case '\t':
    return true;
  default:
    return false;
  }
}
// Returns true if |c| is a carriage return or a line feed.
bool isCRLF(const char c)
{
  switch(c) {
  case '\r':
  case '\n':
    return true;
  default:
    return false;
  }
}
- namespace {
- bool isUtf8Tail(unsigned char ch)
- {
- return in(ch, 0x80u, 0xbfu);
- }
// Returns true if |c| can be emitted verbatim by percentEncodeMini():
// it must lie strictly between 0x20 and 0x7f and must not be '"',
// '<' or '>'.
bool inPercentEncodeMini(const unsigned char c)
{
  if(c <= 0x20 || c >= 0x7fu) {
    return false;
  }
  // Chromium escapes following characters. Firefox4 escapes more.
  switch(c) {
  case '"':
  case '<':
  case '>':
    return false;
  default:
    return true;
  }
}
- } // namespace
- bool isUtf8(const std::string& str)
- {
- for(std::string::const_iterator s = str.begin(), eos = str.end(); s != eos;
- ++s) {
- unsigned char firstChar = *s;
- // See ABNF in http://tools.ietf.org/search/rfc3629#section-4
- if(in(firstChar, 0x20u, 0x7eu) ||
- firstChar == 0x08u || // \b
- firstChar == 0x09u || // \t
- firstChar == 0x0au || // \n
- firstChar == 0x0cu || // \f
- firstChar == 0x0du // \r
- ) {
- // UTF8-1 (without ctrl chars)
- } else if(in(firstChar, 0xc2u, 0xdfu)) {
- // UTF8-2
- if(++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xe0u == firstChar) {
- // UTF8-3
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0xa0u, 0xbfu) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(in(firstChar, 0xe1u, 0xecu) || in(firstChar, 0xeeu, 0xefu)) {
- // UTF8-3
- if(++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xedu == firstChar) {
- // UTF8-3
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0x80u, 0x9fu) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xf0u == firstChar) {
- // UTF8-4
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0x90u, 0xbfu) ||
- ++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(in(firstChar, 0xf1u, 0xf3u)) {
- // UTF8-4
- if(++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else if(0xf4u == firstChar) {
- // UTF8-4
- if(++s == eos || !in(static_cast<unsigned char>(*s), 0x80u, 0x8fu) ||
- ++s == eos || !isUtf8Tail(*s) ||
- ++s == eos || !isUtf8Tail(*s)) {
- return false;
- }
- } else {
- return false;
- }
- }
- return true;
- }
- std::string percentEncode(const unsigned char* target, size_t len)
- {
- std::string dest;
- for(size_t i = 0; i < len; ++i) {
- if(inRFC3986UnreservedChars(target[i])) {
- dest += target[i];
- } else {
- dest.append(fmt("%%%02X", target[i]));
- }
- }
- return dest;
- }
- std::string percentEncode(const std::string& target)
- {
- if (std::find_if_not(target.begin(), target.end(),
- inRFC3986UnreservedChars) == target.end()) {
- return target;
- }
- return percentEncode(reinterpret_cast<const unsigned char*>(target.c_str()),
- target.size());
- }
- std::string percentEncodeMini(const std::string& src)
- {
- if (std::find_if_not(src.begin(), src.end(), inPercentEncodeMini) ==
- src.end()) {
- return src;
- }
- std::string result;
- for (auto c: src) {
- if(!inPercentEncodeMini(c)) {
- result += fmt("%%%02X", static_cast<unsigned char>(c));
- } else {
- result += c;
- }
- }
- return result;
- }
- std::string torrentPercentEncode(const unsigned char* target, size_t len) {
- std::string dest;
- for(size_t i = 0; i < len; ++i) {
- if(isAlpha(target[i]) || isDigit(target[i])) {
- dest += target[i];
- } else {
- dest.append(fmt("%%%02X", target[i]));
- }
- }
- return dest;
- }
- std::string torrentPercentEncode(const std::string& target)
- {
- return torrentPercentEncode
- (reinterpret_cast<const unsigned char*>(target.c_str()), target.size());
- }
- std::string percentDecode
- (std::string::const_iterator first, std::string::const_iterator last)
- {
- std::string result;
- for(; first != last; ++first) {
- if(*first == '%') {
- if(first+1 != last && first+2 != last &&
- isHexDigit(*(first+1)) && isHexDigit(*(first+2))) {
- result += hexCharToUInt(*(first+1))*16+hexCharToUInt(*(first+2));
- first += 2;
- } else {
- result += *first;
- }
- } else {
- result += *first;
- }
- }
- return result;
- }
// Returns the lower-case hexadecimal representation of the |len|
// bytes at |src|; the result has exactly 2*len characters.
std::string toHex(const unsigned char* src, size_t len) {
  static const char digits[] = "0123456789abcdef";
  std::string out;
  out.reserve(len*2);
  for(size_t i = 0; i < len; ++i) {
    out += digits[src[i] >> 4];     // high nibble
    out += digits[src[i] & 0x0fu];  // low nibble
  }
  return out;
}
- std::string toHex(const char* src, size_t len)
- {
- return toHex(reinterpret_cast<const unsigned char*>(src), len);
- }
- std::string toHex(const std::string& src)
- {
- return toHex(reinterpret_cast<const unsigned char*>(src.c_str()), src.size());
- }
// Returns the numeric value (0-15) of the hexadecimal digit |ch|,
// accepting both letter cases, or 255 if |ch| is not a hex digit.
unsigned int hexCharToUInt(unsigned char ch)
{
  if(ch >= '0' && ch <= '9') {
    return ch-'0';
  }
  if(ch >= 'a' && ch <= 'f') {
    return ch-'a'+10;
  }
  if(ch >= 'A' && ch <= 'F') {
    return ch-'A'+10;
  }
  return 255;
}
- std::string secfmt(time_t sec) {
- time_t tsec = sec;
- std::string str;
- if(sec >= 3600) {
- str = fmt("%" PRId64 "h", static_cast<int64_t>(sec/3600));
- sec %= 3600;
- }
- if(sec >= 60) {
- str += fmt("%dm", static_cast<int>(sec/60));
- sec %= 60;
- }
- if(sec || tsec == 0) {
- str += fmt("%ds", static_cast<int>(sec));
- }
- return str;
- }
- namespace {
// Parses |s| as an integer in |base| using the strtol-style function
// |f| and stores the converted value in |res|.
//
// Returns true only if at least one character was converted, |f| did
// not report ERANGE, and nothing but whitespace follows the number.
// Returns false for an empty string. Note that |res| is overwritten
// with whatever |f| returned even when the function returns false, so
// callers must not use it on failure.
template<typename T, typename F>
bool parseLong(T& res, F f, const std::string& s, int base)
{
  if(s.empty()) {
    return false;
  }
  const char* const begin = s.c_str();
  char* endptr;
  errno = 0;
  res = f(begin, &endptr, base);
  if(errno == ERANGE) {
    return false;
  }
  if(endptr == begin) {
    // No conversion was performed (e.g. whitespace-only input); do not
    // report the 0 returned by |f| as a successfully parsed number.
    return false;
  }
  if(*endptr != '\0') {
    for(const char* i = endptr, *eoi = begin+s.size(); i < eoi; ++i) {
      // isspace() has undefined behaviour for negative values other
      // than EOF, so the char must go through unsigned char first.
      if(!isspace(static_cast<unsigned char>(*i))) {
        return false;
      }
    }
  }
  return true;
}
- } // namespace
- bool parseIntNoThrow(int32_t& res, const std::string& s, int base)
- {
- long int t;
- if(parseLong(t, strtol, s, base) &&
- t >= std::numeric_limits<int32_t>::min() &&
- t <= std::numeric_limits<int32_t>::max()) {
- res = t;
- return true;
- } else {
- return false;
- }
- }
- bool parseUIntNoThrow(uint32_t& res, const std::string& s, int base)
- {
- long int t;
- if(parseLong(t, strtol, s, base) &&
- t >= 0 &&
- t <= std::numeric_limits<int32_t>::max()) {
- res = t;
- return true;
- } else {
- return false;
- }
- }
- bool parseLLIntNoThrow(int64_t& res, const std::string& s, int base)
- {
- long long int t;
- if(parseLong(t, strtoll, s, base) &&
- t >= std::numeric_limits<int64_t>::min() &&
- t <= std::numeric_limits<int64_t>::max()) {
- res = t;
- return true;
- } else {
- return false;
- }
- }
- void parseIntSegments(SegList<int>& sgl, const std::string& src)
- {
- for(std::string::const_iterator i = src.begin(), eoi = src.end(); i != eoi;) {
- std::string::const_iterator j = std::find(i, eoi, ',');
- if(j == i) {
- ++i;
- continue;
- }
- std::string::const_iterator p = std::find(i, j, '-');
- if(p == j) {
- int a;
- if(parseIntNoThrow(a, std::string(i, j))) {
- sgl.add(a, a+1);
- } else {
- throw DL_ABORT_EX(fmt("Bad range %s", std::string(i, j).c_str()));
- }
- } else if(p == i || p+1 == j) {
- throw DL_ABORT_EX(fmt(MSG_INCOMPLETE_RANGE, std::string(i, j).c_str()));
- } else {
- int a, b;
- if(parseIntNoThrow(a, std::string(i, p)) &&
- parseIntNoThrow(b, (std::string(p+1, j)))) {
- sgl.add(a, b+1);
- } else {
- throw DL_ABORT_EX(fmt("Bad range %s", std::string(i, j).c_str()));
- }
- }
- if(j == eoi) {
- break;
- }
- i = j+1;
- }
- }
- namespace {
- void computeHeadPieces
- (std::vector<size_t>& indexes,
- const std::vector<std::shared_ptr<FileEntry> >& fileEntries,
- size_t pieceLength,
- int64_t head)
- {
- if(head == 0) {
- return;
- }
- for (const auto& fi: fileEntries) {
- if(fi->getLength() == 0) {
- continue;
- }
- const size_t lastIndex = (fi->getOffset() +
- std::min(head, fi->getLength()) - 1
- ) / pieceLength;
- for(size_t idx = fi->getOffset() / pieceLength; idx <= lastIndex; ++idx) {
- indexes.push_back(idx);
- }
- }
- }
- } // namespace
- namespace {
- void computeTailPieces
- (std::vector<size_t>& indexes,
- const std::vector<std::shared_ptr<FileEntry> >& fileEntries,
- size_t pieceLength,
- int64_t tail)
- {
- if(tail == 0) {
- return;
- }
- for (const auto& fi: fileEntries) {
- if(fi->getLength() == 0) {
- continue;
- }
- int64_t endOffset = fi->getLastOffset();
- size_t fromIndex = (endOffset - 1 - (std::min(tail, fi->getLength()) - 1)) /
- pieceLength;
- const size_t toIndex = (endOffset - 1) / pieceLength;
- while (fromIndex <= toIndex) {
- indexes.push_back(fromIndex++);
- }
- }
- }
- } // namespace
- void parsePrioritizePieceRange
- (std::vector<size_t>& result, const std::string& src,
- const std::vector<std::shared_ptr<FileEntry> >& fileEntries,
- size_t pieceLength,
- int64_t defaultSize)
- {
- std::vector<size_t> indexes;
- std::vector<Scip> parts;
- splitIter(src.begin(), src.end(), std::back_inserter(parts), ',', true);
- for (const auto& i: parts) {
- if(util::streq(i.first, i.second, "head")) {
- computeHeadPieces(indexes, fileEntries, pieceLength, defaultSize);
- }
- else if(util::startsWith(i.first, i.second, "head=")) {
- std::string sizestr(i.first + 5, i.second);
- computeHeadPieces(indexes, fileEntries, pieceLength,
- std::max((int64_t)0, getRealSize(sizestr)));
- }
- else if(util::streq(i.first, i.second, "tail")) {
- computeTailPieces(indexes, fileEntries, pieceLength, defaultSize);
- }
- else if(util::startsWith(i.first, i.second, "tail=")) {
- std::string sizestr(i.first + 5, i.second);
- computeTailPieces(indexes, fileEntries, pieceLength,
- std::max((int64_t)0, getRealSize(sizestr)));
- }
- else {
- throw DL_ABORT_EX(fmt("Unrecognized token %s",
- std::string(i.first, i.second).c_str()));
- }
- }
- std::sort(indexes.begin(), indexes.end());
- indexes.erase(std::unique(indexes.begin(), indexes.end()), indexes.end());
- result.insert(result.end(), indexes.begin(), indexes.end());
- }
// Converts the |len| bytes of the ISO/IEC 8859-1 string |src| to
// UTF-8. Bytes below 0x80 are copied unchanged and bytes 0xa0-0xff
// become two-byte sequences. If a byte in 0x80-0x9f is encountered,
// an empty string is returned.
std::string iso8859p1ToUtf8(const char* src, size_t len)
{
  std::string utf8;
  for(size_t i = 0; i < len; ++i) {
    const unsigned char c = src[i];
    if(c < 0x80u) {
      utf8 += static_cast<char>(c);
      continue;
    }
    if(c <= 0x9fu) {
      return "";
    }
    // Lead byte is 0xc2 for a0-bf and 0xc3 for c0-ff; clearing bit
    // 0x40 maps the input byte onto the continuation range 80-bf.
    utf8 += static_cast<char>(c <= 0xbfu ? 0xc2u : 0xc3u);
    utf8 += static_cast<char>(c&(~0x40u));
  }
  return utf8;
}
- std::string iso8859p1ToUtf8(const std::string& src)
- {
- return iso8859p1ToUtf8(src.c_str(), src.size());
- }
- /* Start of utf8 dfa */
- /* Copyright (c) 2008-2010 Bjoern Hoehrmann <bjoern@hoehrmann.de>
- * See http://bjoern.hoehrmann.de/utf-8/decoder/dfa/ for details.
- *
- * Copyright (c) 2008-2009 Bjoern Hoehrmann <bjoern@hoehrmann.de>
- *
- * Permission is hereby granted, free of charge, to any person
- * obtaining a copy of this software and associated documentation
- * files (the "Software"), to deal in the Software without
- * restriction, including without limitation the rights to use, copy,
- * modify, merge, publish, distribute, sublicense, and/or sell copies
- * of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be
- * included in all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
- * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
- * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
- * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- */
// DFA states as stored in the transition table: every state value is
// a multiple of 12, the number of character classes.
#define UTF8_ACCEPT 0
#define UTF8_REJECT 12
static const uint8_t utf8d[] = {
  /*
   * The first part of the table (256 entries) maps bytes to character
   * classes, to reduce the size of the transition table and create
   * bitmasks.
   */
  /* 0x00 - 0x1f */
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  /* 0x20 - 0x3f */
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  /* 0x40 - 0x5f */
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  /* 0x60 - 0x7f */
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
  /* 0x80 - 0x9f */
  1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
  9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
  /* 0xa0 - 0xbf */
  7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
  7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
  /* 0xc0 - 0xdf */
  8,8,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
  2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
  /* 0xe0 - 0xff */
  10,3,3,3,3,3,3,3,3,3,3,3,3,4,3,3,
  11,6,6,6,5,8,8,8,8,8,8,8,8,8,8,8,
  /*
   * The second part is a transition table that maps a combination
   * of a state of the automaton and a character class to a state.
   * One row per state, one column per character class 0..11.
   */
  /* state  0 */  0,12,24,36,60,96,84,12,12,12,48,72,
  /* state 12 */ 12,12,12,12,12,12,12,12,12,12,12,12,
  /* state 24 */ 12, 0,12,12,12,12,12, 0,12, 0,12,12,
  /* state 36 */ 12,24,12,12,12,12,12,24,12,24,12,12,
  /* state 48 */ 12,12,12,12,12,12,12,24,12,12,12,12,
  /* state 60 */ 12,24,12,12,12,12,12,12,12,24,12,12,
  /* state 72 */ 12,12,12,12,12,12,12,36,12,36,12,12,
  /* state 84 */ 12,36,12,12,12,12,12,36,12,36,12,12,
  /* state 96 */ 12,36,12,12,12,12,12,12,12,12,12,12,
};
- static uint32_t
- utf8dfa(uint32_t* state, uint32_t* codep, uint32_t byte) {
- uint32_t type = utf8d[byte];
- *codep = (*state != UTF8_ACCEPT) ?
- (byte & 0x3fu) | (*codep << 6) :
- (0xff >> type) & (byte);
- *state = utf8d[256 + *state + type];
- return *state;
- }
- /* End of utf8 dfa */
// States of the state machine in parse_content_disposition(). The
// enumerators are numbered consecutively from 0 in declaration order.
enum content_disposition_parse_state {
  // disposition-type
  CD_BEFORE_DISPOSITION_TYPE = 0,
  CD_AFTER_DISPOSITION_TYPE = 1,
  CD_DISPOSITION_TYPE = 2,
  // parameter name
  CD_BEFORE_DISPOSITION_PARM_NAME = 3,
  CD_AFTER_DISPOSITION_PARM_NAME = 4,
  CD_DISPOSITION_PARM_NAME = 5,
  // regular value (quoted-string or token)
  CD_BEFORE_VALUE = 6,
  CD_AFTER_VALUE = 7,
  CD_QUOTED_STRING = 8,
  CD_TOKEN = 9,
  // extended value: charset'language'value-chars
  CD_BEFORE_EXT_VALUE = 10,
  CD_CHARSET = 11,
  CD_LANGUAGE = 12,
  CD_VALUE_CHARS = 13,
  CD_VALUE_CHARS_PCT_ENCODED1 = 14,
  CD_VALUE_CHARS_PCT_ENCODED2 = 15
};
// Bit flags OR-ed into the |flags| variable of
// parse_content_disposition() once a "filename" or "filename*"
// parameter value has been completely read.
enum content_disposition_parse_flag {
  CD_FILENAME_FOUND = 0x1,
  CD_EXT_FILENAME_FOUND = 0x2
};
// Charset of an extended parameter value as recognised by
// parse_content_disposition(): "utf-8", "iso-8859-1", or anything
// else (unknown).
enum content_disposition_charset {
  CD_ENC_UNKNOWN = 0,
  CD_ENC_UTF8 = 1,
  CD_ENC_ISO_8859_1 = 2
};
- ssize_t parse_content_disposition(char *dest, size_t destlen,
- const char **charsetp, size_t *charsetlenp,
- const char *in, size_t len)
- {
- const char *p = in, *eop = in + len, *mark_first = nullptr, *mark_last = nullptr;
- int state = CD_BEFORE_DISPOSITION_TYPE;
- int in_file_parm = 0;
- int flags = 0;
- int quoted_seen = 0;
- int charset = 0;
- /* To suppress warnings */
- char *dp = dest;
- size_t dlen = destlen;
- uint32_t dfa_state = 0;
- uint32_t dfa_code = 0;
- uint8_t pctval = 0;
- *charsetp = nullptr;
- *charsetlenp = 0;
- for(; p != eop; ++p) {
- switch(state) {
- case CD_BEFORE_DISPOSITION_TYPE:
- if(inRFC2616HttpToken(*p)) {
- state = CD_DISPOSITION_TYPE;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_AFTER_DISPOSITION_TYPE:
- case CD_DISPOSITION_TYPE:
- if(*p == ';') {
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else if(isLws(*p)) {
- state = CD_AFTER_DISPOSITION_TYPE;
- } else if(state == CD_AFTER_DISPOSITION_TYPE ||
- !inRFC2616HttpToken(*p)) {
- return -1;
- }
- break;
- case CD_BEFORE_DISPOSITION_PARM_NAME:
- if(inRFC2616HttpToken(*p)) {
- mark_first = p;
- state = CD_DISPOSITION_PARM_NAME;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_AFTER_DISPOSITION_PARM_NAME:
- case CD_DISPOSITION_PARM_NAME:
- if(*p == '=') {
- if(state == CD_DISPOSITION_PARM_NAME) {
- mark_last = p;
- }
- in_file_parm = 0;
- if(strieq(mark_first, mark_last, "filename*")) {
- if((flags & CD_EXT_FILENAME_FOUND) == 0) {
- in_file_parm = 1;
- } else {
- return -1;
- }
- state = CD_BEFORE_EXT_VALUE;
- } else if(strieq(mark_first, mark_last, "filename")) {
- if(flags & CD_FILENAME_FOUND) {
- return -1;
- }
- if((flags & CD_EXT_FILENAME_FOUND) == 0) {
- in_file_parm = 1;
- }
- state = CD_BEFORE_VALUE;
- } else {
- /* ext-token must be characters in token, followed by "*" */
- if(mark_first != mark_last-1 && *(mark_last-1) == '*') {
- state = CD_BEFORE_EXT_VALUE;
- } else {
- state = CD_BEFORE_VALUE;
- }
- }
- if(in_file_parm) {
- dp = dest;
- dlen = destlen;
- }
- } else if(isLws(*p)) {
- mark_last = p;
- state = CD_AFTER_DISPOSITION_PARM_NAME;
- } else if(state == CD_AFTER_DISPOSITION_PARM_NAME ||
- !inRFC2616HttpToken(*p)) {
- return -1;
- }
- break;
- case CD_BEFORE_VALUE:
- if(*p == '"') {
- quoted_seen = 0;
- state = CD_QUOTED_STRING;
- } else if(inRFC2616HttpToken(*p)) {
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- state = CD_TOKEN;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_AFTER_VALUE:
- if(*p == ';') {
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_QUOTED_STRING:
- if(*p == '\\' && quoted_seen == 0) {
- quoted_seen = 1;
- } else if(*p == '"' && quoted_seen == 0) {
- if(in_file_parm) {
- flags |= CD_FILENAME_FOUND;
- }
- state = CD_AFTER_VALUE;
- } else {
- /* TEXT which is OCTET except CTLs, but including LWS. We only
- accept ISO-8859-1 chars. */
- quoted_seen = 0;
- if(!isIso8859p1(*p)) {
- return -1;
- }
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- }
- break;
- case CD_TOKEN:
- if(inRFC2616HttpToken(*p)) {
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- } else if(*p == ';') {
- if(in_file_parm) {
- flags |= CD_FILENAME_FOUND;
- }
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else if(isLws(*p)) {
- if(in_file_parm) {
- flags |= CD_FILENAME_FOUND;
- }
- state = CD_AFTER_VALUE;
- } else {
- return -1;
- }
- break;
- case CD_BEFORE_EXT_VALUE:
- if(*p == '\'') {
- /* Empty charset is not allowed */
- return -1;
- } else if(inRFC2978MIMECharset(*p)) {
- mark_first = p;
- state = CD_CHARSET;
- } else if(!isLws(*p)) {
- return -1;
- }
- break;
- case CD_CHARSET:
- if(*p == '\'') {
- mark_last = p;
- *charsetp = mark_first;
- *charsetlenp = mark_last - mark_first;
- if(strieq(mark_first, mark_last, "utf-8")) {
- charset = CD_ENC_UTF8;
- dfa_state = UTF8_ACCEPT;
- dfa_code = 0;
- } else if(strieq(mark_first, mark_last, "iso-8859-1")) {
- charset = CD_ENC_ISO_8859_1;
- } else {
- charset = CD_ENC_UNKNOWN;
- }
- state = CD_LANGUAGE;
- } else if(!inRFC2978MIMECharset(*p)) {
- return -1;
- }
- break;
- case CD_LANGUAGE:
- if(*p == '\'') {
- if(in_file_parm) {
- dp = dest;
- dlen = destlen;
- }
- state = CD_VALUE_CHARS;
- } else if(*p != '-' && !isAlpha(*p) && !isDigit(*p)) {
- return -1;
- }
- break;
- case CD_VALUE_CHARS:
- if(inRFC5987AttrChar(*p)) {
- if(charset == CD_ENC_UTF8) {
- if(utf8dfa(&dfa_state, &dfa_code, *p) == UTF8_REJECT) {
- return -1;
- }
- }
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- } else {
- *dp++ = *p;
- --dlen;
- }
- }
- } else if(*p == '%') {
- if(in_file_parm) {
- if(dlen == 0) {
- return -1;
- }
- }
- pctval = 0;
- state = CD_VALUE_CHARS_PCT_ENCODED1;
- } else if(*p == ';' || isLws(*p)) {
- if(charset == CD_ENC_UTF8 && dfa_state != UTF8_ACCEPT) {
- return -1;
- }
- if(in_file_parm) {
- flags |= CD_EXT_FILENAME_FOUND;
- }
- if(*p == ';') {
- state = CD_BEFORE_DISPOSITION_PARM_NAME;
- } else {
- state = CD_AFTER_VALUE;
- }
- } else if(!inRFC5987AttrChar(*p)) {
- return -1;
- }
- break;
- case CD_VALUE_CHARS_PCT_ENCODED1:
- if(isHexDigit(*p)) {
- pctval |= hexCharToUInt(*p) << 4;
- state = CD_VALUE_CHARS_PCT_ENCODED2;
- } else {
- return -1;
- }
- break;
- case CD_VALUE_CHARS_PCT_ENCODED2:
- if(isHexDigit(*p)) {
- pctval |= hexCharToUInt(*p);
- if(charset == CD_ENC_UTF8) {
- if(utf8dfa(&dfa_state, &dfa_code, pctval) == UTF8_REJECT) {
- return -1;
- }
- } else if(charset == CD_ENC_ISO_8859_1) {
- if(!isIso8859p1(pctval)) {
- return -1;
- }
- }
- if(in_file_parm) {
- *dp++ = pctval;
- --dlen;
- }
- state = CD_VALUE_CHARS;
- } else {
- return -1;
- }
- break;
- }
- }
- switch(state) {
- case CD_BEFORE_DISPOSITION_TYPE:
- case CD_AFTER_DISPOSITION_TYPE:
- case CD_DISPOSITION_TYPE:
- case CD_AFTER_VALUE:
- case CD_TOKEN:
- return destlen-dlen;
- case CD_VALUE_CHARS:
- if(charset == CD_ENC_UTF8 && dfa_state != UTF8_ACCEPT) {
- return -1;
- }
- return destlen - dlen;
- default:
- return -1;
- }
- }
- std::string getContentDispositionFilename(const std::string& header)
- {
- char cdval[1024];
- size_t cdvallen = sizeof(cdval);
- const char* charset;
- size_t charsetlen;
- ssize_t rv = parse_content_disposition(cdval, cdvallen,
- &charset, &charsetlen,
- header.c_str(), header.size());
- if(rv == -1) {
- return "";
- }
- std::string res;
- if(!charset || strieq(charset, charset+charsetlen, "iso-8859-1")) {
- res = iso8859p1ToUtf8(cdval, rv);
- } else {
- res.assign(cdval, rv);
- }
- if(!detectDirTraversal(res) &&
- res.find_first_of("/\\") == std::string::npos) {
- return res;
- }
- return "";
- }
- std::string toUpper(std::string src)
- {
- uppercase(src);
- return src;
- }
- std::string toLower(std::string src) {
- lowercase(src);
- return src;
- }
- void uppercase(std::string& s)
- {
- std::transform(s.begin(), s.end(), s.begin(), toUpperChar);
- }
- void lowercase(std::string& s)
- {
- std::transform(s.begin(), s.end(), s.begin(), toLowerChar);
- }
// Maps 'a'..'z' to 'A'..'Z'; every other character is returned
// unchanged.  No locale is consulted.
char toUpperChar(char c)
{
  const bool isLower = c >= 'a' && c <= 'z';
  return isLower ? static_cast<char>(c - ('a' - 'A')) : c;
}
// Maps 'A'..'Z' to 'a'..'z'; every other character is returned
// unchanged.  No locale is consulted.
char toLowerChar(char c)
{
  const bool isUpper = c >= 'A' && c <= 'Z';
  return isUpper ? static_cast<char>(c + ('a' - 'A')) : c;
}
// Returns true when getaddrinfo() accepts name under AI_NUMERICHOST
// for any address family (AF_UNSPEC), false otherwise.
bool isNumericHost(const std::string& name)
{
  struct addrinfo hints;
  memset(&hints, 0, sizeof(hints));
  hints.ai_family = AF_UNSPEC;
  hints.ai_flags = AI_NUMERICHOST;

  struct addrinfo* result = nullptr;
  const int rc = getaddrinfo(name.c_str(), nullptr, &hints, &result);
  if(rc != 0) {
    return false;
  }
  // Only the success/failure of the lookup matters; release the list.
  freeaddrinfo(result);
  return true;
}
#if _WIN32
namespace {
// State shared between setGlobalSignalHandler() and the console control
// handler below.  win_signal_lock guards both handler pointers.
Lock win_signal_lock;
signal_handler_t win_int_handler = nullptr;
signal_handler_t win_term_handler = nullptr;

// Stand-in handler that does nothing.
void win_ign_handler(int) {}

// Console control handler.  CTRL_C/CTRL_BREAK are forwarded to the
// registered SIGINT handler; LOGOFF/CLOSE/SHUTDOWN are forwarded to the
// registered SIGTERM handler.  Returns TRUE only when a handler was
// registered and has been invoked.
BOOL WINAPI HandlerRoutine(DWORD ctrlType)
{
  void (*handler)(int) = nullptr;
  int signo = 0;

  switch(ctrlType) {
  case CTRL_C_EVENT:
  case CTRL_BREAK_EVENT: {
    // Handler will be called on a new/different thread.
    LockGuard lg(win_signal_lock);
    handler = win_int_handler;
    signo = SIGINT;
    break;
  }
  case CTRL_LOGOFF_EVENT:
  case CTRL_CLOSE_EVENT:
  case CTRL_SHUTDOWN_EVENT: {
    // Handler will be called on a new/different thread.
    LockGuard lg(win_signal_lock);
    handler = win_term_handler;
    signo = SIGTERM;
    break;
  }
  default:
    return FALSE;
  }

  // The lock has been released here; the handler runs unlocked.
  if(!handler) {
    return FALSE;
  }
  handler(signo);
  return TRUE;
}
} // namespace
#endif
- void setGlobalSignalHandler(int sig, sigset_t* mask, signal_handler_t handler,
- int flags) {
- #if _WIN32
- if (sig == SIGINT || sig == SIGTERM) {
- // Handler will be called on a new/different thread.
- LockGuard lg(win_signal_lock);
- if (handler == SIG_DFL) {
- handler = nullptr;
- }
- else if (handler == SIG_IGN) {
- handler = win_ign_handler;
- }
- // Not yet in use: add console handler.
- if (handler && !win_int_handler && !win_term_handler) {
- ::SetConsoleCtrlHandler(HandlerRoutine, TRUE);
- }
- if (sig == SIGINT) {
- win_int_handler = handler;
- }
- else {
- win_term_handler = handler;
- }
- // No handlers set: remove.
- if (!win_int_handler && !win_term_handler) {
- ::SetConsoleCtrlHandler(HandlerRoutine, FALSE);
- }
- return;
- }
- #endif
- #ifdef HAVE_SIGACTION
- struct sigaction sigact;
- sigact.sa_handler = handler;
- sigact.sa_flags = flags;
- sigact.sa_mask = *mask;
- sigaction(sig, &sigact, nullptr);
- #else
- signal(sig, handler);
- #endif // HAVE_SIGACTION
- }
- std::string getHomeDir()
- {
- const char* p = getenv("HOME");
- if (p) {
- return p;
- }
- #ifdef __MINGW32__
- p = getenv("USERPROFILE");
- if (p) {
- return p;
- }
- p = getenv("HOMEDRIVE");
- if (p) {
- std::string homeDir = p;
- p = getenv("HOMEPATH");
- if (p) {
- homeDir += p;
- return homeDir;
- }
- }
- #elif HAVE_PWD_H
- passwd* pw = getpwuid(geteuid());
- if(pw && pw->pw_dir) {
- return pw->pw_dir;
- }
- #endif // HAVE_PWD_H
- return A2STR::NIL;
- }
- int64_t getRealSize(const std::string& sizeWithUnit)
- {
- std::string::size_type p = sizeWithUnit.find_first_of("KMkm");
- std::string size;
- int32_t mult = 1;
- if(p == std::string::npos) {
- size = sizeWithUnit;
- } else {
- switch(sizeWithUnit[p]) {
- case 'K':
- case 'k':
- mult = 1024;
- break;
- case 'M':
- case 'm':
- mult = 1024*1024;
- break;
- }
- size.assign(sizeWithUnit.begin(), sizeWithUnit.begin()+p);
- }
- int64_t v;
- if(!parseLLIntNoThrow(v, size) || v < 0) {
- throw DL_ABORT_EX(fmt("Bad or negative value detected: %s",
- sizeWithUnit.c_str()));
- }
- if(INT64_MAX/mult < v) {
- throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE,
- "overflow/underflow"));
- }
- return v*mult;
- }
- std::string abbrevSize(int64_t size)
- {
- static const char* UNITS[] = { "", "Ki", "Mi", "Gi" };
- int64_t t = size;
- size_t uidx = 0;
- int r = 0;
- while(t >= 1024 && uidx+1 < sizeof(UNITS)/sizeof(UNITS[0])) {
- lldiv_t d = lldiv(t, 1024);
- t = d.quot;
- r = d.rem;
- ++uidx;
- }
- if(uidx+1 < sizeof(UNITS)/sizeof(UNITS[0]) && t >= 922) {
- ++uidx;
- r = t;
- t = 0;
- }
- std::string res;
- res += itos(t, true);
- if(t < 10 && uidx > 0) {
- res += ".";
- res += itos(r*10/1024);
- }
- res += UNITS[uidx];
- return res;
- }
- void sleep(long seconds) {
- #if defined(HAVE_WINSOCK2_H)
- ::Sleep(seconds * 1000);
- #elif HAVE_SLEEP
- ::sleep(seconds);
- #elif defined(HAVE_USLEEP)
- ::usleep(seconds * 1000000);
- #else
- # error no sleep function is available (nanosleep?)
- #endif
- }
- void usleep(long microseconds) {
- #ifdef HAVE_USLEEP
- ::usleep(microseconds);
- #elif defined(HAVE_WINSOCK2_H)
- LARGE_INTEGER current, freq, end;
- static enum {GET_FREQUENCY, GET_MICROSECONDS, SKIP_MICROSECONDS} state = GET_FREQUENCY;
- if (state == GET_FREQUENCY) {
- if (QueryPerformanceFrequency(&freq))
- state = GET_MICROSECONDS;
- else
- state = SKIP_MICROSECONDS;
- }
- long msec = microseconds / 1000;
- microseconds %= 1000;
- if (state == GET_MICROSECONDS && microseconds) {
- QueryPerformanceCounter(&end);
- end.QuadPart += (freq.QuadPart * microseconds) / 1000000;
- while (QueryPerformanceCounter(¤t) && (current.QuadPart <= end.QuadPart))
- /* noop */ ;
- }
- if (msec)
- Sleep(msec);
- #else
- #error no usleep function is available (nanosleep?)
- #endif
- }
- void mkdirs(const std::string& dirpath)
- {
- File dir(dirpath);
- if(!dir.mkdirs()) {
- int errNum = errno;
- if(!dir.isDir()) {
- throw DL_ABORT_EX3(errNum, fmt(EX_MAKE_DIR, dir.getPath().c_str(),
- safeStrerror(errNum).c_str()),
- error_code::DIR_CREATE_ERROR);
- }
- }
- }
- void convertBitfield(BitfieldMan* dest, const BitfieldMan* src)
- {
- size_t numBlock = dest->countBlock();
- for(size_t index = 0; index < numBlock; ++index) {
- if(src->isBitSetOffsetRange((int64_t)index*dest->getBlockLength(),
- dest->getBlockLength())) {
- dest->setBit(index);
- }
- }
- }
- std::string toString(const std::shared_ptr<BinaryStream>& binaryStream)
- {
- std::stringstream strm;
- char data[2048];
- while(1) {
- int32_t dataLength = binaryStream->readData
- (reinterpret_cast<unsigned char*>(data), sizeof(data), strm.tellp());
- strm.write(data, dataLength);
- if(dataLength == 0) {
- break;
- }
- }
- return strm.str();
- }
#ifdef HAVE_POSIX_MEMALIGN
/**
 * Allocates size bytes aligned to alignment with posix_memalign() and
 * returns the buffer.  Throws FATAL_EXCEPTION carrying the error text
 * when the allocation fails.
 *
 * In linux 2.6, alignment and size should be a multiple of 512.
 */
void* allocateAlignedMemory(size_t alignment, size_t size)
{
  void* buffer;
  const int res = posix_memalign(&buffer, alignment, size);
  if(res != 0) {
    throw FATAL_EXCEPTION(fmt("Error in posix_memalign: %s",
                              util::safeStrerror(res).c_str()));
  }
  return buffer;
}
#endif // HAVE_POSIX_MEMALIGN
- std::pair<std::string, uint16_t>
- getNumericNameInfo(const struct sockaddr* sockaddr, socklen_t len)
- {
- char host[NI_MAXHOST];
- char service[NI_MAXSERV];
- int s = getnameinfo(sockaddr, len, host, NI_MAXHOST, service, NI_MAXSERV,
- NI_NUMERICHOST|NI_NUMERICSERV);
- if(s != 0) {
- throw DL_ABORT_EX(fmt("Failed to get hostname and port. cause: %s",
- gai_strerror(s)));
- }
- return std::pair<std::string, uint16_t>(host, atoi(service)); // TODO
- }
// Returns src with the five HTML-significant characters replaced by
// character references:
//
//   <  ->  &lt;     >  ->  &gt;     &  ->  &amp;
//   '  ->  &#39;    "  ->  &quot;
//
// All other bytes are copied unchanged.
std::string htmlEscape(const std::string& src)
{
  std::string dest;
  dest.reserve(src.size());
  // j marks the start of the pending run of characters that need no
  // escaping; the run is flushed whenever a special character is hit.
  auto j = std::begin(src);
  for(auto i = std::begin(src); i != std::end(src); ++i) {
    const char* repl;
    switch(*i) {
    case '<':
      repl = "&lt;";
      break;
    case '>':
      repl = "&gt;";
      break;
    case '&':
      repl = "&amp;";
      break;
    case '\'':
      repl = "&#39;";
      break;
    case '"':
      repl = "&quot;";
      break;
    default:
      continue;
    }
    dest.append(j, i);
    j = i + 1;
    dest += repl;
  }
  dest.append(j, std::end(src));
  return dest;
}
- std::pair<size_t, std::string>
- parseIndexPath(const std::string& line)
- {
- auto p = divide(std::begin(line), std::end(line), '=');
- uint32_t index;
- if(!parseUIntNoThrow(index, std::string(p.first.first, p.first.second))) {
- throw DL_ABORT_EX("Bad path index");
- }
- if(p.second.first == p.second.second) {
- throw DL_ABORT_EX(fmt("Path with index=%u is empty.", index));
- }
- return std::make_pair(index, std::string(p.second.first, p.second.second));
- }
- std::vector<std::pair<size_t, std::string> > createIndexPaths(std::istream& i)
- {
- std::vector<std::pair<size_t, std::string> > indexPaths;
- std::string line;
- while(getline(i, line)) {
- indexPaths.push_back(parseIndexPath(line));
- }
- return indexPaths;
- }
- namespace {
- void generateRandomDataRandom(unsigned char* data, size_t length)
- {
- const auto& rd = SimpleRandomizer::getInstance();
- rd->getRandomBytes(data, length);
- }
- } // namespace
#ifndef __MINGW32__
namespace {
// Reads length bytes from the already opened stream devUrand into
// data.  The stream state is not checked afterwards.
void generateRandomDataUrandom
(unsigned char* data, size_t length, std::ifstream& devUrand)
{
  char* const out = reinterpret_cast<char*>(data);
  devUrand.read(out, length);
}
} // namespace
#endif
- void generateRandomData(unsigned char* data, size_t length)
- {
- #ifdef __MINGW32__
- generateRandomDataRandom(data, length);
- #else // !__MINGW32__
- static int method = -1;
- static std::ifstream devUrand;
- if(method == 0) {
- generateRandomDataUrandom(data, length, devUrand);
- } else if(method == 1) {
- generateRandomDataRandom(data, length);
- } else {
- devUrand.open("/dev/urandom");
- if(devUrand) {
- method = 0;
- } else {
- method = 1;
- }
- generateRandomData(data, length);
- }
- #endif // !__MINGW32__
- }
- bool saveAs
- (const std::string& filename, const std::string& data, bool overwrite)
- {
- if(!overwrite && File(filename).exists()) {
- return false;
- }
- std::string tempFilename = filename;
- tempFilename += "__temp";
- {
- BufferedFile fp(tempFilename.c_str(), BufferedFile::WRITE);
- if(!fp) {
- return false;
- }
- if(fp.write(data.data(), data.size()) != data.size()) {
- return false;
- }
- if(fp.close() == EOF) {
- return false;
- }
- }
- return File(tempFilename).renameTo(filename);
- }
// Joins dir and relPath with a single '/'.
//
// An empty dir yields "./" + relPath; dir == "/" yields "/" + relPath
// (no doubled slash); any other dir yields dir + "/" + relPath.  Under
// __MINGW32__ every backslash in the result is turned into '/'.
std::string applyDir(const std::string& dir, const std::string& relPath)
{
  std::string joined;
  if(dir.empty()) {
    joined = "./";
  }
  else {
    joined = dir;
    if(dir != "/") {
      joined += "/";
    }
  }
  joined += relPath;
#ifdef __MINGW32__
  std::replace(joined.begin(), joined.end(), '\\', '/');
#endif // __MINGW32__
  return joined;
}
- std::string fixTaintedBasename(const std::string& src)
- {
- return escapePath(replace(src, "/", "%2F"));
- }
- void generateRandomKey(unsigned char* key)
- {
- unsigned char bytes[40];
- generateRandomData(bytes, sizeof(bytes));
- message_digest::digest(key, 20, MessageDigest::sha1().get(), bytes,
- sizeof(bytes));
- }
- // Returns true is given numeric ipv4addr is in Private Address Space.
- //
- // From Section.3 RFC1918
- // 10.0.0.0 - 10.255.255.255 (10/8 prefix)
- // 172.16.0.0 - 172.31.255.255 (172.16/12 prefix)
- // 192.168.0.0 - 192.168.255.255 (192.168/16 prefix)
- bool inPrivateAddress(const std::string& ipv4addr)
- {
- if(util::startsWith(ipv4addr, "10.") ||
- util::startsWith(ipv4addr, "192.168.")) {
- return true;
- }
- if(util::startsWith(ipv4addr, "172.")) {
- for(int i = 16; i <= 31; ++i) {
- std::string t(fmt("%d.", i));
- if(util::startsWith(ipv4addr.begin()+4, ipv4addr.end(),
- t.begin(), t.end())) {
- return true;
- }
- }
- }
- return false;
- }
- bool detectDirTraversal(const std::string& s)
- {
- if(s.empty()) {
- return false;
- }
- for (auto c : s) {
- unsigned char ch = c;
- if (in(ch, 0x00u, 0x1fu) || ch == 0x7fu) {
- return true;
- }
- }
- return s == "." || s == ".." || s[0] == '/' ||
- util::startsWith(s, "./") ||
- util::startsWith(s, "../") ||
- s.find("/../") != std::string::npos ||
- s.find("/./") != std::string::npos ||
- s[s.size()-1] == '/' ||
- util::endsWith(s, "/.") ||
- util::endsWith(s, "/..");
- }
- std::string escapePath(const std::string& s)
- {
- // We don't escape '/' because we use it as a path separator.
- #ifdef __MINGW32__
- static const char WIN_INVALID_PATH_CHARS[] =
- { '"', '*', ':', '<', '>', '?', '\\', '|' };
- #endif // __MINGW32__
- std::string d;
- for(auto cc: s) {
- unsigned char c = cc;
- if(in(c, 0x00u, 0x1fu) || c == 0x7fu
- #ifdef __MINGW32__
- || std::find(std::begin(WIN_INVALID_PATH_CHARS),
- std::end(WIN_INVALID_PATH_CHARS),
- c) != std::end(WIN_INVALID_PATH_CHARS)
- #endif // __MINGW32__
- ){
- d += fmt("%%%02X", c);
- } else {
- d += c;
- }
- }
- return d;
- }
- bool inSameCidrBlock
- (const std::string& ip1, const std::string& ip2, size_t bits)
- {
- unsigned char s1[16], s2[16];
- size_t len1, len2;
- if((len1 = net::getBinAddr(s1, ip1)) == 0 ||
- (len2 = net::getBinAddr(s2, ip2)) == 0 ||
- len1 != len2) {
- return false;
- }
- if(bits == 0) {
- return true;
- }
- if(bits > 8*len1) {
- bits = 8*len1;
- }
- int last = (bits-1)/8;
- for(int i = 0; i < last; ++i) {
- if(s1[i] != s2[i]) {
- return false;
- }
- }
- unsigned char mask = bitfield::lastByteMask(bits);
- return (s1[last] & mask) == (s2[last] & mask);
- }
- namespace {
- void executeHook
- (const std::string& command,
- a2_gid_t gid,
- size_t numFiles,
- const std::string& firstFilename)
- {
- const std::string gidStr = GroupId::toHex(gid);
- const std::string numFilesStr = util::uitos(numFiles);
- #ifndef __MINGW32__
- A2_LOG_INFO(fmt("Executing user command: %s %s %s %s",
- command.c_str(),
- gidStr.c_str(),
- numFilesStr.c_str(),
- firstFilename.c_str()));
- pid_t cpid = fork();
- if (cpid == 0) {
- // child!
- execlp(command.c_str(),
- command.c_str(),
- gidStr.c_str(),
- numFilesStr.c_str(),
- firstFilename.c_str(),
- reinterpret_cast<char*>(0));
- perror(("Could not execute user command: "+command).c_str());
- _exit(EXIT_FAILURE);
- return;
- }
- if(cpid == -1) {
- A2_LOG_ERROR("fork() failed. Cannot execute user command.");
- }
- return;
- #else // __MINGW32__
- PROCESS_INFORMATION pi;
- STARTUPINFOW si;
- memset(&si, 0, sizeof (si));
- si.cb = sizeof(STARTUPINFO);
- memset(&pi, 0, sizeof (pi));
- bool batch = util::iendsWith(command, ".bat");
- std::string cmdline;
- std::string cmdexe;
- // XXX batch handling, in particular quoting, correct?
- if(batch) {
- const char* p = getenv("windir");
- if(p) {
- cmdexe = p;
- cmdexe += "\\system32\\cmd.exe";
- } else {
- A2_LOG_INFO("Failed to get windir environment variable."
- " Executing batch file will fail.");
- // TODO Might be useless.
- cmdexe = "cmd.exe";
- }
- cmdline += "/C \"";
- }
- cmdline += "\"";
- cmdline += command;
- cmdline += "\"";
- cmdline += " ";
- cmdline += gidStr;
- cmdline += " ";
- cmdline += numFilesStr;
- cmdline += " \"";
- cmdline += firstFilename;
- cmdline += "\"";
- if(batch) {
- cmdline += "\"";
- }
- int cmdlineLen = utf8ToWChar(nullptr, 0, cmdline.c_str());
- assert(cmdlineLen > 0);
- auto wcharCmdline = make_unique<wchar_t[]>(cmdlineLen);
- cmdlineLen = utf8ToWChar(wcharCmdline.get(), cmdlineLen, cmdline.c_str());
- assert(cmdlineLen > 0);
- A2_LOG_INFO(fmt("Executing user command: %s", cmdline.c_str()));
- DWORD rc = CreateProcessW(batch ? utf8ToWChar(cmdexe).c_str() : nullptr,
- wcharCmdline.get(),
- nullptr,
- nullptr,
- true,
- 0,
- nullptr,
- 0,
- &si,
- &pi);
- if(!rc) {
- A2_LOG_ERROR("CreateProcess() failed. Cannot execute user command.");
- }
- return;
- #endif
- }
- } // namespace
- void executeHookByOptName
- (const std::shared_ptr<RequestGroup>& group, const Option* option,
- PrefPtr pref)
- {
- executeHookByOptName(group.get(), option, pref);
- }
- void executeHookByOptName
- (const RequestGroup* group, const Option* option, PrefPtr pref)
- {
- const std::string& cmd = option->get(pref);
- if(!cmd.empty()) {
- const std::shared_ptr<DownloadContext> dctx = group->getDownloadContext();
- std::string firstFilename;
- size_t numFiles = 0;
- if(!group->inMemoryDownload()) {
- std::shared_ptr<FileEntry> file = dctx->getFirstRequestedFileEntry();
- if(file) {
- firstFilename = file->getPath();
- }
- numFiles = dctx->countRequestedFileEntry();
- }
- executeHook(cmd, group->getGID(), numFiles, firstFilename);
- }
- }
- std::string createSafePath
- (const std::string& dir, const std::string& filename)
- {
- return util::applyDir(dir, util::isUtf8(filename) ?
- util::fixTaintedBasename(filename) :
- util::escapePath(util::percentEncode(filename))
- );
- }
- std::string encodeNonUtf8(const std::string& s)
- {
- return util::isUtf8(s)?s:util::percentEncode(s);
- }
- std::string makeString(const char* str)
- {
- if(!str) {
- return A2STR::NIL;
- }
- return str;
- }
- std::string safeStrerror(int errNum)
- {
- return makeString(strerror(errNum));
- }
- bool noProxyDomainMatch
- (const std::string& hostname,
- const std::string& domain)
- {
- if(!domain.empty() && domain[0] == '.' && !util::isNumericHost(hostname)) {
- return util::endsWith(hostname, domain);
- }
- return hostname == domain;
- }
- bool tlsHostnameMatch(const std::string& pattern, const std::string& hostname)
- {
- std::string::const_iterator ptWildcard = std::find(pattern.begin(),
- pattern.end(),
- '*');
- if(ptWildcard == pattern.end()) {
- return strieq(pattern.begin(), pattern.end(),
- hostname.begin(), hostname.end());
- }
- std::string::const_iterator ptLeftLabelEnd = std::find(pattern.begin(),
- pattern.end(),
- '.');
- bool wildcardEnabled = true;
- // Do case-insensitive match. At least 2 dots are required to enable
- // wildcard match. Also wildcard must be in the left-most label.
- // Don't attempt to match a presented identifier where the wildcard
- // character is embedded within an A-label.
- if(ptLeftLabelEnd == pattern.end() ||
- std::find(ptLeftLabelEnd+1, pattern.end(), '.') == pattern.end() ||
- ptLeftLabelEnd < ptWildcard ||
- istartsWith(pattern, "xn--")) {
- wildcardEnabled = false;
- }
- if(!wildcardEnabled) {
- return strieq(pattern.begin(), pattern.end(),
- hostname.begin(), hostname.end());
- }
- std::string::const_iterator hnLeftLabelEnd = std::find(hostname.begin(),
- hostname.end(),
- '.');
- if(!strieq(ptLeftLabelEnd, pattern.end(), hnLeftLabelEnd, hostname.end())) {
- return false;
- }
- // Perform wildcard match. Here '*' must match at least one
- // character.
- if(hnLeftLabelEnd - hostname.begin() < ptLeftLabelEnd - pattern.begin()) {
- return false;
- }
- return istartsWith(hostname.begin(), hnLeftLabelEnd, pattern.begin(),
- ptWildcard) &&
- iendsWith(hostname.begin(), hnLeftLabelEnd, ptWildcard + 1,
- ptLeftLabelEnd);
- }
- bool strieq(const std::string& a, const char* b)
- {
- return strieq(a.begin(), a.end(), b);
- }
- bool strieq(const std::string& a, const std::string& b)
- {
- return strieq(a.begin(), a.end(), b.begin(), b.end());
- }
- bool startsWith(const std::string& a, const char* b)
- {
- return startsWith(a.begin(), a.end(), b);
- }
- bool startsWith(const std::string& a, const std::string& b)
- {
- return startsWith(a.begin(), a.end(), b.begin(), b.end());
- }
- bool istartsWith(const std::string& a, const char* b)
- {
- return istartsWith(a.begin(), a.end(), b);
- }
- bool endsWith(const std::string& a, const char* b)
- {
- return endsWith(a.begin(), a.end(), b, b+strlen(b));
- }
- bool endsWith(const std::string& a, const std::string& b)
- {
- return endsWith(a.begin(), a.end(), b.begin(), b.end());
- }
- bool iendsWith(const std::string& a, const char* b)
- {
- return iendsWith(a.begin(), a.end(), b, b+strlen(b));
- }
- bool iendsWith(const std::string& a, const std::string& b)
- {
- return iendsWith(a.begin(), a.end(), b.begin(), b.end());
- }
// Strict-weak "less than" for C strings, based on strcmp().
bool strless(const char* a, const char* b)
{
  const int order = strcmp(a, b);
  return order < 0;
}
- } // namespace util
- } // namespace aria2
|