/* */ #include "util.h" #include #include #include #include #include #include #include #include #include #include #include #include "SimpleRandomizer.h" #include "File.h" #include "Randomizer.h" #include "a2netcompat.h" #include "BitfieldMan.h" #include "DefaultDiskWriter.h" #include "FatalException.h" #include "FileEntry.h" #include "A2STR.h" #include "array_fun.h" #include "bitfield.h" #include "DownloadHandlerConstants.h" #include "RequestGroup.h" #include "LogFactory.h" #include "Logger.h" #include "Option.h" #include "DownloadContext.h" #include "BufferedFile.h" #include "SocketCore.h" #include "prefs.h" #ifdef ENABLE_MESSAGE_DIGEST # include "MessageDigest.h" # include "message_digest_helper.h" #endif // ENABLE_MESSAGE_DIGEST // For libc6 which doesn't define ULLONG_MAX properly because of broken limits.h #ifndef ULLONG_MAX # define ULLONG_MAX 18446744073709551615ULL #endif // ULLONG_MAX namespace aria2 { #ifdef __MINGW32__ namespace { int utf8ToWChar(wchar_t* out, size_t outLength, const char* src) { return MultiByteToWideChar(CP_UTF8, 0, src, -1, out, outLength); } } // namespace namespace { int ansiToWChar(wchar_t* out, size_t outLength, const char* src) { return MultiByteToWideChar(CP_ACP, 0, src, -1, out, outLength); } } // namespace namespace { int wCharToUtf8(char* out, size_t outLength, const wchar_t* src) { return WideCharToMultiByte(CP_UTF8, 0, src, -1, out, outLength, 0, 0); } } // namespace namespace { int wCharToAnsi(char* out, size_t outLength, const wchar_t* src) { return WideCharToMultiByte(CP_ACP, 0, src, -1, out, outLength, 0, 0); } } // namespace std::wstring utf8ToWChar(const char* src) { int len = utf8ToWChar(0, 0, src); if(len == 0) { abort(); } array_ptr buf(new wchar_t[len]); len = utf8ToWChar(buf, len, src); if(len == 0) { abort(); } else { std::wstring dest(buf); return dest; } } std::wstring utf8ToWChar(const std::string& src) { return utf8ToWChar(src.c_str()); } std::string utf8ToNative(const std::string& src) { std::wstring wsrc = utf8ToWChar(src); int len = wCharToAnsi(0, 0, wsrc.c_str()); if(len == 0) { abort(); } array_ptr buf(new char[len]); len = wCharToAnsi(buf, len, wsrc.c_str()); if(len == 0) { abort(); } else { std::string dest(buf); return dest; } } std::string wCharToUtf8(const std::wstring& wsrc) { int len = wCharToUtf8(0, 0, wsrc.c_str()); if(len == 0) { abort(); } array_ptr buf(new char[len]); len = wCharToUtf8(buf, len, wsrc.c_str()); if(len == 0) { abort(); } else { std::string dest(buf); return dest; } } std::string nativeToUtf8(const std::string& src) { int len = ansiToWChar(0, 0, src.c_str()); if(len == 0) { abort(); } array_ptr buf(new wchar_t[len]); len = ansiToWChar(buf, len, src.c_str()); if(len == 0) { abort(); } else { return wCharToUtf8(std::wstring(buf)); } } #endif // __MINGW32__ namespace util { const std::string DEFAULT_STRIP_CHARSET("\r\n\t "); std::string strip(const std::string& str, const std::string& chars) { std::pair p = stripIter(str.begin(), str.end(), chars); return std::string(p.first, p.second); } std::string itos(int64_t value, bool comma) { bool flag = false; std::string str; if(value < 0) { if(value == INT64_MIN) { if(comma) { str = "-9,223,372,036,854,775,808"; } else { str = "-9223372036854775808"; } return str; } flag = true; value = -value; } str = uitos(value, comma); if(flag) { str.insert(str.begin(), '-'); } return str; } int64_t difftv(struct timeval tv1, struct timeval tv2) { if((tv1.tv_sec < tv2.tv_sec) || ((tv1.tv_sec == tv2.tv_sec) && (tv1.tv_usec < tv2.tv_usec))) { return 0; } return ((int64_t)(tv1.tv_sec-tv2.tv_sec)*1000000+ tv1.tv_usec-tv2.tv_usec); } int32_t difftvsec(struct timeval tv1, struct timeval tv2) { if(tv1.tv_sec < tv2.tv_sec) { return 0; } return tv1.tv_sec-tv2.tv_sec; } std::string replace(const std::string& target, const std::string& oldstr, const std::string& newstr) { if(target.empty() || oldstr.empty()) { return target; } std::string result; std::string::size_type p = 0; std::string::size_type np = target.find(oldstr); while(np != std::string::npos) { result += target.substr(p, np-p); result += newstr; p = np+oldstr.size(); np = target.find(oldstr, p); } result += target.substr(p); return result; } bool isAlpha(const char c) { return ('A' <= c && c <= 'Z') || ('a' <= c && c <= 'z'); } bool isDigit(const char c) { return '0' <= c && c <= '9'; } bool isHexDigit(const char c) { return isDigit(c) || ('A' <= c && c <= 'F') || ('a' <= c && c <= 'f'); } bool isHexDigit(const std::string& s) { for(std::string::const_iterator i = s.begin(), eoi = s.end(); i != eoi; ++i) { if(!isHexDigit(*i)) { return false; } } return true; } bool inRFC3986ReservedChars(const char c) { static const char reserved[] = { ':' , '/' , '?' , '#' , '[' , ']' , '@', '!' , '$' , '&' , '\'' , '(' , ')', '*' , '+' , ',' , ';' , '=' }; return std::find(vbegin(reserved), vend(reserved), c) != vend(reserved); } bool inRFC3986UnreservedChars(const char c) { static const char unreserved[] = { '-', '.', '_', '~' }; return isAlpha(c) || isDigit(c) || std::find(vbegin(unreserved), vend(unreserved), c) != vend(unreserved); } bool inRFC2978MIMECharset(const char c) { static const char chars[] = { '!', '#', '$', '%', '&', '\'', '+', '-', '^', '_', '`', '{', '}', '~' }; return isAlpha(c) || isDigit(c) || std::find(vbegin(chars), vend(chars), c) != vend(chars); } bool inRFC2616HttpToken(const char c) { static const char chars[] = { '!', '#', '$', '%', '&', '\'', '*', '+', '-', '.', '^', '_', '`', '|', '~' }; return isAlpha(c) || isDigit(c) || std::find(vbegin(chars), vend(chars), c) != vend(chars); } namespace { bool isUtf8Tail(unsigned char ch) { return in(ch, 0x80u, 0xbfu); } } // namespace bool isUtf8(const std::string& str) { for(std::string::const_iterator s = str.begin(), eos = str.end(); s != eos; ++s) { unsigned char firstChar = *s; // See ABNF in http://tools.ietf.org/search/rfc3629#section-4 if(in(firstChar, 0x20u, 0x7eu) || firstChar == 0x08u || // \b firstChar == 0x09u || // \t firstChar == 0x0au || // \n firstChar == 0x0cu || // \f firstChar == 0x0du // \r ) { // UTF8-1 (without ctrl chars) } else if(in(firstChar, 0xc2u, 0xdfu)) { // UTF8-2 if(++s == eos || !isUtf8Tail(*s)) { return false; } } else if(0xe0u == firstChar) { // UTF8-3 if(++s == eos || !in(static_cast(*s), 0xa0u, 0xbfu) || ++s == eos || !isUtf8Tail(*s)) { return false; } } else if(in(firstChar, 0xe1u, 0xecu) || in(firstChar, 0xeeu, 0xefu)) { // UTF8-3 if(++s == eos || !isUtf8Tail(*s) || ++s == eos || !isUtf8Tail(*s)) { return false; } } else if(0xedu == firstChar) { // UTF8-3 if(++s == eos || !in(static_cast(*s), 0x80u, 0x9fu) || ++s == eos || !isUtf8Tail(*s)) { return false; } } else if(0xf0u == firstChar) { // UTF8-4 if(++s == eos || !in(static_cast(*s), 0x90u, 0xbfu) || ++s == eos || !isUtf8Tail(*s) || ++s == eos || !isUtf8Tail(*s)) { return false; } } else if(in(firstChar, 0xf1u, 0xf3u)) { // UTF8-4 if(++s == eos || !isUtf8Tail(*s) || ++s == eos || !isUtf8Tail(*s) || ++s == eos || !isUtf8Tail(*s)) { return false; } } else if(0xf4u == firstChar) { // UTF8-4 if(++s == eos || !in(static_cast(*s), 0x80u, 0x8fu) || ++s == eos || !isUtf8Tail(*s) || ++s == eos || !isUtf8Tail(*s)) { return false; } } else { return false; } } return true; } std::string percentEncode(const unsigned char* target, size_t len) { std::string dest; for(size_t i = 0; i < len; ++i) { if(inRFC3986UnreservedChars(target[i])) { dest += target[i]; } else { dest.append(fmt("%%%02X", target[i])); } } return dest; } std::string percentEncode(const std::string& target) { return percentEncode(reinterpret_cast(target.c_str()), target.size()); } std::string percentEncodeMini(const std::string& src) { std::string result; for(std::string::const_iterator i = src.begin(), eoi = src.end(); i != eoi; ++i) { // Non-Printable ASCII and non-ASCII chars + some ASCII chars. unsigned char c = *i; if(in(c, 0x00u, 0x20u) || c >= 0x7fu || // Chromium escapes following characters. Firefox4 escapes // more. c == '"' || c == '<' || c == '>') { result += fmt("%%%02X", c); } else { result += c; } } return result; } std::string torrentPercentEncode(const unsigned char* target, size_t len) { std::string dest; for(size_t i = 0; i < len; ++i) { if(isAlpha(target[i]) || isDigit(target[i])) { dest += target[i]; } else { dest.append(fmt("%%%02X", target[i])); } } return dest; } std::string torrentPercentEncode(const std::string& target) { return torrentPercentEncode (reinterpret_cast(target.c_str()), target.size()); } std::string percentDecode (std::string::const_iterator first, std::string::const_iterator last) { std::string result; for(; first != last; ++first) { if(*first == '%') { if(first+1 != last && first+2 != last && isHexDigit(*(first+1)) && isHexDigit(*(first+2))) { result += parseInt(first+1, first+3, 16); first += 2; } else { result += *first; } } else { result += *first; } } return result; } std::string toHex(const unsigned char* src, size_t len) { std::string out(len*2, '\0'); std::string::iterator o = out.begin(); const unsigned char* last = src+len; for(const unsigned char* i = src; i != last; ++i) { *o = (*i >> 4); *(o+1) = (*i)&0x0fu; for(int j = 0; j < 2; ++j) { if(*o < 10) { *o += '0'; } else { *o += 'a'-10; } ++o; } } return out; } std::string toHex(const char* src, size_t len) { return toHex(reinterpret_cast(src), len); } std::string toHex(const std::string& src) { return toHex(reinterpret_cast(src.c_str()), src.size()); } namespace { unsigned int hexCharToUInt(unsigned char ch) { if('a' <= ch && ch <= 'f') { ch -= 'a'; ch += 10; } else if('A' <= ch && ch <= 'F') { ch -= 'A'; ch += 10; } else if('0' <= ch && ch <= '9') { ch -= '0'; } else { ch = 255; } return ch; } } // namespace std::string fromHex(const std::string& src) { std::string dest; if(src.size()%2) { return dest; } for(size_t i = 0, eoi = src.size(); i < eoi; i += 2) { unsigned char high = hexCharToUInt(src[i]); unsigned char low = hexCharToUInt(src[i+1]); if(high == 255 || low == 255) { dest.clear(); return dest; } dest += (high*16+low); } return dest; } FILE* openFile(const std::string& filename, const std::string& mode) { FILE* file = fopen(filename.c_str(), mode.c_str()); return file; } bool isPowerOf(int num, int base) { if(base <= 0) { return false; } if(base == 1) { return true; } while(num%base == 0) { num /= base; if(num == 1) { return true; } } return false; } std::string secfmt(time_t sec) { std::string str; if(sec >= 3600) { str = itos(sec/3600); str += "h"; sec %= 3600; } if(sec >= 60) { int min = sec/60; if(min < 10) { str += "0"; } str += itos(min); str += "m"; sec %= 60; } if(sec < 10) { str += "0"; } str += itos(sec); str += "s"; return str; } int getNum(const char* buf, int offset, size_t length) { char* temp = new char[length+1]; memcpy(temp, buf+offset, length); temp[length] = '\0'; int x = strtol(temp, 0, 10); delete [] temp; return x; } void parseIntSegments(SegList& sgl, const std::string& src) { for(std::string::const_iterator i = src.begin(), eoi = src.end(); i != eoi;) { std::string::const_iterator j = std::find(i, eoi, ','); if(j == i) { ++i; continue; } std::string::const_iterator p = std::find(i, j, '-'); if(p == j) { int a = parseInt(i, j); sgl.add(a, a+1); } else if(p == i || p+1 == j) { throw DL_ABORT_EX(fmt(MSG_INCOMPLETE_RANGE, std::string(i, j).c_str())); } else { int a = parseInt(i, p); int b = parseInt(p+1, j); sgl.add(a, b+1); } if(j == eoi) { break; } i = j+1; } } namespace { void computeHeadPieces (std::vector& indexes, const std::vector >& fileEntries, size_t pieceLength, uint64_t head) { if(head == 0) { return; } for(std::vector >::const_iterator fi = fileEntries.begin(), eoi = fileEntries.end(); fi != eoi; ++fi) { if((*fi)->getLength() == 0) { continue; } size_t lastIndex = ((*fi)->getOffset()+std::min(head, (*fi)->getLength())-1)/pieceLength; for(size_t index = (*fi)->getOffset()/pieceLength; index <= lastIndex; ++index) { indexes.push_back(index); } } } } // namespace namespace { void computeTailPieces (std::vector& indexes, const std::vector >& fileEntries, size_t pieceLength, uint64_t tail) { if(tail == 0) { return; } for(std::vector >::const_iterator fi = fileEntries.begin(), eoi = fileEntries.end(); fi != eoi; ++fi) { if((*fi)->getLength() == 0) { continue; } uint64_t endOffset = (*fi)->getLastOffset(); size_t fromIndex = (endOffset-1-(std::min(tail, (*fi)->getLength())-1))/pieceLength; for(size_t index = fromIndex; index <= (endOffset-1)/pieceLength; ++index) { indexes.push_back(index); } } } } // namespace void parsePrioritizePieceRange (std::vector& result, const std::string& src, const std::vector >& fileEntries, size_t pieceLength, uint64_t defaultSize) { std::vector indexes; std::vector parts; const char A2_HEAD[] = "head"; const char A2_HEADEQ[] = "head="; const char A2_TAIL[] = "tail"; const char A2_TAILEQ[] = "tail="; splitIter(src.begin(), src.end(), std::back_inserter(parts), ',', true); for(std::vector::const_iterator i = parts.begin(), eoi = parts.end(); i != eoi; ++i) { if(util::streq((*i).first, (*i).second, A2_HEAD, vend(A2_HEAD)-1)) { computeHeadPieces(indexes, fileEntries, pieceLength, defaultSize); } else if(util::startsWith((*i).first, (*i).second, A2_HEADEQ, vend(A2_HEADEQ)-1)) { std::string sizestr((*i).first+5, (*i).second); computeHeadPieces(indexes, fileEntries, pieceLength, std::max((int64_t)0, getRealSize(sizestr))); } else if(util::streq((*i).first, (*i).second, A2_TAIL, vend(A2_TAIL)-1)) { computeTailPieces(indexes, fileEntries, pieceLength, defaultSize); } else if(util::startsWith((*i).first, (*i).second, A2_TAILEQ, vend(A2_TAILEQ)-1)) { std::string sizestr((*i).first+5, (*i).second); computeTailPieces(indexes, fileEntries, pieceLength, std::max((int64_t)0, getRealSize(sizestr))); } else { throw DL_ABORT_EX(fmt("Unrecognized token %s", std::string((*i).first, (*i).second).c_str())); } } std::sort(indexes.begin(), indexes.end()); indexes.erase(std::unique(indexes.begin(), indexes.end()), indexes.end()); result.insert(result.end(), indexes.begin(), indexes.end()); } // Converts ISO/IEC 8859-1 string to UTF-8 string. If there is a // character not in ISO/IEC 8859-1, returns empty string. std::string iso8859ToUtf8(const std::string& src) { std::string dest; for(std::string::const_iterator itr = src.begin(), eoi = src.end(); itr != eoi; ++itr) { unsigned char c = *itr; if(0xa0u <= c) { if(c <= 0xbfu) { dest += 0xc2u; } else { dest += 0xc3u; } dest += c&(~0x40u); } else if(0x80u <= c && c <= 0x9fu) { return A2STR::NIL; } else { dest += c; } } return dest; } namespace { template void parseParam(OutputIterator out, const std::string& header) { for(std::string::const_iterator i = header.begin(), eoi = header.end(); i != eoi;) { std::string::const_iterator paramFirst = i; std::string::const_iterator paramLast = paramFirst; for(; paramLast != eoi && *paramLast != '=' && *paramLast != ';'; ++paramLast); std::string param; if(paramLast == eoi || *paramLast == ';') { // No value, parmname only param = std::string(paramFirst, paramLast); } else { for(; paramLast != eoi && *paramLast != '"' && *paramLast != ';'; ++paramLast); if(paramLast != eoi && *paramLast == '"') { // quoted-string ++paramLast; for(; paramLast != eoi && *paramLast != '"'; ++paramLast); if(paramLast != eoi) { ++paramLast; } param = std::string(paramFirst, paramLast); for(; paramLast != eoi && *paramLast != ';'; ++paramLast); } else { param = std::string(paramFirst, paramLast); } } param = strip(param); *out++ = param; if(paramLast == eoi) { break; } i = paramLast; ++i; } } } // namespace std::string getContentDispositionFilename(const std::string& header) { const char A2_KEYNAME[] = "filename"; std::string filename; std::vector params; parseParam(std::back_inserter(params), header); for(std::vector::const_iterator i = params.begin(), eoi = params.end(); i != eoi; ++i) { const std::string& param = *i; std::string lowparam = toLower(param); if(!startsWith(lowparam.begin(), lowparam.end(), A2_KEYNAME, vend(A2_KEYNAME)-1) || param.size() == sizeof(A2_KEYNAME)-1) { continue; } std::string::const_iterator markeritr = param.begin()+sizeof(A2_KEYNAME)-1; if(*markeritr == '*') { // See RFC2231 Section4 and draft-reschke-rfc2231-in-http. // Please note that this function doesn't do charset conversion // except that if iso-8859-1 is specified, it is converted to // utf-8. ++markeritr; for(; markeritr != param.end() && *markeritr == ' '; ++markeritr); if(markeritr == param.end() || *markeritr != '=') { continue; } std::vector extValues; splitIter(markeritr+1, param.end(), std::back_inserter(extValues), '\'', true, true); if(extValues.size() != 3) { continue; } bool bad = false; for(std::string::const_iterator j = extValues[0].first, eoj = extValues[0].second; j != eoj; ++j) { // Since we first split parameter by ', we can safely assume // that ' is not included in charset. if(!inRFC2978MIMECharset(*j)) { bad = true; break; } } if(bad) { continue; } bad = false; for(std::string::const_iterator j = extValues[2].first, eoj = extValues[2].second; j != eoj; ++j){ if(*j == '%') { if(j+1 != eoj && isHexDigit(*(j+1)) && j+2 != eoj && isHexDigit(*(j+2))) { j += 2; } else { bad = true; break; } } else { if(*j == '*' || *j == '\'' || !inRFC2616HttpToken(*j)) { bad = true; break; } } } if(bad) { continue; } std::string value = percentDecode(extValues[2].first, extValues[2].second); const char A2_ISO88591[] = "iso-8859-1"; if(util::strieq(extValues[0].first, extValues[0].second, A2_ISO88591, vend(A2_ISO88591)-1)) { value = iso8859ToUtf8(value); } if(!detectDirTraversal(value) && value.find(A2STR::SLASH_C) == std::string::npos) { filename = value; } if(!filename.empty()) { break; } } else { for(; markeritr != param.end() && *markeritr == ' '; ++markeritr); if(markeritr == param.end() || markeritr+1 == param.end() || *markeritr != '=') { continue; } Scip p = stripIter(markeritr+1, param.end()); if(p.first == p.second) { continue; } std::string value(p.first, p.second); std::string::iterator filenameLast; if(value[0] == '\'' || value[0] == '"') { char qc = *value.begin(); for(filenameLast = value.begin()+1; filenameLast != value.end() && *filenameLast != qc; ++filenameLast); } else { filenameLast = value.end(); } static const std::string TRIMMED("\r\n\t '\""); value = percentDecode(value.begin(), filenameLast); value = strip(value, TRIMMED); value.erase(std::remove(value.begin(), value.end(), '\\'), value.end()); if(!detectDirTraversal(value) && value.find(A2STR::SLASH_C) == std::string::npos) { filename = value; } // continue because there is a chance we can find filename*=... } } return filename; } std::string randomAlpha(size_t length, const RandomizerHandle& randomizer) { static const char *random_chars = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"; std::string str; for(size_t i = 0; i < length; ++i) { size_t index = randomizer->getRandomNumber(strlen(random_chars)); str += random_chars[index]; } return str; } std::string toUpper(const std::string& src) { std::string temp = src; std::transform(temp.begin(), temp.end(), temp.begin(), ::toupper); return temp; } std::string toLower(const std::string& src) { std::string temp = src; std::transform(temp.begin(), temp.end(), temp.begin(), ::tolower); return temp; } void uppercase(std::string& s) { std::transform(s.begin(), s.end(), s.begin(), ::toupper); } void lowercase(std::string& s) { std::transform(s.begin(), s.end(), s.begin(), ::tolower); } bool isNumericHost(const std::string& name) { struct addrinfo hints; struct addrinfo* res; memset(&hints, 0, sizeof(hints)); hints.ai_family = AF_UNSPEC; hints.ai_flags = AI_NUMERICHOST; if(getaddrinfo(name.c_str(), 0, &hints, &res)) { return false; } freeaddrinfo(res); return true; } void setGlobalSignalHandler(int sig, void (*handler)(int), int flags) { #ifdef HAVE_SIGACTION struct sigaction sigact; sigact.sa_handler = handler; sigact.sa_flags = flags; sigemptyset(&sigact.sa_mask); sigaction(sig, &sigact, NULL); #else signal(sig, handler); #endif // HAVE_SIGACTION } std::string getHomeDir() { const char* p = getenv("HOME"); if(p) { return p; } else { #ifdef __MINGW32__ p = getenv("USERPROFILE"); if(p) { return p; } else { p = getenv("HOMEDRIVE"); if(p) { std::string homeDir = p; p = getenv("HOMEPATH"); if(p) { homeDir += p; return homeDir; } } } #endif return A2STR::NIL; } } int64_t getRealSize(const std::string& sizeWithUnit) { std::string::size_type p = sizeWithUnit.find_first_of("KM"); std::string size; int32_t mult = 1; if(p == std::string::npos) { size = sizeWithUnit; } else { if(sizeWithUnit[p] == 'K') { mult = 1024; } else if(sizeWithUnit[p] == 'M') { mult = 1024*1024; } size = sizeWithUnit.substr(0, p); } int64_t v = parseLLInt(size.begin(), size.end()); if(v < 0) { throw DL_ABORT_EX(fmt("Negative value detected: %s", sizeWithUnit.c_str())); } else if(INT64_MAX/mult < v) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, "overflow/underflow")); } return v*mult; } std::string abbrevSize(int64_t size) { if(size < 1024) { return itos(size, true); } char units[] = { 'K', 'M' }; size_t numUnit = sizeof(units)/sizeof(char); size_t i = 0; int r = size&0x3ffu; size >>= 10; for(; i < numUnit-1 && size >= 1024; ++i) { r = size&0x3ffu; size >>= 10; } std::string result = itos(size, true); result += A2STR::DOT_C; result += itos(r*10/1024); result += units[i]; result += "i"; return result; } void sleep(long seconds) { #ifdef HAVE_SLEEP ::sleep(seconds); #elif defined(HAVE_USLEEP) ::usleep(seconds * 1000000); #elif defined(HAVE_WINSOCK2_H) ::Sleep(seconds * 1000); #else #error no sleep function is available (nanosleep?) #endif } void usleep(long microseconds) { #ifdef HAVE_USLEEP ::usleep(microseconds); #elif defined(HAVE_WINSOCK2_H) LARGE_INTEGER current, freq, end; static enum {GET_FREQUENCY, GET_MICROSECONDS, SKIP_MICROSECONDS} state = GET_FREQUENCY; if (state == GET_FREQUENCY) { if (QueryPerformanceFrequency(&freq)) state = GET_MICROSECONDS; else state = SKIP_MICROSECONDS; } long msec = microseconds / 1000; microseconds %= 1000; if (state == GET_MICROSECONDS && microseconds) { QueryPerformanceCounter(&end); end.QuadPart += (freq.QuadPart * microseconds) / 1000000; while (QueryPerformanceCounter(¤t) && (current.QuadPart <= end.QuadPart)) /* noop */ ; } if (msec) Sleep(msec); #else #error no usleep function is available (nanosleep?) #endif } bool isNumber(const std::string& what) { if(what.empty()) { return false; } for(std::string::const_iterator i = what.begin(), eoi = what.end(); i != eoi; ++i) { if(!isDigit(*i)) { return false; } } return true; } bool isLowercase(const std::string& what) { if(what.empty()) { return false; } for(uint32_t i = 0, eoi = what.size(); i < eoi; ++i) { if(!('a' <= what[i] && what[i] <= 'z')) { return false; } } return true; } bool isUppercase(const std::string& what) { if(what.empty()) { return false; } for(uint32_t i = 0, eoi = what.size(); i < eoi; ++i) { if(!('A' <= what[i] && what[i] <= 'Z')) { return false; } } return true; } unsigned int alphaToNum(const std::string& alphabets) { if(alphabets.empty()) { return 0; } char base; if(islower(alphabets[0])) { base = 'a'; } else { base = 'A'; } uint64_t num = 0; for(size_t i = 0, eoi = alphabets.size(); i < eoi; ++i) { unsigned int v = alphabets[i]-base; num = num*26+v; if(num > UINT32_MAX) { return 0; } } return num; } void mkdirs(const std::string& dirpath) { File dir(dirpath); if(!dir.mkdirs()) { int errNum = errno; if(!dir.isDir()) { throw DL_ABORT_EX3 (errNum, fmt(EX_MAKE_DIR, dir.getPath().c_str(), safeStrerror(errNum).c_str()), error_code::DIR_CREATE_ERROR); } } } void convertBitfield(BitfieldMan* dest, const BitfieldMan* src) { size_t numBlock = dest->countBlock(); for(size_t index = 0; index < numBlock; ++index) { if(src->isBitSetOffsetRange((uint64_t)index*dest->getBlockLength(), dest->getBlockLength())) { dest->setBit(index); } } } std::string toString(const BinaryStreamHandle& binaryStream) { std::stringstream strm; char data[2048]; while(1) { int32_t dataLength = binaryStream->readData (reinterpret_cast(data), sizeof(data), strm.tellp()); strm.write(data, dataLength); if(dataLength == 0) { break; } } return strm.str(); } #ifdef HAVE_POSIX_MEMALIGN /** * In linux 2.6, alignment and size should be a multiple of 512. */ void* allocateAlignedMemory(size_t alignment, size_t size) { void* buffer; int res; if((res = posix_memalign(&buffer, alignment, size)) != 0) { throw FATAL_EXCEPTION (fmt("Error in posix_memalign: %s", util::safeStrerror(res).c_str())); } return buffer; } #endif // HAVE_POSIX_MEMALIGN std::pair getNumericNameInfo(const struct sockaddr* sockaddr, socklen_t len) { char host[NI_MAXHOST]; char service[NI_MAXSERV]; int s = getnameinfo(sockaddr, len, host, NI_MAXHOST, service, NI_MAXSERV, NI_NUMERICHOST|NI_NUMERICSERV); if(s != 0) { throw DL_ABORT_EX(fmt("Failed to get hostname and port. cause: %s", gai_strerror(s))); } return std::pair(host, atoi(service)); // TODO } std::string htmlEscape(const std::string& src) { std::string dest; for(std::string::const_iterator i = src.begin(), eoi = src.end(); i != eoi; ++i) { char ch = *i; if(ch == '<') { dest += "<"; } else if(ch == '>') { dest += ">"; } else if(ch == '&') { dest += "&"; } else if(ch == '\'') { dest += "'"; } else if(ch == '"') { dest += """; } else { dest += ch; } } return dest; } std::pair parseIndexPath(const std::string& line) { std::pair p; divide(p, line.begin(), line.end(), '='); size_t index = parseUInt(p.first.first, p.first.second); if(p.second.first == p.second.second) { throw DL_ABORT_EX(fmt("Path with index=%u is empty.", static_cast(index))); } return std::make_pair(index, std::string(p.second.first, p.second.second)); } std::vector > createIndexPaths(std::istream& i) { std::vector > indexPaths; std::string line; while(getline(i, line)) { indexPaths.push_back(parseIndexPath(line)); } return indexPaths; } namespace { void generateRandomDataRandom(unsigned char* data, size_t length) { const SharedHandle& rd = SimpleRandomizer::getInstance(); for(size_t i = 0; i < length; ++i) { data[i] = static_cast(rd->getRandomNumber(256)); } } } // namespace namespace { void generateRandomDataUrandom(unsigned char* data, size_t length, int fd) { while(length > 0) { ssize_t r; while((r = read(fd, data, length)) == -1 && errno == EINTR); if(r <= 0) { generateRandomDataRandom(data, length); return; } length -= r; data += r; } } } // namespace void generateRandomData(unsigned char* data, size_t length) { #ifdef __MINGW32__ generateRandomDataRandom(data, length); #else // !__MINGW32__ static int method = -1; static int fd; if(method == 0) { generateRandomDataUrandom(data, length, fd); } else if(method == 1) { generateRandomDataRandom(data, length); } else { while((fd = open("/dev/urandom", O_RDONLY)) == -1 && errno == EINTR); if(fd == -1) { method = 1; } else { method = 0; } generateRandomData(data, length); } #endif // !__MINGW32__ } bool saveAs (const std::string& filename, const std::string& data, bool overwrite) { if(!overwrite && File(filename).exists()) { return false; } std::string tempFilename = strconcat(filename, "__temp"); { BufferedFile fp(tempFilename, BufferedFile::WRITE); if(!fp) { return false; } if(fp.write(data.data(), data.size()) != data.size()) { return false; } if(fp.close() == EOF) { return false; } } return File(tempFilename).renameTo(filename); } std::string applyDir(const std::string& dir, const std::string& relPath) { std::string s; if(dir.empty()) { s = strconcat(A2STR::DOT_C, A2STR::SLASH_C, relPath); } else if(dir == A2STR::SLASH_C) { s = strconcat(A2STR::SLASH_C, relPath); } else { s = strconcat(dir, A2STR::SLASH_C, relPath); } #ifdef __MINGW32__ for(std::string::iterator i = s.begin(), eoi = s.end(); i != eoi; ++i) { if(*i == '\\') { *i = '/'; } } #endif // __MINGW32__ return s; } std::string fixTaintedBasename(const std::string& src) { static std::string SLASH_REP = "%2F"; return escapePath(replace(src, A2STR::SLASH_C, SLASH_REP)); } void generateRandomKey(unsigned char* key) { #ifdef ENABLE_MESSAGE_DIGEST unsigned char bytes[40]; generateRandomData(bytes, sizeof(bytes)); message_digest::digest(key, 20, MessageDigest::sha1(), bytes, sizeof(bytes)); #else // !ENABLE_MESSAGE_DIGEST generateRandomData(key, 20); #endif // !ENABLE_MESSAGE_DIGEST } // Returns true is given numeric ipv4addr is in Private Address Space. // // From Section.3 RFC1918 // 10.0.0.0 - 10.255.255.255 (10/8 prefix) // 172.16.0.0 - 172.31.255.255 (172.16/12 prefix) // 192.168.0.0 - 192.168.255.255 (192.168/16 prefix) bool inPrivateAddress(const std::string& ipv4addr) { const char A2_IP10[] = "10."; const char A2_IP192[] = "192.168."; if(util::startsWith(ipv4addr.begin(), ipv4addr.end(), A2_IP10, vend(A2_IP10)-1) || util::startsWith(ipv4addr.begin(), ipv4addr.end(), A2_IP192, vend(A2_IP192)-1)) { return true; } std::string p172("172."); if(util::startsWith(ipv4addr.begin(), ipv4addr.end(), p172.begin(), p172.end())) { for(int i = 16; i <= 31; ++i) { std::string t(p172); t += util::itos(i); t += '.'; if(util::startsWith(ipv4addr.begin(), ipv4addr.end(), t.begin(), t.end())) { return true; } } } return false; } bool detectDirTraversal(const std::string& s) { if(s.empty()) { return false; } for(std::string::const_iterator i = s.begin(), eoi = s.end(); i != eoi; ++i) { unsigned char c = *i; if(in(c, 0x00u, 0x1fu) || c == 0x7fu) { return true; } } const char A2_DS[] = "./"; const char A2_DDS[] = "../"; const char A2_SD[] = "/."; const char A2_SDD[] = "/.."; const char A2_SDDS[] = "/../"; const char A2_SDS[] = "/./"; const char A2_DD[] = ".."; return s == A2STR::DOT_C || s == A2_DD || s[0] == '/' || util::startsWith(s.begin(), s.end(), A2_DS, vend(A2_DS)-1) || util::startsWith(s.begin(), s.end(), A2_DDS, vend(A2_DDS)-1) || s.find(A2_SDDS) != std::string::npos || s.find(A2_SDS) != std::string::npos || s[s.size()-1] == '/' || util::endsWith(s.begin(), s.end(), A2_SD, vend(A2_SD)-1) || util::endsWith(s.begin(), s.end(), A2_SDD, vend(A2_SDD)-1); } std::string escapePath(const std::string& s) { // We don't escape '/' because we use it as a path separator. #ifdef __MINGW32__ static const char WIN_INVALID_PATH_CHARS[] = { '"', '*', ':', '<', '>', '?', '\\', '|' }; #endif // __MINGW32__ std::string d; for(std::string::const_iterator i = s.begin(), eoi = s.end(); i != eoi; ++i) { unsigned char c = *i; if(in(c, 0x00u, 0x1fu) || c == 0x7fu #ifdef __MINGW32__ || std::find(vbegin(WIN_INVALID_PATH_CHARS), vend(WIN_INVALID_PATH_CHARS), c) != vend(WIN_INVALID_PATH_CHARS) #endif // __MINGW32__ ){ d += fmt("%%%02X", c); } else { d += *i; } } return d; } bool inSameCidrBlock (const std::string& ip1, const std::string& ip2, size_t bits) { unsigned char s1[16], s2[16]; size_t len1, len2; if((len1 = net::getBinAddr(s1, ip1)) == 0 || (len2 = net::getBinAddr(s2, ip2)) == 0 || len1 != len2) { return false; } if(bits > 8*len1) { bits = 8*len1; } int last = (bits-1)/8; for(int i = 0; i < last; ++i) { if(s1[i] != s2[i]) { return false; } } unsigned char mask = bitfield::lastByteMask(bits); return (s1[last] & mask) == (s2[last] & mask); } void removeMetalinkContentTypes(const SharedHandle& group) { removeMetalinkContentTypes(group.get()); } void removeMetalinkContentTypes(RequestGroup* group) { for(std::vector::const_iterator i = DownloadHandlerConstants::getMetalinkContentTypes().begin(), eoi = DownloadHandlerConstants::getMetalinkContentTypes().end(); i != eoi; ++i) { group->removeAcceptType(*i); } } namespace { void executeHook (const std::string& command, a2_gid_t gid, size_t numFiles, const std::string& firstFilename) { const std::string gidStr = util::itos(gid); const std::string numFilesStr = util::uitos(numFiles); #ifndef __MINGW32__ A2_LOG_INFO(fmt("Executing user command: %s %s %s %s", command.c_str(), gidStr.c_str(), numFilesStr.c_str(), firstFilename.c_str())); pid_t cpid = fork(); if(cpid == -1) { A2_LOG_ERROR("fork() failed. Cannot execute user command."); } else if(cpid == 0) { execl(command.c_str(), command.c_str(), gidStr.c_str(), numFilesStr.c_str(), firstFilename.c_str(), reinterpret_cast(0)); perror(("Could not execute user command: "+command).c_str()); exit(EXIT_FAILURE); } #else PROCESS_INFORMATION pi; STARTUPINFO si; memset(&si, 0, sizeof (si)); si.cb = sizeof(STARTUPINFO); memset(&pi, 0, sizeof (pi)); const char A2_BAT[] = ".bat"; bool batch = util::iendsWith(command.begin(), command.end(), A2_BAT, vend(A2_BAT)-1); std::string cmdline; std::string cmdexe; if(batch) { const char* p = getenv("windir"); if(p) { cmdexe = std::string(p); cmdexe += "\\system32\\cmd.exe"; } else { A2_LOG_INFO("Failed to get windir environment variable." " Executing batch file will fail."); // TODO Might be useless. cmdexe = "cmd.exe"; } cmdline += "/C \""; } strappend(cmdline, "\"", command, "\""); strappend(cmdline, " ", gidStr, " ", numFilesStr, " \"", firstFilename, "\""); if(batch) { cmdline += "\""; } A2_LOG_INFO(fmt("Executing user command: %s", cmdline.c_str())); DWORD rc = CreateProcess( batch ? cmdexe.c_str() : NULL, (LPSTR)cmdline.c_str(), NULL, NULL, true, NULL, NULL, 0, &si, &pi); if(!rc) { A2_LOG_ERROR("CreateProcess() failed. Cannot execute user command."); } #endif } } // namespace void executeHookByOptName (const SharedHandle& group, const Option* option, const Pref* pref) { executeHookByOptName(group.get(), option, pref); } void executeHookByOptName (const RequestGroup* group, const Option* option, const Pref* pref) { const std::string& cmd = option->get(pref); if(!cmd.empty()) { const SharedHandle dctx = group->getDownloadContext(); std::string firstFilename; size_t numFiles = 0; if(!group->inMemoryDownload()) { SharedHandle file = dctx->getFirstRequestedFileEntry(); if(file) { firstFilename = file->getPath(); } numFiles = dctx->countRequestedFileEntry(); } executeHook(cmd, group->getGID(), numFiles, firstFilename); } } std::string createSafePath (const std::string& dir, const std::string& filename) { return util::applyDir (dir, util::isUtf8(filename)? util::fixTaintedBasename(filename): util::escapePath(util::percentEncode(filename))); } std::string encodeNonUtf8(const std::string& s) { return util::isUtf8(s)?s:util::percentEncode(s); } std::string makeString(const char* str) { if(str) { return str; } else { return A2STR::NIL; } } std::string safeStrerror(int errNum) { return makeString(strerror(errNum)); } bool noProxyDomainMatch (const std::string& hostname, const std::string& domain) { if(!domain.empty() && domain[0] == '.' && !util::isNumericHost(hostname)) { return util::endsWith(hostname.begin(), hostname.end(), domain.begin(), domain.end()); } else { return hostname == domain; } } } // namespace util } // namespace aria2