/* */ #ifndef D_UTIL_H #define D_UTIL_H #include "common.h" #include #include #include #include #include #include #include #include #include #include #include #include #include #include "SharedHandle.h" #include "a2time.h" #include "a2netcompat.h" #include "a2functional.h" #include "SegList.h" #include "a2iterator.h" #include "message.h" #include "DlAbortEx.h" #include "fmt.h" namespace aria2 { class Randomizer; class BitfieldMan; class BinaryStream; class FileEntry; class RequestGroup; class Option; class Pref; #define STRTOLL(X) strtoll(X, reinterpret_cast(0), 10) #define STRTOULL(X) strtoull(X, reinterpret_cast(0), 10) #define START_INDEX(OFFSET, PIECE_LENGTH) ((OFFSET)/(PIECE_LENGTH)) #define END_INDEX(OFFSET, LENGTH, PIECE_LENGTH) (((OFFSET)+(LENGTH)-1)/(PIECE_LENGTH)) #define DIV_FLOOR(X,Y) ((X)/(Y)+((X)%(Y)? 1:0)) #ifdef WORDS_BIGENDIAN inline uint64_t ntoh64(uint64_t x) { return x; } inline uint64_t hton64(uint64_t x) { return x; } #else // !WORDS_BIGENDIAN inline uint64_t byteswap64(uint64_t x) { uint64_t v1 = ntohl(x & 0x00000000ffffffffllu); uint64_t v2 = ntohl(x >> 32); return (v1 << 32)|v2; } inline uint64_t ntoh64(uint64_t x) { return byteswap64(x); } inline uint64_t hton64(uint64_t x) { return byteswap64(x); } #endif // !WORDS_BIGENDIAN #ifdef __MINGW32__ std::wstring utf8ToWChar(const std::string& src); std::wstring utf8ToWChar(const char* str); std::string utf8ToNative(const std::string& src); std::string wCharToUtf8(const std::wstring& wsrc); std::string nativeToUtf8(const std::string& src); #else // !__MINGW32__ # define utf8ToWChar(src) src # define utf8ToNative(src) src #endif // !__MINGW32__ namespace util { template void divide (std::pair& hp, InputIterator first, InputIterator last, char delim) { InputIterator dpos = std::find(first, last, delim); if(dpos == last) { hp.first = stripIter(first, last); hp.second.first = hp.second.second; } else { hp.first = stripIter(first, dpos); hp.second = stripIter(dpos+1, last); } } template std::string uitos(T value, bool comma = false) { std::string str; if(value == 0) { str = "0"; return str; } unsigned int count = 0; while(value) { ++count; char digit = value%10+'0'; if(comma && count > 3 && count%3 == 1) { str += ','; } str += digit; value /= 10; } std::reverse(str.begin(), str.end()); return str; } std::string itos(int64_t value, bool comma = false); /** * Computes difference in micro-seconds between tv1 and tv2, * assuming tv1 is newer than tv2. * If tv1 is older than tv2, then this method returns 0. */ int64_t difftv(struct timeval tv1, struct timeval tv2); int32_t difftvsec(struct timeval tv1, struct timeval tv2); extern const std::string DEFAULT_STRIP_CHARSET; template std::pair stripIter (InputIterator first, InputIterator last, const std::string& chars = DEFAULT_STRIP_CHARSET) { for(; first != last && std::find(chars.begin(), chars.end(), *first) != chars.end(); ++first); if(first == last) { return std::make_pair(first, last); } InputIterator left = last-1; for(; left != first && std::find(chars.begin(), chars.end(), *left) != chars.end(); --left); return std::make_pair(first, left+1); } std::string strip (const std::string& str, const std::string& chars = DEFAULT_STRIP_CHARSET); bool startsWith(const std::string& target, const std::string& part); bool endsWith(const std::string& target, const std::string& part); std::string replace(const std::string& target, const std::string& oldstr, const std::string& newstr); std::string percentEncode(const unsigned char* target, size_t len); std::string percentEncode(const std::string& target); std::string percentEncodeMini(const std::string& target); bool inRFC3986ReservedChars(const char c); bool inRFC3986UnreservedChars(const char c); bool isUtf8(const std::string& str); std::string percentDecode (std::string::const_iterator first, std::string::const_iterator last); std::string torrentPercentEncode(const unsigned char* target, size_t len); std::string torrentPercentEncode(const std::string& target); std::string toHex(const unsigned char* src, size_t len); std::string toHex(const char* src, size_t len); std::string toHex(const std::string& src); // Converts hexadecimal ascii string 'src' into packed binary form and // return the result. If src is not well formed, then empty string is // returned. std::string fromHex(const std::string& src); FILE* openFile(const std::string& filename, const std::string& mode); bool isPowerOf(int num, int base); std::string secfmt(time_t sec); template bool parseIntNoThrow (int32_t& result, InputIterator first, InputIterator last, int base = 10) { // Without strip, strtol(" -1 ",..) emits error. Scip p = util::stripIter(first, last); if(p.first == p.second) { return false; } char buf[32]; size_t len = std::distance(p.first, p.second); if(len+1 > sizeof(buf)) { return false; } std::copy(p.first, p.second, &buf[0]); buf[len] = '\0'; char* stop; errno = 0; long int v = strtol(buf, &stop, base); if(*stop != '\0') { return false; } else if(((v == LONG_MAX || v == LONG_MIN) && (errno == ERANGE)) || v < INT32_MIN || INT32_MAX < v) { return false; } result = v; return true; } template bool parseUIntNoThrow (uint32_t& result, InputIterator first, InputIterator last, int base = 10) { // Without strip, strtol(" -1 ",..) emits error. Scip p = util::stripIter(first, last); if(p.first == p.second) { return false; } char buf[32]; size_t len = std::distance(p.first, p.second); if(len+1 > sizeof(buf)) { return false; } std::copy(p.first, p.second, &buf[0]); buf[len] = '\0'; // We don't allow negative number. if(buf[0] == '-') { return false; } char* stop; errno = 0; unsigned long int v = strtoul(buf, &stop, base); if(*stop != '\0') { return false; } else if(((v == ULONG_MAX) && (errno == ERANGE)) || (v > UINT32_MAX)) { return false; } result = v; return true; } template bool parseLLIntNoThrow (int64_t& result, InputIterator first, InputIterator last, int base = 10) { // Without strip, strtol(" -1 ",..) emits error. Scip p = util::stripIter(first, last); if(p.first == p.second) { return false; } char buf[32]; size_t len = std::distance(p.first, p.second); if(len+1 > sizeof(buf)) { return false; } std::copy(p.first, p.second, &buf[0]); buf[len] = '\0'; char* stop; errno = 0; int64_t v = strtoll(buf, &stop, base); if(*stop != '\0') { return false; } else if(((v == INT64_MIN) || (v == INT64_MAX)) && (errno == ERANGE)) { return false; } result = v; return true; } template int64_t parseLLInt(InputIterator first, InputIterator last, int base = 10) { Scip p = util::stripIter(first, last); if(p.first == p.second) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, "empty string")); } char buf[32]; size_t len = std::distance(p.first, p.second); if(len+1 > sizeof(buf)) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, "too large")); } std::copy(p.first, p.second, &buf[0]); buf[len] = '\0'; char* stop; errno = 0; int64_t v = strtoll(buf, &stop, base); if(*stop != '\0') { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, buf)); } else if(((v == INT64_MIN) || (v == INT64_MAX)) && (errno == ERANGE)) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, buf)); } return v; } template int32_t parseInt(InputIterator first, InputIterator last, int base = 10) { int64_t v = util::parseLLInt(first, last, base); if(v < INT32_MIN || INT32_MAX < v) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, std::string(first, last).c_str())); } return v; } template uint64_t parseULLInt(InputIterator first, InputIterator last, int base = 10) { Scip p = util::stripIter(first, last); if(p.first == p.second) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, "empty string")); } char buf[32]; size_t len = std::distance(p.first, p.second); if(len+1 > sizeof(buf)) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, "too large")); } std::copy(p.first, p.second, &buf[0]); buf[len] = '\0'; // We don't allow negative number. if(buf[0] == '-') { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, buf)); } char* stop; errno = 0; uint64_t v = strtoull(buf, &stop, base); if(*stop != '\0') { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, buf)); } else if((v == ULLONG_MAX) && (errno == ERANGE)) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, buf)); } return v; } template uint32_t parseUInt(InputIterator first, InputIterator last, int base = 10) { uint64_t v = util::parseULLInt(first, last, base); if(UINT32_MAX < v) { throw DL_ABORT_EX(fmt(MSG_STRING_INTEGER_CONVERSION_FAILURE, std::string(first, last).c_str())); } return v; } void parseIntSegments(SegList& sgl, const std::string& src); // Parses string which specifies the range of piece index for higher // priority and appends those indexes into result. The input string // src can contain 2 keywords "head" and "tail". To include both // keywords, they must be separated by comma. "head" means the pieces // where the first byte of each file sits. "tail" means the pieces // where the last byte of each file sits. These keywords can take one // parameter, SIZE. For example, if "head=SIZE" is specified, pieces // in the range of first SIZE bytes of each file get higher // priority. SIZE can include K or M(1K = 1024, 1M = 1024K). // If SIZE is omitted, SIZE=defaultSize is used. // // sample: head=512K,tail=512K void parsePrioritizePieceRange (std::vector& result, const std::string& src, const std::vector >& fileEntries, size_t pieceLength, uint64_t defaultSize = 1048576 /* 1MiB */); // Converts ISO/IEC 8859-1 string src to utf-8. std::string iso8859ToUtf8(const std::string& src); std::string getContentDispositionFilename(const std::string& header); std::string randomAlpha(size_t length, const SharedHandle& randomizer); std::string toUpper(const std::string& src); std::string toLower(const std::string& src); void uppercase(std::string& s); void lowercase(std::string& s); bool isNumericHost(const std::string& name); void setGlobalSignalHandler(int signal, void (*handler)(int), int flags); std::string getHomeDir(); int64_t getRealSize(const std::string& sizeWithUnit); std::string abbrevSize(int64_t size); template void toStream (InputIterator first, InputIterator last, Output& os) { os.printf("%s\n" "idx|path/length\n" "===+===========================================================================\n", _("Files:")); int32_t count = 1; for(; first != last; ++first, ++count) { os.printf("%3d|%s\n" " |%sB (%s)\n" "---+---------------------------------------------------------------------------\n", count, (*first)->getPath().c_str(), util::abbrevSize((*first)->getLength()).c_str(), util::uitos((*first)->getLength(), true).c_str()); } } void sleep(long seconds); void usleep(long microseconds); bool isNumber(const std::string& what); bool isDigit(const char c); bool isHexDigit(const char c); bool isHexDigit(const std::string& s); bool isLowercase(const std::string& what); bool isUppercase(const std::string& what); /** * Converts alphabets to unsigned int, assuming alphabets as a base 26 * integer and 'a' or 'A' is 0. * This function assumes alphabets includes only a-z. * Upper case are allowed but all letters must be upper case. * If overflow occurs, returns 0. */ unsigned int alphaToNum(const std::string& alphabets); void mkdirs(const std::string& dirpath); void convertBitfield(BitfieldMan* dest, const BitfieldMan* src); // binaryStream has to be opened before calling this function. std::string toString(const SharedHandle& binaryStream); #ifdef HAVE_POSIX_MEMALIGN void* allocateAlignedMemory(size_t alignment, size_t size); #endif // HAVE_POSIX_MEMALIGN std::pair getNumericNameInfo(const struct sockaddr* sockaddr, socklen_t len); std::string htmlEscape(const std::string& src); // Joins path element specified in [first, last). If ".." is found, // it eats the previous element if it exists. If "." is found, it // is just ignored and it is not appeared in the result. template std::string joinPath(InputIterator first, InputIterator last) { std::vector elements; for(;first != last; ++first) { if(*first == "..") { if(!elements.empty()) { elements.pop_back(); } } else if(*first == ".") { // do nothing } else { elements.push_back(*first); } } return strjoin(elements.begin(), elements.end(), "/"); } // Parses INDEX=PATH format string. INDEX must be an unsigned // integer. std::pair parseIndexPath(const std::string& line); std::vector > createIndexPaths(std::istream& i); /** * Take a string src which is a delimited list and add its elements * into result. result is stored in out. */ template OutputIterator split(const std::string& src, OutputIterator out, const std::string& delims, bool doStrip = false, bool allowEmpty = false) { std::string::const_iterator first = src.begin(); std::string::const_iterator last = src.end(); for(std::string::const_iterator i = first; i != last;) { std::string::const_iterator j = i; for(; j != last && std::find(delims.begin(), delims.end(), *j) == delims.end(); ++j); std::pair p(i, j); if(doStrip) { p = stripIter(i, j); } if(allowEmpty || p.first != p.second) { *out++ = std::string(p.first, p.second); } i = j; if(j != last) { ++i; } } if(allowEmpty && (src.empty() || std::find(delims.begin(), delims.end(), src[src.size()-1]) != delims.end())) { *out++ = A2STR::NIL; } return out; } void generateRandomData(unsigned char* data, size_t length); // Saves data to file whose name is filename. If overwrite is true, // existing file is overwritten. Otherwise, this function doesn't do // nothing. If data is saved successfully, return true. Otherwise // returns false. bool saveAs (const std::string& filename, const std::string& data, bool overwrite=false); // Prepend dir to relPath. If dir is empty, it prepends "." to relPath. // // dir = "/dir", relPath = "foo" => "/dir/foo" // dir = "", relPath = "foo" => "./foo" // dir = "/", relPath = "foo" => "/foo" std::string applyDir(const std::string& dir, const std::string& relPath); // In HTTP/FTP, file name is file component in URI. In HTTP, filename // may be a value of Content-Disposition header. They are likely // percent encoded. If they contains, for example, %2F, when decoded, // basename contains dir component. This should be avoided. This // function is created to fix these issues. This function expects src // should be non-percent-encoded basename. Currently, this function // replaces '/' with '_' and result string is passed to escapePath() // function and its result is returned. std::string fixTaintedBasename(const std::string& src); // Generates 20 bytes random key and store it to the address pointed // by key. Caller must allocate at least 20 bytes for generated key. void generateRandomKey(unsigned char* key); // Returns true is given numeric ipv4addr is in Private Address Space. bool inPrivateAddress(const std::string& ipv4addr); // Returns true if s contains directory traversal path component such // as '..' or it contains null or control character which may fool // user. bool detectDirTraversal(const std::string& s); // Replaces null(0x00) and control character(0x01-0x1f) with '_'. If // __MINGW32__ is defined, following characters are also replaced with // '_': '"', '*', ':', '<', '>', '?', '\', '|'. std::string escapePath(const std::string& s); // Returns true if ip1 and ip2 are in the same CIDR block. ip1 and // ip2 must be numeric IPv4 or IPv6 address. If either of them or both // of them is not valid numeric address, then returns false. bits is // prefix bits. If bits is out of range, then bits is set to the // length of binary representation of the address*8. bool inSameCidrBlock (const std::string& ip1, const std::string& ip2, size_t bits); void removeMetalinkContentTypes(const SharedHandle& group); void removeMetalinkContentTypes(RequestGroup* group); // No throw void executeHookByOptName (const SharedHandle& group, const Option* option, const Pref* pref); // No throw void executeHookByOptName (const RequestGroup* group, const Option* option, const Pref* pref); std::string createSafePath(const std::string& dir, const std::string& filename); std::string encodeNonUtf8(const std::string& s); // Create string safely. If str is NULL, returns empty string. // Otherwise, returns std::string(str). std::string makeString(const char* str); // This function is basically the same with strerror(errNum) but when // strerror returns NULL, this function returns empty string. std::string safeStrerror(int errNum); // Parses sequence [first, last) and find name=value pair delimited by // delim character. If name(and optionally value) is found, returns // pair of iterator which can use as first parameter of next call of // this function, and true. If no name is found, returns the pair of // last and false. template std::pair nextParam (std::string& name, std::string& value, Iterator first, Iterator last, char delim) { Iterator end = last; while(first != end) { last = first; Iterator parmnameFirst = first; Iterator parmnameLast = first; bool eqFound = false; for(; last != end; ++last) { if(*last == delim) { break; } else if(!eqFound && *last == '=') { eqFound = true; parmnameFirst = first; parmnameLast = last; } } std::pair namep; std::pair valuep; if(parmnameFirst == parmnameLast) { if(!eqFound) { parmnameFirst = first; parmnameLast = last; namep = stripIter(parmnameFirst, parmnameLast); } } else { first = parmnameLast+1; namep = stripIter(parmnameFirst, parmnameLast); valuep = stripIter(first, last); } if(last != end) { ++last; } if(namep.first != namep.second) { name.assign(namep.first, namep.second); value.assign(valuep.first, valuep.second); return std::make_pair(last, true); } first = last; } return std::make_pair(end, false); } template SharedHandle copy(const SharedHandle& a) { return SharedHandle(new T(*a.get())); } // This is a bit different from cookie_helper::domainMatch(). If // hostname is numeric host, then returns true if domain == hostname. // That is if domain starts with ".", then returns true if domain is a // suffix of hostname. If domain does not start with ".", then // returns true if domain == hostname. Otherwise returns true. // For example, // // * noProxyDomainMatch("aria2.sf.net", ".sf.net") returns true. // * noProxyDomainMatch("sf.net", ".sf.net") returns false. bool noProxyDomainMatch(const std::string& hostname, const std::string& domain); } // namespace util } // namespace aria2 #endif // D_UTIL_H