aria2/src/cookie_helper.cc

400 lines
11 KiB
C++

/* <!-- copyright */
/*
* aria2 - The high speed download utility
*
* Copyright (C) 2010 Tatsuhiro Tsujikawa
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*
* In addition, as a special exception, the copyright holders give
* permission to link the code of portions of this program with the
* OpenSSL library under certain conditions as described in each
* individual source file, and distribute linked combinations
* including the two.
* You must obey the GNU General Public License in all respects
* for all of the code used other than OpenSSL. If you modify
* file(s) with this exception, you may extend this exception to your
* version of the file(s), but you are not obligated to do so. If you
* do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source
* files in the program, then also delete it here.
*/
/* copyright --> */
#include "cookie_helper.h"
#include <cstring>
#include <vector>
#include <limits>
#include "util.h"
#include "array_fun.h"
#include "Cookie.h"
#include "a2functional.h"
namespace aria2 {
namespace cookie {
namespace {
bool isDelimiter(unsigned char c)
{
return c == 0x09u || in(c, 0x20u, 0x2fu) || in(c, 0x3bu, 0x40u) ||
in(c, 0x5bu, 0x60u) || in(c, 0x7bu, 0x7eu);
}
} // namespace
namespace {
std::string::const_iterator getNextDigit
(std::string::const_iterator first, std::string::const_iterator last)
{
for(; first != last && in(static_cast<unsigned char>(*first), 0x30u, 0x39u);
++first);
return first;
}
} // namespace
bool parseDate(time_t& time, const std::string& cookieDate)
{
// Following algorithm is described in
// http://tools.ietf.org/html/rfc6265#section-5.1.1
std::vector<std::string> dateTokens;
for(std::string::const_iterator i = cookieDate.begin(),
eoi = cookieDate.end(); i != eoi;) {
unsigned char c = *i;
if(isDelimiter(c)) {
++i;
continue;
}
std::string::const_iterator s = i;
for(; s != eoi && !isDelimiter(static_cast<unsigned char>(*s)); ++s);
dateTokens.push_back(std::string(i, s));
i = s;
}
int dayOfMonth = 0;
bool foundDayOfMonth = false;
int month = 0;
bool foundMonth = false;
int year = 0;
bool foundYear = false;
int hour = 0;
int minute = 0;
int second = 0;
bool foundTime = false;
for(std::vector<std::string>::const_iterator i = dateTokens.begin(),
eoi = dateTokens.end(); i != eoi; ++i) {
if(!foundTime) {
std::string::const_iterator hEnd;
std::string::const_iterator mEnd;
std::string::const_iterator sEnd;
hEnd = getNextDigit((*i).begin(),(*i).end());
size_t len = std::distance((*i).begin(), hEnd);
if(len == 0 || 2 < len || hEnd == (*i).end() || *hEnd != ':') {
goto NOT_TIME;
}
mEnd = getNextDigit(hEnd+1, (*i).end());
len = std::distance(hEnd+1, mEnd);
if(len == 0 || 2 < len || mEnd == (*i).end() || *mEnd != ':') {
goto NOT_TIME;
}
sEnd = getNextDigit(mEnd+1, (*i).end());
len = std::distance(mEnd+1, sEnd);
if(len == 0 || 2 < len) {
goto NOT_TIME;
}
foundTime = true;
hour = util::parseInt(std::string((*i).begin(), hEnd));
minute = util::parseInt(std::string(hEnd+1, mEnd));
second = util::parseInt(std::string(mEnd+1, sEnd));
continue;
NOT_TIME:
;
}
if(!foundDayOfMonth) {
std::string::const_iterator j = getNextDigit((*i).begin(), (*i).end());
size_t len = std::distance((*i).begin(), j);
if(1 <= len && len <= 2) {
foundDayOfMonth = true;
dayOfMonth = util::parseInt(std::string((*i).begin(), j));
continue;
}
}
if(!foundMonth) {
static std::string MONTH[] = {
"jan", "feb", "mar", "apr",
"may", "jun", "jul", "aug",
"sep", "oct", "nov", "dec" };
if((*i).size() >= 3) {
std::string head = (*i).substr(0, 3);
util::lowercase(head);
std::string* mptr = std::find(vbegin(MONTH), vend(MONTH), head);
if(mptr != vend(MONTH)) {
foundMonth = true;
month = std::distance(vbegin(MONTH), mptr)+1;
continue;
}
}
}
if(!foundYear) {
std::string::const_iterator j = getNextDigit((*i).begin(), (*i).end());
size_t len = std::distance((*i).begin(), j);
if(1 <= len && len <= 4) {
foundYear = true;
year = util::parseInt(std::string((*i).begin(), j));
continue;
}
}
}
if(in(year, 70, 99)) {
year += 1900;
} else if(in(year, 0, 69)) {
year += 2000;
}
if(!foundDayOfMonth || !foundMonth || !foundYear || !foundTime ||
!in(dayOfMonth, 1, 31) || year < 1601 || hour > 23 ||
minute > 59 || second > 59) {
return false;
}
if((month == 4 || month == 6 || month == 9 || month == 11) &&
dayOfMonth > 30) {
return false;
}
if(month == 2) {
if((year%4 == 0 && year%100 != 0) || year%400 == 0) {
if(dayOfMonth > 29) {
return false;
}
} else if(dayOfMonth > 28) {
return false;
}
}
tm timespec;
memset(&timespec, 0, sizeof(timespec));
timespec.tm_sec = second;
timespec.tm_min = minute;
timespec.tm_hour = hour;
timespec.tm_mday = dayOfMonth;
timespec.tm_mon = month-1;
timespec.tm_year = year-1900;
time = timegm(&timespec);
return time != -1;
}
bool parse
(Cookie& cookie,
const std::string& cookieStr,
const std::string& requestHost,
const std::string& defaultPath,
time_t creationTime)
{
// This implementation is based on the algorithm listed in
// http://tools.ietf.org/html/rfc6265
std::string::const_iterator nvEnd = cookieStr.begin();
std::string::const_iterator end = cookieStr.end();
for(; nvEnd != end && *nvEnd != ';'; ++nvEnd);
std::string::const_iterator eq = cookieStr.begin();
for(; eq != nvEnd && *eq != '='; ++eq);
if(eq == nvEnd) {
return false;
}
std::string cookieName = util::stripIter(cookieStr.begin(), eq);
if(cookieName.empty()) {
return false;
}
std::string cookieValue = util::stripIter(eq+1, nvEnd);
cookieValue = util::strip(cookieValue, "\"");
time_t expiryTime = 0;
bool foundExpires = false;
bool persistent = false;
time_t maxAge = 0;
bool foundMaxAge = false;
std::string cookieDomain;
bool hostOnly = false;
std::string cookiePath;
bool secure = false;
bool httpOnly = false;
if(nvEnd != end) {
++nvEnd;
}
for(std::string::const_iterator i = nvEnd; i != end;) {
std::string::const_iterator j = std::find(i, end, ';');
std::string::const_iterator eq = std::find(i, j, '=');
std::string attrName = util::stripIter(i, eq);
util::lowercase(attrName);
std::string attrValue;
if(eq != j) {
attrValue = util::stripIter(eq+1, j);
}
i = j;
if(j != end) {
++i;
}
if(attrName == "expires") {
if(parseDate(expiryTime, attrValue)) {
foundExpires = true;
} else {
return false;
}
} else if(attrName == "max-age") {
if(attrValue.empty() ||
(!in(static_cast<unsigned char>(attrValue[0]), 0x30u, 0x39u) &&
attrValue[0] != '-')) {
return false;
}
for(std::string::const_iterator s = attrValue.begin()+1,
eos = attrValue.end(); s != eos; ++s) {
if(!in(static_cast<unsigned char>(*s), 0x30u, 0x39u)) {
return false;
}
}
int64_t delta;
if(util::parseLLIntNoThrow(delta, attrValue)) {
foundMaxAge = true;
if(delta <= 0) {
maxAge = 0;
} else {
int64_t n = creationTime;
n += delta;
if(n < 0 || std::numeric_limits<time_t>::max() < n) {
maxAge = std::numeric_limits<time_t>::max();
} else {
maxAge = n;
}
}
} else {
return false;
}
} else if(attrName == "domain") {
if(attrValue.empty()) {
return false;
}
std::string::const_iterator noDot = attrValue.begin();
std::string::const_iterator end = attrValue.end();
for(; noDot != end && *noDot == '.'; ++noDot);
if(noDot == end) {
return false;
}
cookieDomain = std::string(noDot, end);
} else if(attrName == "path") {
if(goodPath(attrValue)) {
cookiePath = attrValue;
} else {
cookiePath = defaultPath;
}
} else if(attrName == "secure") {
secure = true;
} else if(attrName == "httponly") {
httpOnly = true;
}
}
if(foundMaxAge) {
expiryTime = maxAge;
persistent = true;
} else if(foundExpires) {
persistent = true;
} else {
expiryTime = std::numeric_limits<time_t>::max();
persistent = false;
}
std::string canonicalizedHost = canonicalizeHost(requestHost);
if(cookieDomain.empty()) {
hostOnly = true;
cookieDomain = canonicalizedHost;
} else if(domainMatch(canonicalizedHost, cookieDomain)) {
hostOnly = util::isNumericHost(canonicalizedHost);
} else {
return false;
}
if(cookiePath.empty()) {
cookiePath = defaultPath;
}
cookie.setName(cookieName);
cookie.setValue(cookieValue);
cookie.setExpiryTime(expiryTime);
cookie.setPersistent(persistent);
cookie.setDomain(cookieDomain);
cookie.setHostOnly(hostOnly);
cookie.setPath(cookiePath);
cookie.setSecure(secure);
cookie.setHttpOnly(httpOnly);
cookie.setCreationTime(creationTime);
cookie.setLastAccessTime(creationTime);
return true;
}
std::string removePrecedingDots(const std::string& host)
{
std::string::const_iterator noDot = host.begin();
std::string::const_iterator end = host.end();
for(; noDot != end && *noDot == '.'; ++noDot);
return std::string(noDot, end);
}
bool goodPath(const std::string& cookiePath)
{
return !cookiePath.empty() && cookiePath[0] == '/';
}
std::string canonicalizeHost(const std::string& host)
{
std::string ch = util::toLower(host);
return ch;
}
bool domainMatch(const std::string& requestHost, const std::string& domain)
{
return requestHost == domain ||
(util::endsWith(requestHost, domain) &&
requestHost[requestHost.size()-domain.size()-1] == '.' &&
!util::isNumericHost(requestHost));
}
bool pathMatch(const std::string& requestPath, const std::string& path)
{
return requestPath == path ||
(util::startsWith(requestPath, path) &&
(path[path.size()-1] == '/' || requestPath[path.size()] == '/'));
}
std::string reverseDomainLevel(const std::string& domain)
{
std::string r;
for(std::string::const_iterator i = domain.begin(), eoi = domain.end();
i != eoi;) {
std::string::const_iterator j = std::find(i, eoi, '.');
r.insert(r.begin(), '.');
r.insert(r.begin(), i, j);
i = j;
if(j != eoi) {
++i;
}
}
if(!r.empty()) {
r.erase(r.size()-1, 1);
}
return r;
}
} // namespace cookie
} // namespace aria2