mirror of https://github.com/aria2/aria2
544 lines
14 KiB
C++
544 lines
14 KiB
C++
/* <!-- copyright */
|
|
/*
|
|
* aria2 - The high speed download utility
|
|
*
|
|
* Copyright (C) 2013 Tatsuhiro Tsujikawa
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*
|
|
* In addition, as a special exception, the copyright holders give
|
|
* permission to link the code of portions of this program with the
|
|
* OpenSSL library under certain conditions as described in each
|
|
* individual source file, and distribute linked combinations
|
|
* including the two.
|
|
* You must obey the GNU General Public License in all respects
|
|
* for all of the code used other than OpenSSL. If you modify
|
|
* file(s) with this exception, you may extend this exception to your
|
|
* version of the file(s), but you are not obligated to do so. If you
|
|
* do not wish to do so, delete this exception statement from your
|
|
* version. If you delete this exception statement from all source
|
|
* files in the program, then also delete it here.
|
|
*/
|
|
/* copyright --> */
|
|
#include "CookieStorage.h"
|
|
|
|
#include <cstring>
|
|
#include <cstdio>
|
|
#include <algorithm>
|
|
|
|
#include "util.h"
|
|
#include "LogFactory.h"
|
|
#include "Logger.h"
|
|
#include "DlAbortEx.h"
|
|
#include "fmt.h"
|
|
#include "NsCookieParser.h"
|
|
#include "File.h"
|
|
#include "a2functional.h"
|
|
#include "A2STR.h"
|
|
#include "message.h"
|
|
#include "cookie_helper.h"
|
|
#include "BufferedFile.h"
|
|
#ifdef HAVE_SQLITE3
|
|
# include "Sqlite3CookieParserImpl.h"
|
|
#endif // HAVE_SQLITE3
|
|
|
|
namespace aria2 {
|
|
|
|
DomainNode::DomainNode(std::string label, DomainNode* parent)
|
|
: label_{std::move(label)}, parent_{parent}, lastAccessTime_{0},
|
|
lruAccessTime_{0}, inLru_{false}
|
|
{}
|
|
|
|
void DomainNode::findCookie
|
|
(std::vector<const Cookie*>& out,
|
|
const std::string& requestHost,
|
|
const std::string& requestPath,
|
|
time_t now, bool secure)
|
|
{
|
|
if(cookies_) {
|
|
for(auto& c : *cookies_) {
|
|
if(c->match(requestHost, requestPath, now, secure)) {
|
|
c->setLastAccessTime(now);
|
|
out.push_back(c.get());
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool DomainNode::addCookie(std::unique_ptr<Cookie> cookie, time_t now)
|
|
{
|
|
using namespace std::placeholders;
|
|
setLastAccessTime(now);
|
|
if(!cookies_) {
|
|
if(cookie->isExpired(now)) {
|
|
return false;
|
|
} else {
|
|
cookies_ = make_unique<std::deque<std::unique_ptr<Cookie>>>();
|
|
cookies_->push_back(std::move(cookie));
|
|
return true;
|
|
}
|
|
}
|
|
|
|
auto i = std::find_if(std::begin(*cookies_), std::end(*cookies_),
|
|
[&](const std::unique_ptr<Cookie>& c)
|
|
{
|
|
return *c == *cookie;
|
|
});
|
|
if(i == std::end(*cookies_)) {
|
|
if(cookie->isExpired(now)) {
|
|
return false;
|
|
} else {
|
|
if(cookies_->size() >= CookieStorage::MAX_COOKIE_PER_DOMAIN) {
|
|
cookies_->erase
|
|
(std::remove_if(std::begin(*cookies_), std::end(*cookies_),
|
|
std::bind(&Cookie::isExpired, _1, now)),
|
|
std::end(*cookies_));
|
|
if(cookies_->size() >= CookieStorage::MAX_COOKIE_PER_DOMAIN) {
|
|
auto m = std::min_element(std::begin(*cookies_), std::end(*cookies_),
|
|
[](const std::unique_ptr<Cookie>& lhs,
|
|
const std::unique_ptr<Cookie>& rhs)
|
|
{
|
|
return lhs->getLastAccessTime() <
|
|
rhs->getLastAccessTime();
|
|
});
|
|
*m = std::move(cookie);
|
|
} else {
|
|
cookies_->push_back(std::move(cookie));
|
|
}
|
|
} else {
|
|
cookies_->push_back(std::move(cookie));
|
|
}
|
|
return true;
|
|
}
|
|
} else if(cookie->isExpired(now)) {
|
|
cookies_->erase(i);
|
|
return false;
|
|
} else {
|
|
*i = std::move(cookie);
|
|
return true;
|
|
}
|
|
}
|
|
|
|
bool DomainNode::contains(const Cookie& cookie) const
|
|
{
|
|
if(cookies_) {
|
|
for(auto& i : *cookies_) {
|
|
if(*i == cookie) {
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
bool DomainNode::writeCookie(BufferedFile& fp) const
|
|
{
|
|
if(cookies_) {
|
|
for(const auto& c : *cookies_) {
|
|
std::string data = c->toNsCookieFormat();
|
|
data += "\n";
|
|
if(fp.write(data.data(), data.size()) != data.size()) {
|
|
return false;
|
|
}
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
size_t DomainNode::countCookie() const
|
|
{
|
|
if(cookies_) {
|
|
return cookies_->size();
|
|
} else {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
void DomainNode::clearCookie()
|
|
{
|
|
cookies_->clear();
|
|
}
|
|
|
|
void DomainNode::setLastAccessTime(time_t lastAccessTime)
|
|
{
|
|
lastAccessTime_ = lastAccessTime;
|
|
}
|
|
|
|
time_t DomainNode::getLastAccessTime() const
|
|
{
|
|
return lastAccessTime_;
|
|
}
|
|
|
|
void DomainNode::setLruAccessTime(time_t t)
|
|
{
|
|
lruAccessTime_ = t;
|
|
}
|
|
|
|
time_t DomainNode::getLruAccessTime() const
|
|
{
|
|
return lruAccessTime_;
|
|
}
|
|
|
|
bool DomainNode::empty() const
|
|
{
|
|
return !cookies_ || cookies_->empty();
|
|
}
|
|
|
|
bool DomainNode::hasNext() const
|
|
{
|
|
return !next_.empty();
|
|
}
|
|
|
|
DomainNode* DomainNode::getParent() const
|
|
{
|
|
return parent_;
|
|
}
|
|
|
|
void DomainNode::removeNode(DomainNode* node)
|
|
{
|
|
next_.erase(node->getLabel());
|
|
}
|
|
|
|
DomainNode* DomainNode::findNext(const std::string& label) const
|
|
{
|
|
auto i = next_.find(label);
|
|
if(i == std::end(next_)) {
|
|
return nullptr;
|
|
} else {
|
|
return (*i).second.get();
|
|
}
|
|
}
|
|
|
|
DomainNode* DomainNode::addNext(std::string label,
|
|
std::unique_ptr<DomainNode> node)
|
|
{
|
|
auto& res = next_[std::move(label)] = std::move(node);
|
|
return res.get();
|
|
}
|
|
|
|
const std::string& DomainNode::getLabel() const
|
|
{
|
|
return label_;
|
|
}
|
|
|
|
bool DomainNode::getInLru() const
|
|
{
|
|
return inLru_;
|
|
}
|
|
|
|
void DomainNode::setInLru(bool f)
|
|
{
|
|
inLru_ = f;
|
|
}
|
|
|
|
CookieStorage::CookieStorage()
|
|
: rootNode_{make_unique<DomainNode>("", nullptr)}
|
|
{}
|
|
|
|
namespace {
|
|
// See CookieStorageTest::testDomainIsFull() in CookieStorageTest.cc
|
|
const size_t DOMAIN_EVICTION_TRIGGER = 2000;
|
|
|
|
const double DOMAIN_EVICTION_RATE = 0.1;
|
|
} // namespace
|
|
|
|
namespace {
|
|
std::vector<std::string> splitDomainLabel(const std::string& domain)
|
|
{
|
|
auto labels = std::vector<std::string>{};
|
|
if(util::isNumericHost(domain)) {
|
|
labels.push_back(domain);
|
|
} else {
|
|
util::split(std::begin(domain), std::end(domain),
|
|
std::back_inserter(labels), '.');
|
|
}
|
|
return labels;
|
|
}
|
|
} // namespace
|
|
|
|
|
|
size_t CookieStorage::getLruTrackerSize() const
|
|
{
|
|
return lruTracker_.size();
|
|
}
|
|
|
|
void CookieStorage::evictNode(size_t delnum)
|
|
{
|
|
for(; delnum > 0 && !lruTracker_.empty(); --delnum) {
|
|
auto node = (*lruTracker_.begin()).second;
|
|
lruTracker_.erase(lruTracker_.begin());
|
|
node->setInLru(false);
|
|
node->clearCookie();
|
|
while(node->empty() && !node->hasNext()) {
|
|
auto parent = node->getParent();
|
|
parent->removeNode(node);
|
|
if(!parent->empty() || parent->hasNext() ||
|
|
parent == rootNode_.get()) {
|
|
break;
|
|
}
|
|
node = parent;
|
|
if(node->getInLru()) {
|
|
lruTracker_.erase({node->getLruAccessTime(), node});
|
|
node->setInLru(false);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
const DomainNode* CookieStorage::getRootNode() const
|
|
{
|
|
return rootNode_.get();
|
|
}
|
|
|
|
bool CookieStorage::store(std::unique_ptr<Cookie> cookie, time_t now)
|
|
{
|
|
if(lruTracker_.size() >= DOMAIN_EVICTION_TRIGGER) {
|
|
auto delnum = size_t(lruTracker_.size()*DOMAIN_EVICTION_RATE);
|
|
evictNode(delnum);
|
|
}
|
|
auto labels = splitDomainLabel(cookie->getDomain());
|
|
auto node = rootNode_.get();
|
|
for(auto i = labels.rbegin(), eoi = labels.rend(); i != eoi; ++i) {
|
|
auto nextNode = node->findNext(*i);
|
|
if(nextNode) {
|
|
node = nextNode;
|
|
} else {
|
|
node = node->addNext(*i, make_unique<DomainNode>(*i, node));
|
|
}
|
|
}
|
|
bool ok = node->addCookie(std::move(cookie), now);
|
|
if(ok) {
|
|
updateLru(node, now);
|
|
}
|
|
return ok;
|
|
}
|
|
|
|
void CookieStorage::updateLru(DomainNode* node, time_t now)
|
|
{
|
|
if(node->getInLru()) {
|
|
lruTracker_.erase({node->getLruAccessTime(), node});
|
|
} else {
|
|
node->setInLru(true);
|
|
}
|
|
node->setLruAccessTime(now);
|
|
lruTracker_.insert({node->getLruAccessTime(), node});
|
|
}
|
|
|
|
bool CookieStorage::parseAndStore
|
|
(const std::string& setCookieString,
|
|
const std::string& requestHost,
|
|
const std::string& defaultPath,
|
|
time_t now)
|
|
{
|
|
auto cookie = cookie::parse(setCookieString, requestHost, defaultPath, now);
|
|
return cookie && store(std::move(cookie), now);
|
|
}
|
|
|
|
namespace {
|
|
struct CookiePathDivider {
|
|
const Cookie* cookie_;
|
|
int pathDepth_;
|
|
CookiePathDivider(const Cookie* cookie):cookie_(cookie), pathDepth_(0)
|
|
{
|
|
const std::string& path = cookie_->getPath();
|
|
if(!path.empty()) {
|
|
for(size_t i = 1, len = path.size(); i < len; ++i) {
|
|
if(path[i] == '/' && path[i-1] != '/') {
|
|
++pathDepth_;
|
|
}
|
|
}
|
|
if(path[path.size()-1] != '/') {
|
|
++pathDepth_;
|
|
}
|
|
}
|
|
}
|
|
};
|
|
} // namespace
|
|
|
|
namespace {
|
|
class CookiePathDividerConverter {
|
|
public:
|
|
CookiePathDivider operator()(const Cookie* cookie) const
|
|
{
|
|
return CookiePathDivider(cookie);
|
|
}
|
|
|
|
const Cookie* operator()(const CookiePathDivider& cookiePathDivider) const
|
|
{
|
|
return cookiePathDivider.cookie_;
|
|
}
|
|
};
|
|
} // namespace
|
|
|
|
namespace {
|
|
class OrderByPathDepthDesc:public std::binary_function<Cookie, Cookie, bool> {
|
|
public:
|
|
bool operator()
|
|
(const CookiePathDivider& lhs, const CookiePathDivider& rhs) const
|
|
{
|
|
// From http://tools.ietf.org/html/rfc6265#section-5.4:
|
|
// 2. The user agent SHOULD sort the cookie-list in the following
|
|
// order:
|
|
//
|
|
// * Cookies with longer paths are listed before cookies with
|
|
// shorter paths.
|
|
//
|
|
// * Among cookies that have equal-length path fields, cookies with
|
|
// earlier creation-times are listed before cookies with later
|
|
// creation-times.
|
|
return lhs.pathDepth_ > rhs.pathDepth_ ||
|
|
(!(rhs.pathDepth_ > lhs.pathDepth_) &&
|
|
lhs.cookie_->getCreationTime() < rhs.cookie_->getCreationTime());
|
|
}
|
|
};
|
|
} // namespace
|
|
|
|
namespace {
|
|
DomainNode* findNode(const std::string& domain, DomainNode* node)
|
|
{
|
|
auto labels = splitDomainLabel(domain);
|
|
for(auto i = labels.rbegin(), eoi = labels.rend(); i != eoi && node; ++i) {
|
|
node = node->findNext(*i);
|
|
}
|
|
return node;
|
|
}
|
|
} // namespace
|
|
|
|
bool CookieStorage::contains(const Cookie& cookie) const
|
|
{
|
|
auto node = findNode(cookie.getDomain(), rootNode_.get());
|
|
return node && node->contains(cookie);
|
|
}
|
|
|
|
std::vector<const Cookie*> CookieStorage::criteriaFind
|
|
(const std::string& requestHost,
|
|
const std::string& requestPath,
|
|
time_t now,
|
|
bool secure)
|
|
{
|
|
auto res = std::vector<const Cookie*>{};
|
|
if(requestPath.empty()) {
|
|
return res;
|
|
}
|
|
auto labels = splitDomainLabel(requestHost);
|
|
auto node = rootNode_.get();
|
|
for (auto i = labels.rbegin(), eoi = labels.rend(); i != eoi; ++i) {
|
|
auto nextNode = node->findNext(*i);
|
|
if(!nextNode) {
|
|
break;
|
|
}
|
|
nextNode->setLastAccessTime(now);
|
|
if(nextNode->getInLru()) {
|
|
updateLru(nextNode, now);
|
|
}
|
|
nextNode->findCookie(res, requestHost, requestPath, now, secure);
|
|
node = nextNode;
|
|
}
|
|
auto divs = std::vector<CookiePathDivider>{};
|
|
std::transform(std::begin(res), std::end(res), std::back_inserter(divs),
|
|
CookiePathDividerConverter{});
|
|
std::sort(std::begin(divs), std::end(divs), OrderByPathDepthDesc{});
|
|
std::transform(std::begin(divs), std::end(divs), std::begin(res),
|
|
CookiePathDividerConverter{});
|
|
return res;
|
|
}
|
|
|
|
size_t CookieStorage::size() const
|
|
{
|
|
size_t n = 0;
|
|
for(auto& p : lruTracker_) {
|
|
n += p.second->countCookie();
|
|
}
|
|
return n;
|
|
}
|
|
|
|
bool CookieStorage::load(const std::string& filename, time_t now)
|
|
{
|
|
char header[16]; // "SQLite format 3" plus \0
|
|
size_t headlen;
|
|
{
|
|
BufferedFile fp{filename.c_str(), BufferedFile::READ};
|
|
if(!fp) {
|
|
A2_LOG_ERROR(fmt("Failed to open cookie file %s", filename.c_str()));
|
|
return false;
|
|
}
|
|
headlen = fp.read(header, sizeof(header));
|
|
}
|
|
try {
|
|
if(headlen == 16 && memcmp(header, "SQLite format 3\0", 16) == 0) {
|
|
#ifdef HAVE_SQLITE3
|
|
try {
|
|
auto cookies = Sqlite3MozCookieParser(filename).parse();
|
|
storeCookies(std::make_move_iterator(std::begin(cookies)),
|
|
std::make_move_iterator(std::end(cookies)), now);
|
|
} catch(RecoverableException& e) {
|
|
A2_LOG_INFO_EX(EX_EXCEPTION_CAUGHT, e);
|
|
A2_LOG_INFO("This does not look like Firefox3 cookie file."
|
|
" Retrying, assuming it is Chromium cookie file.");
|
|
// Try chrome cookie format
|
|
auto cookies = Sqlite3ChromiumCookieParser(filename).parse();
|
|
storeCookies(std::make_move_iterator(std::begin(cookies)),
|
|
std::make_move_iterator(std::end(cookies)), now);
|
|
}
|
|
#else // !HAVE_SQLITE3
|
|
throw DL_ABORT_EX
|
|
("Cannot read SQLite3 database because SQLite3 support is disabled by"
|
|
" configuration.");
|
|
#endif // !HAVE_SQLITE3
|
|
} else {
|
|
auto cookies = NsCookieParser().parse(filename, now);
|
|
storeCookies(std::make_move_iterator(std::begin(cookies)),
|
|
std::make_move_iterator(std::end(cookies)), now);
|
|
}
|
|
return true;
|
|
} catch(RecoverableException& e) {
|
|
A2_LOG_ERROR(fmt("Failed to load cookies from %s", filename.c_str()));
|
|
return false;
|
|
}
|
|
}
|
|
|
|
bool CookieStorage::saveNsFormat(const std::string& filename)
|
|
{
|
|
auto tempfilename = filename;
|
|
tempfilename += "__temp";
|
|
{
|
|
BufferedFile fp{tempfilename.c_str(), BufferedFile::WRITE};
|
|
if(!fp) {
|
|
A2_LOG_ERROR(fmt("Cannot create cookie file %s", filename.c_str()));
|
|
return false;
|
|
}
|
|
for(auto& p : lruTracker_) {
|
|
if(!p.second->writeCookie(fp)) {
|
|
A2_LOG_ERROR(fmt("Failed to save cookies to %s", filename.c_str()));
|
|
return false;
|
|
}
|
|
}
|
|
if(fp.close() == EOF) {
|
|
A2_LOG_ERROR(fmt("Failed to save cookies to %s", filename.c_str()));
|
|
return false;
|
|
}
|
|
}
|
|
if(File(tempfilename).renameTo(filename)) {
|
|
return true;
|
|
} else {
|
|
A2_LOG_ERROR(fmt("Could not rename file %s as %s",
|
|
tempfilename.c_str(),
|
|
filename.c_str()));
|
|
return false;
|
|
}
|
|
}
|
|
|
|
} // namespace aria2
|