aria2/src/ExpatMetalinkProcessor.cc

222 lines
6.5 KiB
C++

/* <!-- copyright */
/*
* aria2 - The high speed download utility
*
* Copyright (C) 2006 Tatsuhiro Tsujikawa
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*
* In addition, as a special exception, the copyright holders give
* permission to link the code of portions of this program with the
* OpenSSL library under certain conditions as described in each
* individual source file, and distribute linked combinations
* including the two.
* You must obey the GNU General Public License in all respects
* for all of the code used other than OpenSSL. If you modify
* file(s) with this exception, you may extend this exception to your
* version of the file(s), but you are not obligated to do so. If you
* do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source
* files in the program, then also delete it here.
*/
/* copyright --> */
#include "ExpatMetalinkProcessor.h"
#include <iostream>
#include <fstream>
#include "DefaultDiskWriter.h"
#include "MetalinkParserStateMachine.h"
#include "Metalinker.h"
#include "MetalinkEntry.h"
#include "util.h"
#include "message.h"
#include "DlAbortEx.h"
#include "MetalinkParserState.h"
#include "A2STR.h"
namespace aria2 {
namespace {
class SessionData {
public:
SharedHandle<MetalinkParserStateMachine> stm_;
std::deque<std::string> charactersStack_;
SessionData(const SharedHandle<MetalinkParserStateMachine>& stm):stm_(stm) {}
};
}
static void splitNsName
(std::string& localname, std::string& prefix, std::string& nsUri,
const std::string& nsName)
{
std::pair<std::string, std::string> nsNamePair;
util::split(nsNamePair, nsName, '\t');
if(nsNamePair.second.empty()) {
localname = nsNamePair.first;
} else {
nsUri = nsNamePair.first;
localname = nsNamePair.second;
}
}
static void mlStartElement(void* userData, const char* nsName, const char** attrs)
{
SessionData* sd = reinterpret_cast<SessionData*>(userData);
std::vector<XmlAttr> xmlAttrs;
if(attrs) {
const char** p = attrs;
while(*p != 0) {
std::string attrNsName = *p++;
if(*p == 0) {
break;
}
std::string value = *p++;
std::pair<std::string, std::string> nsNamePair;
util::split(nsNamePair, attrNsName, '\t');
XmlAttr xa;
if(nsNamePair.second.empty()) {
xa.localname = nsNamePair.first;
} else {
xa.nsUri = nsNamePair.first;
xa.localname = nsNamePair.second;
}
xa.value = value;
xmlAttrs.push_back(xa);
}
}
std::string localname;
std::string prefix;
std::string nsUri;
splitNsName(localname, prefix, nsUri, nsName);
sd->stm_->beginElement(localname, prefix, nsUri, xmlAttrs);
if(sd->stm_->needsCharactersBuffering()) {
sd->charactersStack_.push_front(A2STR::NIL);
}
}
static void mlEndElement(void* userData, const char* nsName)
{
std::string localname;
std::string prefix;
std::string nsUri;
splitNsName(localname, prefix, nsUri, nsName);
SessionData* sd = reinterpret_cast<SessionData*>(userData);
std::string characters;
if(sd->stm_->needsCharactersBuffering()) {
characters = sd->charactersStack_.front();
sd->charactersStack_.pop_front();
}
sd->stm_->endElement(localname, prefix, nsUri, characters);
}
static void mlCharacters(void* userData, const char* ch, int len)
{
SessionData* sd = reinterpret_cast<SessionData*>(userData);
if(sd->stm_->needsCharactersBuffering()) {
sd->charactersStack_.front() += std::string(&ch[0], &ch[len]);
}
}
static XML_Parser createParser(const SharedHandle<SessionData>& sessionData)
{
XML_Parser parser = XML_ParserCreateNS(0, static_cast<const XML_Char>('\t'));
XML_SetUserData(parser, sessionData.get());
XML_SetElementHandler(parser, &mlStartElement, &mlEndElement);
XML_SetCharacterDataHandler(parser, &mlCharacters);
return parser;
}
static void checkError(XML_Parser parser)
{
if(XML_Parse(parser, 0, 0, 1) == XML_STATUS_ERROR) {
throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
}
SessionData* sessionData =
reinterpret_cast<SessionData*>(XML_GetUserData(parser));
const SharedHandle<MetalinkParserStateMachine>& stm = sessionData->stm_;
if(!stm->finished()) {
throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
}
if(!stm->getErrors().empty()) {
throw DL_ABORT_EX(stm->getErrorString());
}
}
SharedHandle<Metalinker>
MetalinkProcessor::parseFile(const std::string& filename)
{
if(filename == DEV_STDIN) {
return parseFile(std::cin);
} else {
std::ifstream infile(filename.c_str(), std::ios::binary);
return parseFile(infile);
}
}
SharedHandle<Metalinker>
MetalinkProcessor::parseFile(std::istream& stream)
{
stm_.reset(new MetalinkParserStateMachine());
char buf[4096];
SharedHandle<SessionData> sessionData(new SessionData(stm_));
XML_Parser parser = createParser(sessionData);
auto_delete<XML_Parser> deleter(parser, XML_ParserFree);
while(stream) {
stream.read(buf, sizeof(buf));
if(XML_Parse(parser, buf, stream.gcount(), 0) == XML_STATUS_ERROR) {
throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
}
}
if(stream.bad()) {
throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
}
checkError(parser);
return stm_->getResult();
}
SharedHandle<Metalinker>
MetalinkProcessor::parseFromBinaryStream(const SharedHandle<BinaryStream>& binaryStream)
{
stm_.reset(new MetalinkParserStateMachine());
ssize_t bufSize = 4096;
unsigned char buf[bufSize];
SharedHandle<SessionData> sessionData(new SessionData(stm_));
XML_Parser parser = createParser(sessionData);
off_t readOffset = 0;
while(1) {
ssize_t res = binaryStream->readData(buf, bufSize, readOffset);
if(res == 0) {
break;
}
if(XML_Parse(parser, reinterpret_cast<const char*>(buf), res, 0) ==
XML_STATUS_ERROR) {
throw DL_ABORT_EX(MSG_CANNOT_PARSE_METALINK);
}
readOffset += res;
}
checkError(parser);
return stm_->getResult();
}
} // namespace aria2