/* * Bittorrent Client using Qt and libtorrent. * Copyright (C) 2014 Vladimir Golovnev * Copyright (C) 2006 Ishan Arora and Christophe Dumez * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. * * In addition, as a special exception, the copyright holders give permission to * link this program with the OpenSSL project's "OpenSSL" library (or with * modified versions of it that use the same license as the "OpenSSL" library), * and distribute the linked executables. You must obey the GNU General Public * License in all respects for all of the code used other than "OpenSSL". If you * modify file(s), you may extend this exception to your version of the file(s), * but you are not obligated to do so. If you do not wish to do so, delete this * exception statement from your version. */ #include "requestparser.h" #include #include #include #include #include const QByteArray EOL("\r\n"); const QByteArray EOH("\r\n\r\n"); inline QString unquoted(const QString &str) { if ((str[0] == '\"') && (str[str.length() - 1] == '\"')) return str.mid(1, str.length() - 2); return str; } using namespace Http; RequestParser::ErrorCode RequestParser::parse(const QByteArray &data, Request &request, uint maxContentLength) { return RequestParser(maxContentLength).parseHttpRequest(data, request); } RequestParser::RequestParser(uint maxContentLength) : m_maxContentLength(maxContentLength) { } RequestParser::ErrorCode RequestParser::parseHttpRequest(const QByteArray &data, Request &request) { m_request = Request(); // Parse HTTP request header const int headerEnd = data.indexOf(EOH); if (headerEnd < 0) { qDebug() << Q_FUNC_INFO << "incomplete request"; return IncompleteRequest; } if (!parseHttpHeader(data.left(headerEnd))) { qWarning() << Q_FUNC_INFO << "header parsing error"; return BadRequest; } // Parse HTTP request message if (m_request.headers.contains("content-length")) { int contentLength = m_request.headers["content-length"].toInt(); if (contentLength < 0) { qWarning() << Q_FUNC_INFO << "bad request: content-length is negative"; return BadRequest; } if (contentLength > static_cast(m_maxContentLength)) { qWarning() << Q_FUNC_INFO << "bad request: message too long"; return BadRequest; } QByteArray content = data.mid(headerEnd + EOH.length(), contentLength); if (content.length() < contentLength) { qDebug() << Q_FUNC_INFO << "incomplete request"; return IncompleteRequest; } if ((contentLength > 0) && !parseContent(content)) { qWarning() << Q_FUNC_INFO << "message parsing error"; return BadRequest; } } // qDebug() << Q_FUNC_INFO; // qDebug() << "HTTP Request header:"; // qDebug() << data.left(headerEnd) << "\n"; request = m_request; return NoError; } bool RequestParser::parseStartingLine(const QString &line) { const QRegExp rx("^([A-Z]+)\\s+(\\S+)\\s+HTTP/\\d\\.\\d$"); if (rx.indexIn(line.trimmed()) >= 0) { m_request.method = rx.cap(1); QUrl url = QUrl::fromEncoded(rx.cap(2).toLatin1()); m_request.path = url.path(); // Path // Parse GET parameters QListIterator > i(QUrlQuery(url).queryItems()); while (i.hasNext()) { QPair pair = i.next(); m_request.gets[pair.first] = pair.second; } return true; } qWarning() << Q_FUNC_INFO << "invalid http header:" << line; return false; } bool RequestParser::parseHeaderLine(const QString &line, QPair &out) { int i = line.indexOf(QLatin1Char(':')); if (i == -1) { qWarning() << Q_FUNC_INFO << "invalid http header:" << line; return false; } out = qMakePair(line.left(i).trimmed().toLower(), line.mid(i + 1).trimmed()); return true; } bool RequestParser::parseHttpHeader(const QByteArray &data) { QString str = QString::fromUtf8(data); QStringList lines = str.trimmed().split(EOL); QStringList headerLines; foreach (const QString &line, lines) { if (line[0].isSpace()) { // header line continuation if (!headerLines.isEmpty()) { // really continuation headerLines.last() += QLatin1Char(' '); headerLines.last() += line.trimmed(); } } else { headerLines.append(line); } } if (headerLines.isEmpty()) return false; // Empty header QStringList::Iterator it = headerLines.begin(); if (!parseStartingLine(*it)) return false; ++it; for (; it != headerLines.end(); ++it) { QPair header; if (!parseHeaderLine(*it, header)) return false; m_request.headers[header.first] = header.second; } return true; } QList RequestParser::splitMultipartData(const QByteArray &data, const QByteArray &boundary) { QList ret; QByteArray sep = boundary + EOL; const int sepLength = sep.size(); int start = 0, end = 0; if ((end = data.indexOf(sep, start)) >= 0) { start = end + sepLength; // skip first boundary while ((end = data.indexOf(sep, start)) >= 0) { ret << data.mid(start, end - EOL.length() - start); start = end + sepLength; } // last or single part sep = boundary + "--" + EOL; if ((end = data.indexOf(sep, start)) >= 0) ret << data.mid(start, end - EOL.length() - start); } return ret; } bool RequestParser::parseContent(const QByteArray &data) { // Parse message content qDebug() << Q_FUNC_INFO << "Content-Length: " << m_request.headers["content-length"]; qDebug() << Q_FUNC_INFO << "data.size(): " << data.size(); // Parse url-encoded POST data if (m_request.headers["content-type"].startsWith("application/x-www-form-urlencoded")) { QUrl url; url.setQuery(data); QListIterator > i(QUrlQuery(url).queryItems(QUrl::FullyDecoded)); while (i.hasNext()) { QPair pair = i.next(); m_request.posts[pair.first] = pair.second; } return true; } // Parse multipart/form data (torrent file) /** data has the following format (if boundary is "cH2ae0GI3KM7GI3Ij5ae0ei4Ij5Ij5") --cH2ae0GI3KM7GI3Ij5ae0ei4Ij5Ij5 Content-Disposition: form-data; name=\"Filename\" PB020344.torrent --cH2ae0GI3KM7GI3Ij5ae0ei4Ij5Ij5 Content-Disposition: form-data; name=\"torrentfile"; filename=\"PB020344.torrent\" Content-Type: application/x-bittorrent BINARY DATA IS HERE --cH2ae0GI3KM7GI3Ij5ae0ei4Ij5Ij5 Content-Disposition: form-data; name=\"Upload\" Submit Query --cH2ae0GI3KM7GI3Ij5ae0ei4Ij5Ij5-- **/ QString contentType = m_request.headers["content-type"]; if (contentType.startsWith("multipart/form-data")) { const QRegExp boundaryRegexQuoted("boundary=\"([ \\w'()+,-\\./:=\\?]+)\""); const QRegExp boundaryRegexNotQuoted("boundary=([\\w'()+,-\\./:=\\?]+)"); QByteArray boundary; if (boundaryRegexQuoted.indexIn(contentType) < 0) { if (boundaryRegexNotQuoted.indexIn(contentType) < 0) { qWarning() << "Could not find boundary in multipart/form-data header!"; return false; } else { boundary = "--" + boundaryRegexNotQuoted.cap(1).toLatin1(); } } else { boundary = "--" + boundaryRegexQuoted.cap(1).toLatin1(); } qDebug() << "Boundary is " << boundary; QList parts = splitMultipartData(data, boundary); qDebug() << parts.size() << "parts in data"; foreach (const QByteArray& part, parts) { if (!parseFormData(part)) return false; } return true; } qWarning() << Q_FUNC_INFO << "unknown content type:" << qPrintable(contentType); return false; } bool RequestParser::parseFormData(const QByteArray &data) { // Parse form data header const int headerEnd = data.indexOf(EOH); if (headerEnd < 0) { qDebug() << "Invalid form data: \n" << data; return false; } QString headerStr = QString::fromUtf8(data.left(headerEnd)); QStringList lines = headerStr.trimmed().split(EOL); QStringMap headers; foreach (const QString& line, lines) { QPair header; if (!parseHeaderLine(line, header)) return false; headers[header.first] = header.second; } QStringMap disposition; if (!headers.contains("content-disposition") || !parseHeaderValue(headers["content-disposition"], disposition) || !disposition.contains("name")) { qDebug() << "Invalid form data header: \n" << headerStr; return false; } if (disposition.contains("filename")) { UploadedFile ufile; ufile.filename = disposition["filename"]; ufile.type = disposition["content-type"]; ufile.data = data.mid(headerEnd + EOH.length()); m_request.files.append(ufile); } else { m_request.posts[disposition["name"]] = QString::fromUtf8(data.mid(headerEnd + EOH.length())); } return true; } bool RequestParser::parseHeaderValue(const QString &value, QStringMap &out) { int pos = value.indexOf(QLatin1Char(';')); if (pos == -1) { out[""] = value.trimmed(); return true; } out[""] = value.left(pos).trimmed(); QRegExp rx(";\\s*([^=;\"]+)\\s*=\\s*(\"[^\"]*\"|[^\";\\s]+)\\s*"); while (rx.indexIn(value, pos) == pos) { out[rx.cap(1).trimmed()] = unquoted(rx.cap(2)); pos += rx.cap(0).length(); } if (pos != value.length()) return false; return true; }