ZLMediaKit/src/Common/Parser.cpp

324 lines
9.0 KiB
C++
Raw Normal View History

2020-04-04 20:30:09 +08:00
/*
* Copyright (c) 2016 The ZLMediaKit project authors. All Rights Reserved.
*
* This file is part of ZLMediaKit(https://github.com/xia-chu/ZLMediaKit).
2020-04-04 20:30:09 +08:00
*
* Use of this source code is governed by MIT license that can be found in the
* LICENSE file in the root of the source tree. All contributing project authors
* may be found in the AUTHORS file in the root of the source tree.
*/
2019-06-28 16:48:02 +08:00
2022-05-13 20:48:22 +08:00
#include <cinttypes>
2019-06-28 16:48:02 +08:00
#include "Parser.h"
2022-05-08 16:33:33 +08:00
#include "macros.h"
#include "Network/sockutil.h"
2019-06-28 16:48:02 +08:00
using namespace std;
using namespace toolkit;
2019-06-28 16:48:02 +08:00
namespace mediakit{
string FindField(const char* buf, const char* start, const char *end ,size_t bufSize) {
2019-06-28 16:48:02 +08:00
if(bufSize <=0 ){
bufSize = strlen(buf);
}
const char *msg_start = buf, *msg_end = buf + bufSize;
size_t len = 0;
2019-06-28 16:48:02 +08:00
if (start != NULL) {
len = strlen(start);
msg_start = strstr(buf, start);
}
if (msg_start == NULL) {
return "";
}
msg_start += len;
if (end != NULL) {
msg_end = strstr(msg_start, end);
if (msg_end == NULL) {
return "";
}
}
return string(msg_start, msg_end);
}
2020-04-20 18:13:45 +08:00
void Parser::Parse(const char *buf) {
//解析
const char *start = buf;
2023-06-10 11:04:52 +08:00
clear();
2020-04-20 18:13:45 +08:00
while (true) {
auto line = FindField(start, NULL, "\r\n");
if (line.size() == 0) {
break;
}
if (start == buf) {
_strMethod = FindField(line.data(), NULL, " ");
auto strFullUrl = FindField(line.data(), " ", " ");
auto args_pos = strFullUrl.find('?');
2020-04-20 18:13:45 +08:00
if (args_pos != string::npos) {
_strUrl = strFullUrl.substr(0, args_pos);
_params = strFullUrl.substr(args_pos + 1);
2020-04-20 18:13:45 +08:00
_mapUrlArgs = parseArgs(_params);
} else {
_strUrl = strFullUrl;
2020-04-20 18:13:45 +08:00
}
_strTail = FindField(line.data(), (strFullUrl + " ").data(), NULL);
2020-04-20 18:13:45 +08:00
} else {
auto field = FindField(line.data(), NULL, ": ");
auto value = FindField(line.data(), ": ", NULL);
if (field.size() != 0) {
_mapHeaders.emplace_force(field, value);
}
}
start = start + line.size() + 2;
if (strncmp(start, "\r\n", 2) == 0) { //协议解析完毕
_strContent = FindField(start, "\r\n", NULL);
break;
}
}
}
2023-06-10 11:04:52 +08:00
const string &Parser::method() const {
2020-04-20 18:13:45 +08:00
return _strMethod;
}
2023-06-10 11:04:52 +08:00
const string &Parser::url() const {
2020-04-20 18:13:45 +08:00
return _strUrl;
}
2023-06-10 11:04:52 +08:00
const std::string &Parser::status() const {
return url();
}
string Parser::fullUrl() const {
if (_params.empty()) {
return _strUrl;
}
return _strUrl + "?" + _params;
2020-04-20 18:13:45 +08:00
}
2023-06-10 11:04:52 +08:00
const string &Parser::protocol() const {
2020-04-20 18:13:45 +08:00
return _strTail;
}
2023-06-10 11:04:52 +08:00
const std::string &Parser::statusStr() const {
return protocol();
}
2020-04-20 18:13:45 +08:00
const string &Parser::operator[](const char *name) const {
auto it = _mapHeaders.find(name);
if (it == _mapHeaders.end()) {
return _strNull;
}
return it->second;
}
2023-06-10 11:04:52 +08:00
const string &Parser::content() const {
2020-04-20 18:13:45 +08:00
return _strContent;
}
2023-06-10 11:04:52 +08:00
void Parser::clear() {
2020-04-20 18:13:45 +08:00
_strMethod.clear();
_strUrl.clear();
_params.clear();
_strTail.clear();
_strContent.clear();
_mapHeaders.clear();
_mapUrlArgs.clear();
}
2023-06-10 11:04:52 +08:00
const string &Parser::params() const {
2020-04-20 18:13:45 +08:00
return _params;
}
2021-09-30 16:10:09 +08:00
void Parser::setUrl(string url) {
this->_strUrl = std::move(url);
2020-04-20 18:13:45 +08:00
}
2021-09-30 16:10:09 +08:00
void Parser::setContent(string content) {
this->_strContent = std::move(content);
2020-04-20 18:13:45 +08:00
}
StrCaseMap &Parser::getHeader() const {
return _mapHeaders;
}
StrCaseMap &Parser::getUrlArgs() const {
return _mapUrlArgs;
}
StrCaseMap Parser::parseArgs(const string &str, const char *pair_delim, const char *key_delim) {
StrCaseMap ret;
auto arg_vec = split(str, pair_delim);
for (string &key_val : arg_vec) {
2021-09-03 17:58:23 +08:00
if (key_val.empty()) {
//忽略
continue;
}
2020-12-27 18:11:10 +08:00
auto key = trim(FindField(key_val.data(), NULL, key_delim));
if (!key.empty()) {
auto val = trim(FindField(key_val.data(), key_delim, NULL));
ret.emplace_force(key, val);
} else {
2021-09-03 18:11:20 +08:00
trim(key_val);
if (!key_val.empty()) {
ret.emplace_force(key_val, "");
}
2020-12-27 18:11:10 +08:00
}
2020-04-20 18:13:45 +08:00
}
return ret;
}
2023-06-10 11:04:52 +08:00
std::string Parser::mergeUrl(const string &base_url, const string &path) {
//以base_url为基础, 合并path路径生成新的url, path支持相对路径和绝对路径
if (base_url.empty()) {
return path;
}
if (path.empty()) {
return base_url;
}
// 如果包含协议,则直接返回
if (path.find("://") != string::npos) {
return path;
}
2020-04-20 18:13:45 +08:00
string protocol = "http://";
size_t protocol_end = base_url.find("://");
if (protocol_end != string::npos) {
protocol = base_url.substr(0, protocol_end + 3);
}
// 如果path以"//"开头,则直接拼接协议
if (path.find("//") == 0) {
return protocol + path.substr(2);
}
string host;
size_t pos = 0;
if (protocol_end != string::npos) {
pos = base_url.find('/', protocol_end + 3);
host = base_url.substr(0, pos);
if (pos == string::npos) {
pos = base_url.size();
} else {
pos++;
}
}
// 如果path以"/"开头,则直接拼接协议和主机
if (path[0] == '/') {
return host + path;
}
vector<string> path_parts;
size_t next_pos = 0;
if (!host.empty()) {
path_parts.emplace_back(host);
}
while ((next_pos = base_url.find('/', pos)) != string::npos) {
path_parts.emplace_back(base_url.substr(pos, next_pos - pos));
pos = next_pos + 1;
}
pos = 0;
while ((next_pos = path.find('/', pos)) != string::npos) {
string part = path.substr(pos, next_pos - pos);
if (part == "..") {
if (!path_parts.empty() && !path_parts.back().empty()) {
if (path_parts.size() > 1 || protocol_end == string::npos) {
path_parts.pop_back();
}
}
} else if (part != "." && !part.empty()) {
path_parts.emplace_back(part);
}
pos = next_pos + 1;
}
string part = path.substr(pos);
if (part != ".." && part != "." && !part.empty()) {
path_parts.emplace_back(part);
}
stringstream final_url;
for (size_t i = 0; i < path_parts.size(); ++i) {
if (i == 0) {
final_url << path_parts[i];
} else {
final_url << '/' << path_parts[i];
}
}
return final_url.str();
}
2022-05-08 16:33:33 +08:00
void RtspUrl::parse(const string &strUrl) {
auto schema = FindField(strUrl.data(), nullptr, "://");
bool is_ssl = strcasecmp(schema.data(), "rtsps") == 0;
//查找"://"与"/"之间的字符串,用于提取用户名密码
auto middle_url = FindField(strUrl.data(), "://", "/");
if (middle_url.empty()) {
middle_url = FindField(strUrl.data(), "://", nullptr);
}
auto pos = middle_url.rfind('@');
if (pos == string::npos) {
//并没有用户名密码
return setup(is_ssl, strUrl, "", "");
}
//包含用户名密码
auto user_pwd = middle_url.substr(0, pos);
auto suffix = strUrl.substr(schema.size() + 3 + pos + 1);
auto url = StrPrinter << "rtsp://" << suffix << endl;
if (user_pwd.find(":") == string::npos) {
return setup(is_ssl, url, user_pwd, "");
}
auto user = FindField(user_pwd.data(), nullptr, ":");
auto pwd = FindField(user_pwd.data(), ":", nullptr);
return setup(is_ssl, url, user, pwd);
}
void RtspUrl::setup(bool is_ssl, const string &url, const string &user, const string &passwd) {
auto ip = FindField(url.data(), "://", "/");
if (ip.empty()) {
ip = split(FindField(url.data(), "://", NULL), "?")[0];
}
uint16_t port = is_ssl ? 322 : 554;
splitUrl(ip, ip, port);
_url = std::move(url);
_user = std::move(user);
_passwd = std::move(passwd);
_host = std::move(ip);
_port = port;
_is_ssl = is_ssl;
}
static void inline checkHost(std::string &host) {
if (host.back() == ']' && host.front() == '[') {
// ipv6去除方括号
host.pop_back();
host.erase(0, 1);
CHECK(SockUtil::is_ipv6(host.data()), "not a ipv6 address:", host);
}
}
void splitUrl(const std::string &url, std::string &host, uint16_t &port) {
2022-05-29 21:36:34 +08:00
CHECK(!url.empty(), "empty url");
2022-05-08 16:33:33 +08:00
auto pos = url.rfind(':');
if (pos == string::npos || url.back() == ']') {
//没有冒号,未指定端口;或者是纯粹的ipv6地址
host = url;
checkHost(host);
return;
}
2022-12-04 16:21:08 +08:00
CHECK(pos > 0, "invalid url:", url);
2022-05-08 16:33:33 +08:00
CHECK(sscanf(url.data() + pos + 1, "%" SCNu16, &port) == 1, "parse port from url failed:", url);
host = url.substr(0, pos);
checkHost(host);
}
#if 0
//测试代码
static onceToken token([](){
string host;
uint16_t port;
splitUrl("www.baidu.com:8880", host, port);
splitUrl("192.168.1.1:8880", host, port);
splitUrl("[::]:8880", host, port);
splitUrl("[fe80::604d:4173:76e9:1009]:8880", host, port);
});
#endif
}//namespace mediakit