2017-10-09 22:11:01 +08:00
|
|
|
|
/*
|
2020-04-04 20:30:09 +08:00
|
|
|
|
* Copyright (c) 2016 The ZLMediaKit project authors. All Rights Reserved.
|
2017-09-27 16:20:30 +08:00
|
|
|
|
*
|
2021-01-17 18:31:50 +08:00
|
|
|
|
* This file is part of ZLMediaKit(https://github.com/xia-chu/ZLMediaKit).
|
2017-09-27 16:20:30 +08:00
|
|
|
|
*
|
2020-04-04 20:30:09 +08:00
|
|
|
|
* Use of this source code is governed by MIT license that can be found in the
|
|
|
|
|
* LICENSE file in the root of the source tree. All contributing project authors
|
|
|
|
|
* may be found in the AUTHORS file in the root of the source tree.
|
2017-04-01 16:35:56 +08:00
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
#include <string.h>
|
2017-04-25 11:35:41 +08:00
|
|
|
|
#include "strCoding.h"
|
2017-04-01 16:35:56 +08:00
|
|
|
|
|
2017-10-10 00:04:07 +08:00
|
|
|
|
#if defined(_WIN32)
|
|
|
|
|
#include <windows.h>
|
|
|
|
|
#endif//defined(_WIN32)
|
|
|
|
|
|
2018-10-24 17:17:55 +08:00
|
|
|
|
namespace mediakit {
|
2017-04-01 16:35:56 +08:00
|
|
|
|
|
2017-10-10 00:04:07 +08:00
|
|
|
|
//////////////////////////通用///////////////////////
|
2017-10-10 00:11:58 +08:00
|
|
|
|
/**
 * Decode one three-byte UTF-8 sequence into a single 16-bit code unit.
 *
 * Only the 1110xxxx 10xxxxxx 10xxxxxx form is handled. The marker bits of
 * each byte are masked off without being validated, so the caller must
 * make sure pText really points at a three-byte sequence.
 *
 * @param pOut  Receives the decoded value; the whole wchar_t is assigned.
 * @param pText Points at the first of three readable UTF-8 bytes.
 */
void UTF8ToUnicode(wchar_t* pOut, const char *pText)
{
    const unsigned int lead = static_cast<unsigned char>(pText[0]) & 0x0Fu;
    const unsigned int middle = static_cast<unsigned char>(pText[1]) & 0x3Fu;
    const unsigned int tail = static_cast<unsigned char>(pText[2]) & 0x3Fu;

    // Assign by value instead of poking two bytes through a char alias:
    // that left the upper bytes of a 4-byte wchar_t uninitialized and
    // produced a byte-swapped result on big-endian hosts.
    *pOut = static_cast<wchar_t>((lead << 12) | (middle << 6) | tail);
}
|
2017-10-10 00:11:58 +08:00
|
|
|
|
/**
 * Encode the low 16 bits of one wide character as a three-byte UTF-8
 * sequence (1110xxxx 10xxxxxx 10xxxxxx).
 *
 * Exactly three bytes are always written, even for values below 0x800;
 * no terminating NUL is appended.
 *
 * @param pOut  Destination buffer with room for at least three bytes.
 * @param pText Points at the wide character to encode.
 */
void UnicodeToUTF8(char* pOut, const wchar_t* pText)
{
    // Work on the numeric value rather than on the in-memory bytes of the
    // wchar_t, so the result does not depend on host byte order.
    const unsigned int unit = static_cast<unsigned int>(*pText) & 0xFFFFu;

    pOut[0] = static_cast<char>(0xE0u | (unit >> 12));
    pOut[1] = static_cast<char>(0x80u | ((unit >> 6) & 0x3Fu));
    pOut[2] = static_cast<char>(0x80u | (unit & 0x3Fu));
}
|
|
|
|
|
|
|
|
|
|
/**
 * Convert a single hexadecimal digit character to its numeric value.
 *
 * @param ch One of '0'-'9', 'a'-'f' or 'A'-'F'.
 * @return The digit value 0..15, or -1 when ch is not a hex digit.
 */
char CharToInt(char ch)
{
    char value = -1;
    if ('0' <= ch && ch <= '9') {
        value = (char)(ch - '0');
    } else if ('a' <= ch && ch <= 'f') {
        value = (char)(ch - 'a' + 10);
    } else if ('A' <= ch && ch <= 'F') {
        value = (char)(ch - 'A' + 10);
    }
    return value;
}
|
2017-10-10 00:04:07 +08:00
|
|
|
|
char StrToBin(const char *str)
|
|
|
|
|
{
|
2020-03-20 11:51:24 +08:00
|
|
|
|
char tempWord[2];
|
|
|
|
|
char chn;
|
|
|
|
|
tempWord[0] = CharToInt(str[0]); //make the B to 11 -- 00001011
|
|
|
|
|
tempWord[1] = CharToInt(str[1]); //make the 0 to 0 -- 00000000
|
|
|
|
|
chn = (tempWord[0] << 4) | tempWord[1]; //to change the BO to 10110000
|
|
|
|
|
return chn;
|
2017-04-01 16:35:56 +08:00
|
|
|
|
}
|
2017-10-10 00:04:07 +08:00
|
|
|
|
|
2019-05-27 12:13:27 +08:00
|
|
|
|
/**
 * Percent-encode a string.
 *
 * Bytes for which isalnum() is true are copied unchanged; every other
 * byte is written as '%' followed by two uppercase hexadecimal digits.
 *
 * @param str Raw input bytes.
 * @return The encoded string.
 */
string strCoding::UrlEncode(const string &str) {
    static const char kHexDigits[] = "0123456789ABCDEF";

    string encoded;
    for (const char raw : str) {
        const uint8_t byte = (uint8_t)raw;
        if (isalnum(byte)) {
            encoded.push_back(raw);
            continue;
        }
        encoded.push_back('%');
        encoded.push_back(kHexDigits[byte >> 4]);
        encoded.push_back(kHexDigits[byte & 0x0F]);
    }
    return encoded;
}
|
2019-05-27 12:13:27 +08:00
|
|
|
|
/**
 * Decode a percent-encoded string.
 *
 * "%XY" becomes the byte with hexadecimal value XY, '+' becomes a space,
 * and every other character is copied unchanged. The two characters after
 * '%' are passed to StrToBin without being checked for valid hex digits.
 *
 * Decoding stops at a '%' that is not followed by at least two more
 * characters; that '%' and anything after it are dropped.
 *
 * @param str Encoded input.
 * @return The decoded bytes.
 */
string strCoding::UrlDecode(const string &str) {
    string output;
    const size_t len = str.length();
    output.reserve(len);

    size_t i = 0;
    while (i < len) {
        const char ch = str[i];
        if (ch == '%') {
            // Compare the remaining length rather than "i > len - 3":
            // the subtraction wraps around for inputs shorter than three
            // characters, which disabled the guard and let the reads
            // below run past the end of the string.
            if (len - i < 3) {
                break;
            }
            const char hex[2] = { str[i + 1], str[i + 2] };
            output += StrToBin(hex);
            i += 3;
        } else if (ch == '+') {
            output += ' ';
            ++i;
        } else {
            output += ch;
            ++i;
        }
    }
    return output;
}
|
|
|
|
|
|
2017-10-10 00:04:07 +08:00
|
|
|
|
|
|
|
|
|
///////////////////////////////windows专用///////////////////////////////////
|
|
|
|
|
#if defined(_WIN32)
|
|
|
|
|
void UnicodeToGB2312(char* pOut, wchar_t uData)
|
|
|
|
|
{
|
2020-03-20 11:51:24 +08:00
|
|
|
|
WideCharToMultiByte(CP_ACP, NULL, &uData, 1, pOut, sizeof(wchar_t), NULL, NULL);
|
2017-10-10 00:04:07 +08:00
|
|
|
|
}
|
|
|
|
|
void Gb2312ToUnicode(wchar_t* pOut, const char *gbBuffer)
|
|
|
|
|
{
|
2020-03-20 11:51:24 +08:00
|
|
|
|
MultiByteToWideChar(CP_ACP, MB_PRECOMPOSED, gbBuffer, 2, pOut, 1);
|
2017-10-10 00:04:07 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
 * Convert a UTF-8 string to the system ANSI code page.
 *
 * Bytes below 0x80 are copied unchanged. Every other byte is treated as
 * the start of a three-byte UTF-8 sequence, which is decoded with
 * UTF8ToUnicode and converted with UnicodeToGB2312. Two-byte and
 * four-byte UTF-8 sequences are not recognised.
 *
 * An incomplete sequence at the end of the input is dropped instead of
 * being read past the end of the string.
 *
 * @param str UTF-8 encoded input.
 * @return The converted bytes.
 */
string strCoding::UTF8ToGB2312(const string &str) {
    const size_t len = str.size();
    const char *pText = str.data();

    // Build the result in a std::string: no manual buffer to overrun or
    // leak, and the output is no longer cut off at the first NUL byte.
    string ret;
    ret.reserve(len);

    size_t i = 0;
    while (i < len) {
        if (static_cast<unsigned char>(pText[i]) < 0x80) {
            ret.push_back(pText[i++]);
            continue;
        }
        if (len - i < 3) {
            // Truncated multi-byte sequence; nothing safe left to decode.
            break;
        }

        wchar_t wide = 0;
        UTF8ToUnicode(&wide, pText + i);

        // Cleared on every pass so a conversion that yields fewer than two
        // bytes cannot leak a byte left over from the previous character.
        char narrow[4] = {0};
        UnicodeToGB2312(narrow, wide);
        for (int k = 0; k < 2 && narrow[k] != '\0'; ++k) {
            ret.push_back(narrow[k]);
        }
        i += 3;
    }
    return ret;
}
|
|
|
|
|
|
|
|
|
|
/**
 * Convert a string in the system ANSI code page to UTF-8.
 *
 * Bytes below 0x80 are copied unchanged. Every other byte is treated as
 * the first byte of a double-byte character, which is converted with
 * Gb2312ToUnicode and then written as three UTF-8 bytes by UnicodeToUTF8.
 *
 * A lone lead byte at the end of the input is dropped instead of being
 * paired with whatever follows the string in memory.
 *
 * @param str Input in the ANSI code page.
 * @return The UTF-8 encoded bytes.
 */
string strCoding::GB2312ToUTF8(const string &str) {
    const size_t len = str.size();
    const char *pText = str.data();

    // Build the result in a std::string. The previous len * 3 byte buffer
    // had no room for a terminator: empty input read from a zero-length
    // allocation, and a lone lead byte left the buffer unterminated.
    string ret;
    ret.reserve(len + len / 2);

    size_t i = 0;
    while (i < len) {
        // Plain ASCII is copied straight through.
        if (static_cast<unsigned char>(pText[i]) < 0x80) {
            ret.push_back(pText[i++]);
            continue;
        }
        if (len - i < 2) {
            // Lead byte without its trail byte.
            break;
        }

        // Pre-set to U+FFFD so a failed conversion encodes the replacement
        // character rather than an uninitialized value.
        wchar_t wide = 0xFFFD;
        Gb2312ToUnicode(&wide, pText + i);

        char utf8[4] = {0};
        UnicodeToUTF8(utf8, &wide);
        ret.append(utf8, 3);
        i += 2;
    }
    return ret;
}
|
|
|
|
|
#endif//defined(_WIN32)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2018-10-24 17:17:55 +08:00
|
|
|
|
} /* namespace mediakit */
|