URL encode 与 URL decode 的C语言实现

时间:2023-03-10 01:22:57
URL encode 与 URL decode 的C语言实现

转载自:http://blog.****.net/langeldep/article/details/6264058

本文代码为从PHP代码中修改而来,只保留了2个函数。

int php_url_decode(char *str, int len);
char *php_url_encode(char const *s, int len, int *new_length);

URL编码做了如下操作:

字符"a"-"z","A"-"Z","0"-"9",".","-","*",和"_" 都不被编码,维持原值;

空格" "被转换为加号"+"。

其他每个字节都被表示成"%xy"格式的由3个字符组成的字符串,编码为UTF-8。

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <sys/types.h> static unsigned char hexchars[] = "0123456789ABCDEF";
/**
* 16进制数转换成10进制数
* 如:0xE4=14*16+4=228
*/
static int php_htoi(char *s)
{
int value;
int c; c = ((unsigned char *)s)[];
if (isupper(c))
c = tolower(c);
value = (c >= '' && c <= '' ? c - '' : c - 'a' + ) * ; c = ((unsigned char *)s)[];
if (isupper(c))
c = tolower(c);
value += c >= '' && c <= '' ? c - '' : c - 'a' + ; return (value);
} char *php_url_encode(char const *s, int len, int *new_length)
{
register unsigned char c;
unsigned char *to, *start;
unsigned char const *from, *end; from = (unsigned char *)s;
end = (unsigned char *)s + len;
start = to = (unsigned char *) calloc(, *len+); while (from < end)
{
c = *from++; if (c == ' ')
{
*to++ = '+';
}
else if ((c < '' && c != '-' && c != '.') ||
(c < 'A' && c > '') ||
(c > 'Z' && c < 'a' && c != '_') ||
(c > 'z'))
{
to[] = '%';
to[] = hexchars[c >> ];//将2进制转换成16进制表示
to[] = hexchars[c & ];//将2进制转换成16进制表示
to += ;
}
else
{
*to++ = c;
}
}
*to = ;
if (new_length)
{
*new_length = to - start;
}
return (char *) start;
} int php_url_decode(char *str, int len)
{
char *dest = str;
char *data = str; while (len--)
{
if (*data == '+')
{
*dest = ' ';
}
else if (*data == '%' && len >= && isxdigit((int) *(data + )) && isxdigit((int) *(data + )))
{
*dest = (char) php_htoi(data + );
data += ;
len -= ;
}
else
{
*dest = *data;
}
data++;
dest++;
}
*dest = '\0';
return dest - str;
} int main(int argc, char ** argv)
{
char *str = "你好,世界!",*new_str;
int len = ,new_len = ,old_len = ;
len = strlen(str);
new_str = php_url_encode(str,len,&new_len);
printf("new string : %s,new length : %d\n",new_str,new_len);
old_len = php_url_decode(new_str,new_len);
printf("old string : %s,old length : %d\n",new_str,old_len);
return ;
}

ps:查了好多资料才弄明白urldecode的原理,原来如此简单,呵呵

相关文章