关于获取http的gzip内容并解压
2016-10-06 00:40
471 查看
网上很多代码,都是以下的代码。我自己用SOCKET实现的时候(调用ZLIB库),发现都是可以的。
int inflate_read(char *source,int len,char **dest,int gzip)
{
int ret;
unsigned have;
z_stream strm;
unsigned char out[CHUNK];
int totalsize = 0;
/* allocate inflate state */
strm.zalloc = Z_NULL;
strm.zfree = Z_NULL;
strm.opaque = Z_NULL;
strm.avail_in = 0;
strm.next_in = Z_NULL;
if (gzip)
ret = inflateInit2(&strm, 47);
else
ret = inflateInit(&strm);
if (ret != Z_OK)
return ret;
strm.avail_in = len;
strm.next_in = source;
/* run inflate() on input until output buffer not full */
do {
strm.avail_out = CHUNK;
strm.next_out = out;
ret = inflate(&strm, Z_NO_FLUSH);
assert(ret != Z_STREAM_ERROR); /* state not clobbered */
switch (ret) {
case Z_NEED_DICT:
ret = Z_DATA_ERROR; /* and fall through */
case Z_DATA_ERROR:
case Z_MEM_ERROR:
inflateEnd(&strm);
return ret;
}
have = CHUNK - strm.avail_out;
totalsize += have;
*dest = realloc(*dest,totalsize);
memcpy(*dest + totalsize - have,out,have);
} while (strm.avail_out == 0);
/* clean up and return */
(void)inflateEnd(&strm);
return ret == Z_STREAM_END ? Z_OK : Z_DATA_ERROR;
}
而昨天用在WININET的返回数据里面的时候,发现不行。于是去搜索资料,参考了一些资料之后,发现WININET添加了gzip的头部,于是自己参考了 https://github.com/wkoszek/mini_gzip
写了一个函数。并且,miniz.c的代码里面和zlib的略不同,需要把上面一个函数的47修改成 -MZ_DEFAULT_WINDOW_BITS。
int mini_gz_get_data_offset(const unsigned char *buffer, int bufferlength)
{
int offset;
int result = 0;
if (10 < bufferlength)
{
buffer + 0; // .gz header
if (buffer[0] == 0x1F && buffer[1] == 0x8B && buffer[2] == 0x08)
{
// auxillary header
offset = 10;
if (buffer[3] & 0x4)
{
//fextra_len = buffer[offset + 1] << 8 | buffer[offset + 0];
offset += 2;
//fextra_ptr = &buffer[offset];
}
if (buffer[3] & 0x8)
{
//fname_ptr = &buffer[offset];
while (buffer[offset++] != '\0')
{
;
}
}
if (buffer[3] & 0x10)
{
//fcomment_ptr = &buffer[offset];
while (buffer[offset++] != '\0')
{
;
}
}
if (buffer[3] & 0x2)
{
//fcrc = *(unsigned short *)&buffer[offset];
offset += 2;
}
result = offset;
}
}
return (result);
}
希望后来的人可以少走弯路。
int inflate_read(char *source,int len,char **dest,int gzip)
{
int ret;
unsigned have;
z_stream strm;
unsigned char out[CHUNK];
int totalsize = 0;
/* allocate inflate state */
strm.zalloc = Z_NULL;
strm.zfree = Z_NULL;
strm.opaque = Z_NULL;
strm.avail_in = 0;
strm.next_in = Z_NULL;
if (gzip)
ret = inflateInit2(&strm, 47);
else
ret = inflateInit(&strm);
if (ret != Z_OK)
return ret;
strm.avail_in = len;
strm.next_in = source;
/* run inflate() on input until output buffer not full */
do {
strm.avail_out = CHUNK;
strm.next_out = out;
ret = inflate(&strm, Z_NO_FLUSH);
assert(ret != Z_STREAM_ERROR); /* state not clobbered */
switch (ret) {
case Z_NEED_DICT:
ret = Z_DATA_ERROR; /* and fall through */
case Z_DATA_ERROR:
case Z_MEM_ERROR:
inflateEnd(&strm);
return ret;
}
have = CHUNK - strm.avail_out;
totalsize += have;
*dest = realloc(*dest,totalsize);
memcpy(*dest + totalsize - have,out,have);
} while (strm.avail_out == 0);
/* clean up and return */
(void)inflateEnd(&strm);
return ret == Z_STREAM_END ? Z_OK : Z_DATA_ERROR;
}
而昨天用在WININET的返回数据里面的时候,发现不行。于是去搜索资料,参考了一些资料之后,发现WININET添加了gzip的头部,于是自己参考了 https://github.com/wkoszek/mini_gzip
写了一个函数。并且,miniz.c的代码里面和zlib的略不同,需要把上面一个函数的47修改成 -MZ_DEFAULT_WINDOW_BITS。
int mini_gz_get_data_offset(const unsigned char *buffer, int bufferlength)
{
int offset;
int result = 0;
if (10 < bufferlength)
{
buffer + 0; // .gz header
if (buffer[0] == 0x1F && buffer[1] == 0x8B && buffer[2] == 0x08)
{
// auxillary header
offset = 10;
if (buffer[3] & 0x4)
{
//fextra_len = buffer[offset + 1] << 8 | buffer[offset + 0];
offset += 2;
//fextra_ptr = &buffer[offset];
}
if (buffer[3] & 0x8)
{
//fname_ptr = &buffer[offset];
while (buffer[offset++] != '\0')
{
;
}
}
if (buffer[3] & 0x10)
{
//fcomment_ptr = &buffer[offset];
while (buffer[offset++] != '\0')
{
;
}
}
if (buffer[3] & 0x2)
{
//fcrc = *(unsigned short *)&buffer[offset];
offset += 2;
}
result = offset;
}
}
return (result);
}
希望后来的人可以少走弯路。
相关文章推荐
- 获取http的gzip内容并解压相关问题
- 获取http的gzip内容并解压
- 获取http的gzip内容并解压相关问题
- 获取http的gzip内容并解压相关问题(续)
- http client对post内容gzip压缩和server端解压接收
- 关于http的gzip解压
- VBS获取GZIP压缩的HTTP内容的实现代码
- 利用HttpWebRequest获取网页内容,由于Gzip压缩导致乱码的情况
- 【HTTP】WireShark中获取Content-Encoding: gzip时的响应内容
- 关于XMLHTTP无刷新数据获取和发送(转相关内容)
- http中关于gzip的解压_初级调试
- 关于HTTP GZIP解压问题
- 利用HTTP指令直接获取WEB服务器内容
- 通过HttpClient获取响应内容字符集
- 关于chunked gzip,socket下载网页内容.
- http获取网页内容类
- vc 获取网页内容(HTTP)
- Java基础:利用HttpClient获取网页内容
- 解压HTTP gzip的
- 利用HttpClient获取网页内容