【发布时间】:2017-11-27 14:25:48
【问题描述】:
我正在尝试压缩和解压缩一些信息。
对于压缩,我使用了code project,它似乎可以工作。我现在正在压缩字符串。
为了解压,我想压缩一个Stream
这是我目前拥有的
var zipString = _compressor.Compress(request);
using (var sw = new StreamWriter(req.GetRequestStream()))
{
sw.Write(zipString);
sw.Close();
}
WebResponse respStream = req.GetResponse();
Stream resp = respStream.GetResponseStream();
resp = _compressor.UnCompress(resp);
这是压缩的代码
public string Compress(string s)
{
//Transforming string into byte
var byteArray = new byte[s.Length];
var indexBa = 0;
foreach (var item in s.ToCharArray())
{
byteArray[indexBa++] = (byte) item;
}
//prepare for compress
var ms = new MemoryStream();
var sw = new GZipStream(ms, CompressionMode.Compress);
//compress
sw.Write(byteArray,0,byteArray.Length);
//close sw, DO NOT FLUSH because byes will go missing...
sw.Close();
//transform byte[] zip data to string
byteArray = ms.ToArray();
var sb = new StringBuilder(byteArray.Length);
foreach (var item in byteArray)
{
sb.Append((char) item);
}
ms.Close();
sw.Dispose();
ms.Dispose();
return sb.ToString();
}
这是解压
的代码 public Stream UnCompress(Stream s)
{
int readCount;
MemoryStream mem = new MemoryStream();
byte[] tmp = new byte[128];
while ((readCount = s.Read(tmp, 0, 128)) != 0)
{
mem.Write(tmp, 0, readCount);
}
StreamReader reader = new StreamReader(mem);
char[] buffer = new char[mem.Length];
mem.Position = 0;
reader.ReadBlock(buffer, 0, (int)mem.Length);
byte[] zip = Encoding.UTF8.GetBytes(buffer, 0, (int)mem.Length);
Stream wr = new MemoryStream();
wr.Write(zip, 0, zip.Length);
wr.Position = 0;
using (var stream = new GZipStream(wr, CompressionMode.Decompress))
{
mem = new MemoryStream();
while ((readCount = stream.Read(tmp, 0, 128)) != 0)
{
mem.Write(tmp, 0, readCount);
}
mem.Position = 0;
return mem;
}
}
此时我在以下行中解压缩时出错:
while ((readCount = stream.Read(tmp, 0, 128)) != 0)
{
mem.Write(tmp, 0, readCount);
}
它只是不进入while循环并说:
GZip 标头中的幻数不正确。确保您传入的是 GZip 流
我的解压方法是基于stackoverflowpost
尝试2:
public Stream UnCompress(Stream s)
{
byte[] byteArray = null;
using (var m = new MemoryStream())
{
int count;
do
{
byte[] buf = new byte[1024];
count = s.Read(buf, 0, 1024);
m.Write(buf, 0, count);
} while (s.CanRead && count > 0);
byteArray = m.ToArray();
}
var indexBa = 0;
foreach (var item in s.ToString().ToCharArray())
{
byteArray[indexBa++] = (byte) item;
}
//Prepare for decompress
var ms = new MemoryStream(byteArray);
var sr = new GZipStream(ms,
CompressionMode.Decompress);
//Reset variable to collect uncompressed result
byteArray = new byte[byteArray.Length];
//Decompress
var rByte = sr.Read(byteArray, 0, byteArray.Length);
//Transform byte[] unzip data to string
var sB = new MemoryStream(rByte);
for (var i = 0; i < rByte; i++)
{
sB.Write(byteArray,0,rByte);
}
sr.Close();
ms.Close();
sr.Dispose();
ms.Dispose();
return sB;
}
结果:var rByte = sr.Read(byteArray, 0, byteArray.Length); 行中的相同错误
更新 1:
正如代码项目中给出的那样,解压字符串完美地工作。
public static string UnZip(string value)
{
//Transform string into byte[]
byte[] byteArray = new byte[value.Length];
int indexBA = 0;
foreach (char item in value.ToCharArray())
{
byteArray[indexBA++] = (byte)item;
}
//Prepare for decompress
System.IO.MemoryStream ms = new System.IO.MemoryStream(byteArray);
System.IO.Compression.GZipStream sr = new System.IO.Compression.GZipStream(ms,
System.IO.Compression.CompressionMode.Decompress);
//Reset variable to collect uncompressed result
byteArray = new byte[byteArray.Length];
//Decompress
int rByte = sr.Read(byteArray, 0, byteArray.Length);
//Transform byte[] unzip data to string
System.Text.StringBuilder sB = new System.Text.StringBuilder(rByte);
//Read the number of bytes GZipStream red and do not a for each bytes in
//resultByteArray;
for (int i = 0; i < rByte; i++)
{
sB.Append((char)byteArray[i]);
}
sr.Close();
ms.Close();
sr.Dispose();
ms.Dispose();
return sB.ToString();
}
【问题讨论】:
-
除此之外,像这样从任意二进制数据转换为文本是一个非常糟糕的主意。您最终会得到包含各种不可打印字符的文本,这些字符在许多情况下可能无法准确传输。我强烈建议您更改您的
Compress方法以接受并返回一个字节数组,然后您可以调查所涉及的多个转换中的哪一个导致了问题。 -
首先我很幸运你对我的帖子发表了评论。我尝试了几件事,有几次我在某些索引处遇到与十六进制相关的错误。这是否意味着在压缩时会生成一些无法解压缩的字符?
-
根本不要将压缩视为对文本的操作。将其视为对 binary 数据的操作 - 二进制输入,二进制输出。另外,考虑如何将输入字符串转换为二进制(可能是
Encoding.UTF8.GetBytes)以及在绝对必要时如何将输出转换为文本(例如 Convert.ToBase64String)
标签: c# c#-4.0 gzip compression system.io.compression