本文非本人编写,转载自:http://www.cnblogs.com/youngerliu/archive/2013/05/27/3101488.html

今天遇到用LumiSoft.Net这个组件收取邮件中含有类似于=?utf-8?B?5rWL6K+V6YKu5Lu2?= ,=?gbk?Q?=C6=BD=B0=B2=D6=A4=C8=AF*=C3=BF=D6=DC=B1=A8?=这两种格式的乱码,随后Google了下,原因是邮件本身的编码,跟传输过程采用的编码不一致,=?utf-8?B?5rWL6K+V6YKu5Lu2?= 这个表示邮件编码是utf-8,传输采用base64编码格式,第二个Q表示传输格式为Quote-Printable。
对于这种格式的字符,Google大神帮我搜到了相关的处理代码,然后综合项目,整理出来了,留个记号。

 /// <summary>
/// 乱码解析
/// </summary>
/// <param name="input"></param>
/// <returns></returns>
private string GetMailSubject(string input)
{
try
{
string regex = @"=\?(?<encode>.*?)\?(?<type>[B|Q])\?(?<body>.*?)\?=";
Regex re = new Regex(regex, RegexOptions.IgnoreCase | RegexOptions.IgnorePatternWhitespace | RegexOptions.Multiline);
MatchCollection mcs = re.Matches(input);
foreach (Match mc in mcs)
{
string encode = mc.Groups["encode"].Value;
string type = mc.Groups["type"].Value;
Encoding encod = null;
if (!string.IsNullOrEmpty(encode))
{
if ((encode.ToLower().Contains("gbk") || encode.ToLower().Contains("utf8") || encode.ToLower().Contains("utf-8")) && type == "Q")
{
if (encode.ToLower().Contains("utf-8"))
{
encod = Encoding.UTF8;
}
else if (encode.ToLower().Contains("gbk"))
{
encod = Encoding.GetEncoding("gb2312");
}
input = input.Replace(mc.Value, QuotedPrintable.Decode(mc.Groups["body"].Value, encod));
}
else
{
if (encode.ToLower().Contains("euccn") || encode.ToLower().Contains("euc-cn"))
{
encode = "gb2312";
}
else if (encode.ToLower().Contains("utf8"))
{
encode = "utf-8";
}
string body = mc.Groups["body"].Value;
byte[] bytes = Convert.FromBase64String(body);
string result = Encoding.GetEncoding(encode).GetString(bytes);
input = input.Replace(mc.Value, result);
}
} }
if (mcs.Count > )
{
FileLogHelper.WriteInfo(string.Format("原邮件标题:[{0}]\r\n解析后标题:[{1}]", input, input));
}
return input;
}
catch (Exception)
{
return input;
}
}

针对两种不同类型的字符做了处理,这里调用了一个Quote-Printable编码解码类,代码如下:

 using System;
using System.Collections;
using System.Text;
namespace Wind.MailRobot.BLL
{
public class QuotedPrintable
{
private const byte EQUALS = ;
private const byte CR = ;
private const byte LF = ;
private const byte SPACE = ;
private const byte TAB = ; /// <summary>
/// Encodes a string to QuotedPrintable
/// </summary>
/// <param name="_ToEncode">String to encode</param>
/// <returns>QuotedPrintable encoded string</returns>
public static string Encode(string _ToEncode, Encoding encoding)
{
StringBuilder Encoded = new StringBuilder();
string hex = string.Empty;
byte[] bytes = encoding.GetBytes(_ToEncode);
int count = ; for (int i = ; i < bytes.Length; i++)
{
//these characters must be encoded
if ((bytes[i] < || bytes[i] > || bytes[i] == EQUALS) && bytes[i] != CR && bytes[i] != LF && bytes[i] != SPACE)
{
if (bytes[i].ToString("X").Length < )
{
hex = "" + bytes[i].ToString("X");
Encoded.Append("=" + hex);
}
else
{
hex = bytes[i].ToString("X");
Encoded.Append("=" + hex);
}
}
else
{
//check if index out of range
if ((i + ) < bytes.Length)
{
//if TAB is at the end of the line - encode it!
if ((bytes[i] == TAB && bytes[i + ] == LF) || (bytes[i] == TAB && bytes[i + ] == CR))
{
Encoded.Append("=0" + bytes[i].ToString("X"));
}
//if SPACE is at the end of the line - encode it!
else if ((bytes[i] == SPACE && bytes[i + ] == LF) || (bytes[i] == SPACE && bytes[i + ] == CR))
{
Encoded.Append("=" + bytes[i].ToString("X"));
}
else
{
Encoded.Append(System.Convert.ToChar(bytes[i]));
}
}
else
{
Encoded.Append(System.Convert.ToChar(bytes[i]));
}
}
if (count == )
{
Encoded.Append("=\r\n"); //insert soft-linebreak
count = ;
}
count++;
} return Encoded.ToString();
} /// <summary>
/// Decodes a QuotedPrintable encoded string
/// </summary>
/// <param name="_ToDecode">The encoded string to decode</param>
/// <returns>Decoded string</returns>
public static string Decode(string _ToDecode, Encoding encoding)
{
try
{
//remove soft-linebreaks first
_ToDecode = _ToDecode.Replace("=\r\n", "");
char[] chars = _ToDecode.ToCharArray();
byte[] bytes = new byte[chars.Length];
int bytesCount = ;
for (int i = ; i < chars.Length; i++)
{
// if encoded character found decode it
if (chars[i] == '=')
{
bytes[bytesCount++] = System.Convert.ToByte(int.Parse(chars[i + ].ToString() + chars[i + ].ToString(), System.Globalization.NumberStyles.HexNumber));
i += ;
}
else
{
bytes[bytesCount++] = System.Convert.ToByte(chars[i]);
}
}
return encoding.GetString(bytes, , bytesCount);
}
catch (Exception)
{ return _ToDecode;
}
}
}
}

最新文章

  1. dev_set_draw的fill和margin模式
  2. 在ASP.NET MVC中使用Juqery实现页面局部刷新
  3. 移动端web开发进阶
  4. Flex contextMenu
  5. HTML——选择器
  6. ACCESS的参数化查询
  7. C语言的内存管理
  8. JSP SQL注入
  9. linux中ulimit作用
  10. 第一个c++程序 helloworld
  11. MySQL多实例-精典故障案例
  12. python 操作 mysql基础补充
  13. &#39;unicodeescape&#39; codec can&#39;t decode bytes in position 2-3: truncated \UXXXXXXXX escape
  14. fieldset 使用小案例
  15. Android ORM SQL Top 5
  16. 雷林鹏分享:C# 数组(Array)
  17. python学习笔记011——内置函数filter()
  18. Oracle里的执行计划
  19. BankNote
  20. IntelliJ IDEA使用手册

热门文章

  1. (原创)LAMP教程6-使用SecureCRTPortable工具远程连接centos
  2. The Bookcase
  3. linux常用命令之--目录与文件的操作命令
  4. 修改linux主机名称
  5. MapReducer Counter计数器的使用,Combiner ,Partitioner,Sort,Grop的使用,
  6. Google App Engine Deployment 相关问题
  7. 【Spark学习】Apache Spark for 第三方Hadoop分发版
  8. SqlServer修改数据库文件及日志文件存放位置
  9. MongoVUE 如何导出数据
  10. Android强大的开源库与系统架构工具