时间:2016-02-15 22:20 来源: 我爱IT技术网 作者:佚名
欢迎您访问我爱IT技术网,今天小编为你分享的编程技术是:【asp.net HttpWebRequest自动识别网页编码】,下面是详细的讲解!
asp.net HttpWebRequest自动识别网页编码
static string GetEncoding(string url)
{
HttpWebRequest request=null;
HttpWebResponse response=null;
StreamReader reader=null;
try
{
request=(HttpWebRequest)WebRequest.Create(url);
request.Timeout=20000;
request.AllowAutoRedirect=false;
response=(HttpWebResponse)request.GetResponse();
if (response.StatusCode==HttpStatusCode.OK && response.ContentLength < 1024 * 1024)
{
if (response.ContentEncoding !=null && response.ContentEncoding.Equals("gzip", StringComparison.InvariantCultureIgnoreCase))
reader=new StreamReader(new GZipStream(response.GetResponseStream(), CompressionMode.Decompress));
else
reader=new StreamReader(response.GetResponseStream(), Encoding.ASCII);
string html=reader.ReadToEnd();
Regex reg_charset=new Regex(@"charset\b\s*=\s*(?<charset>[^""]*)");
if (reg_charset.IsMatch(html))
{
return reg_charset.Match(html).Groups["charset"].Value;
}
else if (response.CharacterSet !=string.Empty)
{
return response.CharacterSet;
}
else
return Encoding.Default.BodyName;
}
}
catch
{
}
finally
{
if (response !=null)
{
response.Close();
response=null;
}
if (reader !=null)
reader.Close();
if (request !=null)
request=null;
}
return Encoding.Default.BodyName;
}
/// <summary>
/// 获取源代码
/// </summary>
/// <param name="url"></param>
/// <returns></returns>
static string GetHtml(string url, Encoding encoding)
{
HttpWebRequest request=null;
HttpWebResponse response=null;
StreamReader reader=null;
try
{
request=(HttpWebRequest)WebRequest.Create(url);
request.Timeout=20000;
request.AllowAutoRedirect=false;
response=(HttpWebResponse)request.GetResponse();
if (response.StatusCode==HttpStatusCode.OK && response.ContentLength < 1024 * 1024)
{
if (response.ContentEncoding !=null && response.ContentEncoding.Equals("gzip", StringComparison.InvariantCultureIgnoreCase))
reader=new StreamReader(new GZipStream(response.GetResponseStream(), CompressionMode.Decompress), encoding);
else
reader=new StreamReader(response.GetResponseStream(), encoding);
string html=reader.ReadToEnd();
return html;
}
}
catch
{
}
finally
{
if (response !=null)
{
response.Close();
response=null;
}
if (reader !=null)
reader.Close();
if (request !=null)
request=null;
}
return string.Empty;
}
关于asp.net HttpWebRequest自动识别网页编码的用户互动如下:
相关问题:
答: >>详细
相关问题:
答: >>详细
相关问题:
答: >>详细
- 【asp】asp.net url重写浅谈-net-url重写
- 【DataSet】DataSet、DataTable、DataRow区别详解
- 【asp】asp.net 动态添加多个用户控件-net-动态添
- 【创建】ASP.NET Web API教程 创建域模型的方法详
- 【asp】asp.net ubb使用代码-net-ubb使用
- 【默认图片】图片不存在使用默认图片代替的实例
- 【asp】asp.net 页面转向 Response.Redirect Ser
- 【页面打印】关于ASP.NET页面打印技术的常用方法
- 【MVC5】MVC 5 第一章 创建MVC 5 web应用程序-net
- 【MVC】一个简单MVC5 + EF6示例分享-EF6实例-MVC5
- 评论列表(网友评论仅供网友表达个人看法,并不表明本站同意其观点或证实其描述)
-
