随笔 - 491  文章 - 0  评论 - 97  阅读 - 239万

使用CInternetSession和CHttpFile提取网页源码

程序界面:

为编辑框添加一个对应的变量:m_sUrl,再为Button1添加点击事件,主要代码如下:

void CGetHtmlCodeDlg::OnButton1()
{
    CString sHtml;
 
    UpdateData();
    GetHtmlCode(m_sUrl, sHtml);
    WritetoFile(sHtml);
    MessageBox("提取网页源码完成");
}
 
void CGetHtmlCodeDlg::GetHtmlCode(const CString url, CString &html)
{
    CInternetSession session;
    CHttpFile * file = NULL;
     
    try
    {
        file = (CHttpFile *)session.OpenURL(url);
        if(file)
        {
            CString line;
            while(file->ReadString(line) != NULL)
            {
                html += line + "\n";
            }
            file->Close();
        }
    }
    catch (CInternetException* e)
    {
        e->Delete();
        html = "CInternet Exception";
    }
    file = NULL;
    session.Close();
}
 
/**
 * Appends `sValue` to the file "1.html" located in the directory returned
 * by GetExePath().
 *
 * @param sValue  Text to append to the file.
 * @return TRUE if the text was written, FALSE if the file could not be
 *         opened or a CFileException occurred while writing.
 */
BOOL CGetHtmlCodeDlg::WritetoFile(const CString& sValue)
{
    CString sFile = GetExePath() + "\\1.html";

    CStdioFile file;
    // modeCreate together with modeNoTruncate: create the file when it is
    // missing, but keep the existing content when it is already there.
    if (!file.Open(sFile, CFile::modeCreate | CFile::modeWrite | CFile::modeNoTruncate))
        return FALSE;

    BOOL bWritten = FALSE;
    try
    {
        file.SeekToEnd();               // move the file pointer to the end (append)
        file.WriteString(sValue);
        file.Close();
        bWritten = TRUE;
    }
    catch (CFileException* e)
    {
        e->Delete();
        // Close the file without raising a second exception.
        file.Abort();
    }
    return bWritten;
}
 
/**
 * Returns the directory part of the running module's file name.
 *
 * @return The module path up to, but not including, the last backslash.
 *         An empty string is returned when the module file name cannot be
 *         obtained or when it contains no backslash.
 */
CString CGetHtmlCodeDlg::GetExePath()
{
    // One spare, zero-initialized element keeps the buffer terminated even
    // if the API fills all MAX_PATH characters it is allowed to write.
    TCHAR szFileName[MAX_PATH + 1] = {0};

    // A return value of 0 means the call failed.
    if (::GetModuleFileName(AfxGetInstanceHandle(), szFileName, MAX_PATH) == 0)
        return CString();

    CString sPath(szFileName);
    int pos = sPath.ReverseFind(_T('\\'));
    if (pos == -1)
        return CString();

    return sPath.Left(pos);
}
posted on   清清飞扬  阅读(6076)  评论(0)  编辑  收藏  举报
< 2011年1月 >
26 27 28 29 30 31 1
2 3 4 5 6 7 8
9 10 11 12 13 14 15
16 17 18 19 20 21 22
23 24 25 26 27 28 29
30 31 1 2 3 4 5

点击右上角即可分享
微信分享提示