html - WindowsMobile6.0でのWebページドキュメントの取得

Question

インターネットでいろいろ検索した結果、Webブラウザコントロールにロードされた Web ページの body 部分だけを取得する、次のコードを見つけました。

// Reads the innerHTML of the <body> element of the page currently loaded in
// the web browser control, using late-bound IDispatch calls on the document.
//
// On success pHTMLDocument and pBodyElement each hold a COM reference obtained
// through QueryInterface; call Release() on them once they are no longer needed.
IPIEHTMLDocument2 *pHTMLDocument = NULL;

IPIEHTMLElement* pBodyElement = NULL;

CComPtr<IDispatch> spDispDoc;

HRESULT res = m_spWebBrowser2->get_Document(&spDispDoc);

// A success code does not guarantee a document object, so test the pointer too.
if(SUCCEEDED(res) && NULL != spDispDoc.p)
{
    res = spDispDoc->QueryInterface( __uuidof(IPIEHTMLDocument2), (void**)&pHTMLDocument);
}

if(SUCCEEDED(res) && NULL != pHTMLDocument)
{
    // GetIDsOfNames takes an array of writable OLECHAR*; one name is looked up.
    WCHAR szText[] = L"body";
    OLECHAR FAR* szTemp = szText;
    DISPID id = DISPID_UNKNOWN;

    // Resolve the DISPID of the "body" property.
    res = pHTMLDocument->GetIDsOfNames(IID_NULL, &szTemp, 1, LOCALE_USER_DEFAULT, &id);

    // Only invoke when the name was resolved; otherwise id is meaningless.
    if(SUCCEEDED(res))
    {
        VARIANT varResult;
        VariantInit(&varResult);
        DISPPARAMS dispparamsNoArgs = {NULL, NULL, 0, 0};

        res = pHTMLDocument->Invoke(id, IID_NULL, LOCALE_USER_DEFAULT, DISPATCH_PROPERTYGET, &dispparamsNoArgs, &varResult, NULL, NULL);

        // Trust pdispVal only if the call succeeded and really returned an object.
        if(SUCCEEDED(res) && VT_DISPATCH == varResult.vt && NULL != varResult.pdispVal)
        {
            res = varResult.pdispVal->QueryInterface(IID_IPIEHTMLElement, (void**)&pBodyElement);

            if(SUCCEEDED(res) && NULL != pBodyElement)
            {
                BSTR bodyValue = NULL;

                if(SUCCEEDED(pBodyElement->get_innerHTML(&bodyValue)))
                {
                    // bodyValue now holds the markup inside <body>; consume it here.
                }

                // The callee allocated the BSTR; the caller must free it.
                SysFreeString(bodyValue);
            }
        }

        // Releases the IDispatch reference returned by Invoke (if any).
        VariantClear(&varResult);
    }
}

しかし、ロードされた Web ページから head など残りのタグを含むドキュメントテキストを取得しようとして、GetIDsOfNames() メソッドに「head」文字列を渡すと失敗値が返ってしまい、うまくいきません。Windows Mobile 6.0 で Web ページのコンテンツ全体にアクセス／抽出する方法を教えてください。

ありがとう、ラマナンドバート。

score 0 · Accepted Answer

void  CBrowserWindow::ExtractWebPageDoc()

{
HRESULT                         hrResult           = E_FAIL;    
IDispatch                      *pIDisp             = NULL;
IPIEHTMLDocument3              *pIHTMLDocument     = NULL;
IPIEHTMLElementCollection      *pHTMLElementcol    = NULL;
IPIEHTMLImgElement             *pHTMLImgElement    = NULL; 


hrResult = m_spIWebBrowser2->get_Document( &pIDisp);
if (NULL != pIDisp)
{
    hrResult = pIDisp->QueryInterface( __uuidof(IPIEHTMLDocument3), (void**)&pIHTMLDocument);
    if( NULL != pIHTMLDocument)
    {
        IPIEHTMLElement* pElement = NULL;
        CComBSTR pHTMLElement;

        hrResult = pIHTMLDocument->get_documentElement( &pElement);
        if (SUCCEEDED(hrResult)) 
        {                               
            pElement->get_innerHTML(&pHTMLElement.m_str);
            SaveToHTMLFile( pHTMLElement);
        }

        hrResult = pIHTMLDocument->get_images( &pHTMLElementcol);
        if (NULL != pHTMLElementcol)
        {
            CComBSTR  strImage;
            VARIANT vtBase, vtIndex;
            long pHTMLElementCollectionLength = 0;

            VariantInit( &vtBase);
            vtIndex.vt = VT_UINT;

            hrResult = pHTMLElementcol->get_length( &pHTMLElementCollectionLength);
            for (int ilen = 0; ilen < (int)pHTMLElementCollectionLength ; ilen++)
            {           
                vtIndex.lVal = ilen;

                pIDisp = NULL;
                hrResult =  pHTMLElementcol->item( vtBase, vtIndex , &pIDisp);
                if (NULL != pIDisp)
                {
                    hrResult = pIDisp->QueryInterface( __uuidof(IPIEHTMLImgElement), (void**)&pHTMLImgElement);

                    if (NULL != pHTMLImgElement)
                    //CComQIPtr<IPIEHTMLImgElement> imgElement( pIDisp);
                    //imgElement->get_src( &strImage.m_str);    //I get it here :)
                    pHTMLImgElement->get_src( &strImage.m_str);
                }
            }
        }
    }
}

}

上記のコードは、Windows モバイルデバイスで Web ページコンテンツ全体を取得します。

html - WindowsMobile6.0でのWebページドキュメントの取得

回答 1 件

Related

Reference

html - WindowsMobile6.0でのWebページドキュメントの取得