This sample connects to the running instances of IE on your computer and prints out the URL, Cookie- if any, and the HTML content of the site. It can be extended to connect to running instances on another computer using DCOM and particularly using CoCreateInstanceEx(): Extend it as you wish and let me know how useful it has been to you!
| 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 | """
This sample connects to the running instances of IE on your computer and prints out
the URL, Cookie- if any, and the HTML content of the site.
You need to generate stub files for IE and MSHTML using the readtlb tool of ctypes.
python ctypes\com\tools\readtlb.py c:\winnt\system32\MSHTML.TLB > mshtml.py
python ctypes\com\tools\readtlb.py C:\windows\system32\SHDOCVW.DLL > ie6.py
Known Issues:
Filters out Explorer sinces we don't expect it to have HTML content or cookies. Explorer and IExplore are part of the Shell and therefore IShellWindows.
The mshmtl.py file must be fixed manually by inserting this at the top, otherwise you get NameErrors:
 
 LONG_PTR = c_long
 UINT_PTR = c_uint 
 wireHGLOBAL = wireHWND = wireHDC = wireHBITMAP = c_int 
 SAFEARRAY = POINTER # I"m quite sure this is wrong
usage:
python IEconnect.py
You need the good ctypes module from http://starship.python.net/crew/theller/ctypes/
Sample based on information from 
http://support.microsoft.com/default.aspx?scid=http://support.microsoft.com:80/support/kb/articles/Q176/7/92.ASP&NoWebContent=1
By Eric Koome
email ekoome@yahoo.com
"""
from ctypes import *
from ctypes.com import GUID, HRESULT, IUnknown, CreateInstance
from ctypes.com.automation import IDispatch, VARIANT, BSTR, oleaut32
from ctypes.wintypes import DWORD
from win32con import NULL
from ie6 import ShellWindows, IShellWindows, InternetExplorer, IWebBrowser2 #generated from SHDOCVW.DLL
from mshtml import IHTMLDocument2, IHTMLElement # generated using MSHTML.TLB
            
def IsInternetExplorer(name):
    import re
    from types import NoneType
    if type(re.search(r'iexplore.exe$',name)) != NoneType:
        return True
    else:
        return False
    
# Lets create an instance of ShellWindows Interface
pItf = CreateInstance(ShellWindows)
windows = pItf
#Get num of IE window by using IShellwindows
nCount = c_long()
hret = windows._get_Count(byref(nCount))
#print "nCount", nCount
for i in range(nCount.value):
        
    #Get IDispatch interfaces from IshellWindows
    disp = POINTER(IDispatch)()
    va = VARIANT(i)
    from ctypes.com.automation import VT_I4
    # apparently IE doesn't like VT_INT (which automation uses),
    # it has to be VT_I4
    oleaut32.VariantChangeType(byref(va), byref(va), 0, VT_I4)
    hret = windows.Item(va, byref(disp))
    oleaut32.VariantClear(byref(va))
    #print "disp",disp
    #Get IwebBrowser2 Interfaces from IDispatch
    browser = POINTER(IWebBrowser2)()
    if disp != NULL:
            hret = disp.QueryInterface(byref(IWebBrowser2._iid_),
                                       byref(browser))
            #print "browser", browser
            
    #Get the full path of the EXE (IE or explorer)
    if browser != None:
        Name = BSTR()
        hret = browser._get_FullName(byref(Name))
        
        #Lets Check whether we are dealing with IE 
        if IsInternetExplorer(Name.value):
            #Get browsing URL string
            url= BSTR()
            hret = browser._get_LocationURL(byref(url))
            print "url", url.value
            #Get IHTMLDocument2 from IWebBrowser2
            htmlDisp = POINTER(IDispatch)()
            hret = browser._get_Document(byref(htmlDisp))
            #print "htmlDisp", htmlDisp
            doc = POINTER(IHTMLDocument2)()
            if htmlDisp != NULL:
                try:
                    hret = htmlDisp.QueryInterface(byref(IHTMLDocument2._iid_), byref(doc))
                    #print "doc", doc
                except:
                    pass
            #Call get_cookie method of IHTMLDocument2
            if doc != NULL:
                cookie = BSTR()
                try:
                    hret = doc._get_cookie(byref(cookie))
                    print "cookie", cookie
                except:
                    pass
                
                #Get IHTMLElement from IHTMLDocument2
                element = POINTER(IHTMLElement)()
                hret = doc._get_body(byref(element))
                #print "element", element
                
                #Call get_outerHTML of IHTMLElement
                if element != NULL:
                    html = BSTR()
                    try:
                        hret = element._get_outerHTML(byref(html))
                        print "html",html
                    except:
                        pass
        
    
    
 | 
    Tags: web
  
  
      
 Download
Download Copy to clipboard
Copy to clipboard
