# To get the HTML of the whole page:
from selenium import webdriver

# Start a Firefox session and load the page whose markup we want to read.
driver = webdriver.Firefox()
driver.get("http://stackoverflow.com")
html = driver.page_source

# To get the outer HTML (including the element's own tag):
# Locator strategy constants for find_element().
from selenium.webdriver.common.by import By

# HTML from `<html>`
html = driver.execute_script("return document.documentElement.outerHTML;")

# HTML from `<body>`
html = driver.execute_script("return document.body.outerHTML;")

# HTML from element with some JavaScript
# (find_element(By.CSS_SELECTOR, ...) replaces find_element_by_css_selector,
# which was removed in Selenium 4.3.)
element = driver.find_element(By.CSS_SELECTOR, "#hireme")
html = driver.execute_script("return arguments[0].outerHTML;", element)

# HTML from element with `get_attribute`
element = driver.find_element(By.CSS_SELECTOR, "#hireme")
html = element.get_attribute('outerHTML')

# To get the inner HTML (excluding the element's own tag):
# Locator strategy constants for find_element().
from selenium.webdriver.common.by import By

# HTML from `<html>`
html = driver.execute_script("return document.documentElement.innerHTML;")

# HTML from `<body>`
html = driver.execute_script("return document.body.innerHTML;")

# HTML from element with some JavaScript
# (find_element(By.CSS_SELECTOR, ...) replaces find_element_by_css_selector,
# which was removed in Selenium 4.3.)
element = driver.find_element(By.CSS_SELECTOR, "#hireme")
html = driver.execute_script("return arguments[0].innerHTML;", element)

# HTML from element with `get_attribute`
element = driver.find_element(By.CSS_SELECTOR, "#hireme")
html = element.get_attribute('innerHTML')


