from bs4 import BeautifulSoup

# Sample HTML document used as the parsing fixture for the examples below.
# The backslash line continuations inside the triple-quoted literal keep the
# text on a single logical line, so the string's content is exactly the
# original one-line markup (including its leading and trailing space).
html_doc = """ <html><head><title>The Dormouse's story</title></head> <body> \
<p class="title"><b>The Dormouse's story</b></p> \
<p class="story">Once upon a time there were three little sisters; \
and their names were \
<a href="http://example.com/elsie" class="sister" id="link1">Elsie</a>, \
<a href="http://example.com/lacie" class="sister" id="link2">Lacie</a> and \
<a href="http://example.com/tillie" class="sister" id="link3">Tillie</a>; \
and they lived at the bottom of a well.</p> \
<p class="story">...</p> """
# Parse the sample document, asking Beautiful Soup to use the 'lxml' parser.
soup = BeautifulSoup(html_doc, 'lxml')

# Get a specific element: look up a tag by its id attribute ("link1").
tag = soup.find(id='link1')
# NOTE(review): the find_element_by_* / find_elements_by_* helpers were
# removed in Selenium 4.3 in favour of find_element(By.<STRATEGY>, value) /
# find_elements(By.<STRATEGY>, value) -- confirm which Selenium version this
# project pins before relying on the calls below.
#
# Each call rebinds the same name, so only the last lookup's result is kept;
# the lines are a catalogue of the available locator strategies.

# Get a single element
element = browser.find_element_by_id('id')
element = browser.find_element_by_name('name')
element = browser.find_element_by_xpath('xpath')
element = browser.find_element_by_link_text('link text')
element = browser.find_element_by_tag_name('tag name')
element = browser.find_element_by_class_name('class name')
element = browser.find_element_by_css_selector('css selector')
element = browser.find_element_by_partial_link_text('partial link text')

# Get multiple elements
elements = browser.find_elements_by_id('id')
elements = browser.find_elements_by_name('name')
elements = browser.find_elements_by_xpath('xpath')
elements = browser.find_elements_by_link_text('link text')
elements = browser.find_elements_by_tag_name('tag name')
elements = browser.find_elements_by_class_name('class name')
elements = browser.find_elements_by_css_selector('css selector')
elements = browser.find_elements_by_partial_link_text('partial link text')