May-07-2020, 10:48 AM
# Find the CSS class of the <div> whose text is exactly "Specifications".
import bs4

# Truncated product-page fragment used as sample input (tags are left unclosed
# on purpose; the parser tolerates that).
html_string = '''<div class="bhgxx2 col-12-12">
<div class="MocXoX">
<div class="_2GiuhO">Specifications</div>
<div>
<div class="_3Rrcbo V39ti-">
<div class="_2RngUh">
<div class="_2lzn0o">General</div>
<table class="_3ENrHu">
<tbody>
<tr class="_3_6Uyw row">
<td class="_3-wDH3 col col-3-12">Sales Package</td>
<td class="_2k4JXJ col col-9-12">
<ul>
<li class="_3YhLQA">Laptop, Power Adaptor, User Guide, Warranty Documents</li>
</ul>
</td>
</tr>
<tr class="_3_6Uyw row">
<td class="_3-wDH3 col col-3-12">Model Number</td>
<td class="_2k4JXJ col col-9-12">
<ul>'''

# Name the parser explicitly so the resulting tree does not depend on which
# optional parsers happen to be installed, and so no parser warning is emitted.
soup = bs4.BeautifulSoup(html_string, 'html.parser')

# Test each classed <div> itself rather than re-searching the whole document
# by class name: this avoids the None lookups that previously needed a bare
# ``except`` to hide, and cannot report a class based on a different element.
for element in soup.find_all('div', class_=True):
    classes = element['class']
    # Guard against an empty class list before indexing into it.
    if classes and element.get_text() == 'Specifications':
        print(classes[0])

# Output:
# _2GiuhO