BeautifulSoup 对象方法

来源:互联网 发布:王者归来 软件程序 编辑:程序博客网 时间:2024/06/15 06:50
# Demonstration of common BeautifulSoup (bs4) object methods: tree
# navigation, searching, and in-place modification of a small HTML document.
import re

from bs4 import BeautifulSoup, CData, Tag

doc = [
    '<html><head><title>Page title</title></head>',
    '<body><p id="firstpara" align="center">This is paragraph <b>one</b>.</p>',
    '<p id="secondpara" align="blah">This is paragraph <b>two</b>.</p>',
    '</body></html>',
]

# Name the parser explicitly so the resulting tree does not depend on which
# optional parsers (lxml, html5lib) happen to be installed.
soup = BeautifulSoup(''.join(doc), "html.parser")

# prettify is a method: it must be called to obtain the formatted markup.
print(soup.prettify())

# --- Navigating downwards through .contents ---
print(soup.contents[0].name)
print(soup.contents[0].contents[0].name)
print(soup.contents[0].contents[0].contents[0].string)

# --- Navigating from a tag to its parent, next element and next sibling ---
head = soup.contents[0].contents[0]
print(head.parent.name)
print(head.next_element)
print(head.next_sibling.name)
print(head.next_sibling.contents[0])
# The original listing prints the same node a second time; kept as-is.
print(head.next_sibling.contents[0])

# --- Searching the tree ---
print(soup.find_all('p', align="center"))
print(soup.find('p', align="center"))
# Calling the soup object directly is shorthand for find_all().
print(soup('p', align="center")[0]['id'])
print(soup.find('p').b.string)
print(soup('p')[1].b.string)

# --- Modifying the tree ---
title_tag = soup.html.head.title
title_tag['id'] = 'theTitle'
print(title_tag)
title_tag.contents[0].replace_with("new title")

# Replace the first <p> with the first <b> tag found in the document.
soup.p.replace_with(soup.b)
print(soup.prettify())

soup.body.insert(0, "this page used to have")

0 0
原创粉丝点击