Additional Inherited Members | |
Public Member Functions inherited from BeautifulSoup.BeautifulSoup | |
def | __init__ (self, args, kwargs) |
def | start_meta (self, attrs) |
Public Member Functions inherited from BeautifulSoup.BeautifulStoneSoup | |
def | __getattr__ (self, methodName) |
def | __init__ (self, markup="", parseOnlyThese=None, fromEncoding=None, markupMassage=True, smartQuotesTo=XML_ENTITIES, convertEntities=None, selfClosingTags=None, isHTML=False) |
def | convert_charref (self, name) |
def | endData (self, containerClass=NavigableString) |
def | handle_charref (self, ref) |
def | handle_comment (self, text) |
def | handle_data (self, data) |
def | handle_decl (self, data) |
def | handle_entityref (self, ref) |
def | handle_pi (self, text) |
def | isSelfClosingTag (self, name) |
def | parse_declaration (self, i) |
def | popTag (self) |
def | pushTag (self, tag) |
def | reset (self) |
def | unknown_endtag (self, name) |
def | unknown_starttag (self, name, attrs, selfClosing=0) |
Public Member Functions inherited from BeautifulSoup.Tag | |
def | __call__ (self, args, kwargs) |
def | __contains__ (self, x) |
def | __delitem__ (self, key) |
def | __eq__ (self, other) |
def | __getattr__ (self, tag) |
def | __getitem__ (self, key) |
def | __init__ (self, parser, name, attrs=None, parent=None, previous=None) |
def | __iter__ (self) |
def | __len__ (self) |
def | __ne__ (self, other) |
def | __nonzero__ (self) |
def | __repr__ (self, encoding=DEFAULT_OUTPUT_ENCODING) |
def | __setitem__ (self, key, value) |
def | __str__ (self, encoding=DEFAULT_OUTPUT_ENCODING, prettyPrint=False, indentLevel=0) |
def | __unicode__ (self) |
def | childGenerator (self) |
def | clear (self) |
def | decompose (self) |
def | fetchText (self, text=None, recursive=True, limit=None) |
def | find (self, name=None, attrs={}, recursive=True, text=None, kwargs) |
def | findAll (self, name=None, attrs={}, recursive=True, text=None, limit=None, kwargs) |
def | firstText (self, text=None, recursive=True) |
def | get (self, key, default=None) |
def | getString (self) |
def | getText (self, separator=u"") |
def | has_key (self, key) |
def | index (self, element) |
def | prettify (self, encoding=DEFAULT_OUTPUT_ENCODING) |
def | recursiveChildGenerator (self) |
def | renderContents (self, encoding=DEFAULT_OUTPUT_ENCODING, prettyPrint=False, indentLevel=0) |
def | setString (self, string) |
Public Member Functions inherited from BeautifulSoup.PageElement | |
def | append (self, tag) |
def | extract (self) |
def | findAllNext (self, name=None, attrs={}, text=None, limit=None, kwargs) |
def | findAllPrevious (self, name=None, attrs={}, text=None, limit=None, kwargs) |
def | findNext (self, name=None, attrs={}, text=None, kwargs) |
def | findNextSibling (self, name=None, attrs={}, text=None, kwargs) |
def | findNextSiblings (self, name=None, attrs={}, text=None, limit=None, kwargs) |
def | findParent (self, name=None, attrs={}, kwargs) |
def | findParents (self, name=None, attrs={}, limit=None, kwargs) |
def | findPrevious (self, name=None, attrs={}, text=None, kwargs) |
def | findPreviousSibling (self, name=None, attrs={}, text=None, kwargs) |
def | findPreviousSiblings (self, name=None, attrs={}, text=None, limit=None, kwargs) |
def | insert (self, position, newChild) |
def | nextGenerator (self) |
def | nextSiblingGenerator (self) |
def | parentGenerator (self) |
def | previousGenerator (self) |
def | previousSiblingGenerator (self) |
def | replaceWith (self, replaceWith) |
def | replaceWithChildren (self) |
def | setup (self, parent=None, previous=None) |
def | substituteEncoding (self, str, encoding=None) |
def | toEncoding (self, s, encoding=None) |
Public Attributes inherited from BeautifulSoup.BeautifulSoup | |
declaredHTMLEncoding | |
originalEncoding | |
Public Attributes inherited from BeautifulSoup.BeautifulStoneSoup | |
convertEntities | |
convertHTMLEntities | |
convertXMLEntities | |
currentData | |
currentTag | |
declaredHTMLEncoding | |
escapeUnrecognizedEntities | |
fromEncoding | |
hidden | |
instanceSelfClosingTags | |
literal | |
markup | |
markupMassage | |
originalEncoding | |
parseOnlyThese | |
previous | |
quoteStack | |
smartQuotesTo | |
tagStack | |
Public Attributes inherited from BeautifulSoup.Tag | |
attrMap | |
attrs | |
containsSubstitutions | |
contents | |
convertHTMLEntities | |
convertXMLEntities | |
escapeUnrecognizedEntities | |
hidden | |
isSelfClosing | |
name | |
parserClass | |
Public Attributes inherited from BeautifulSoup.PageElement | |
next | |
nextSibling | |
parent | |
previous | |
previousSibling | |
Properties inherited from BeautifulSoup.Tag | |
string = property(getString, setString) | |
text = property(getText) | |
The MinimalSoup class is for parsing HTML that contains pathologically bad markup. It makes no assumptions about tag nesting, but it does know which tags are self-closing, that <script> tags contain Javascript and should not be parsed, that META tags may contain encoding information, and so on. This also makes it better for subclassing than BeautifulStoneSoup or BeautifulSoup.
Definition at line 1662 of file BeautifulSoup.py.