|
|
__init__(self,
*args,
**kwargs)
The Soup object is initialized as the 'root tag', and the
provided markup (which can be a string or a file-like object)
is fed into the underlying parser. |
source code
|
|
|
|
extractCharsetFromMeta(self,
attrs)
Beautiful Soup can detect a charset included in a META tag, try to
convert the document to that charset, and re-parse the document from
the beginning. |
source code
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
__getitem__(self,
key)
tag[key] returns the value of the 'key' attribute for the tag, and
raises an exception if the tag has no such attribute.
(Inherited from rosdeb.BeautifulSoup.Tag) |
source code
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
fetchNextSiblings(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns the siblings of this Tag that match the given criteria and
appear after this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
|
|
|
fetchPrevious(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns all items that match the given criteria and appear before
this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
fetchPreviousSiblings(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns the siblings of this Tag that match the given criteria and
appear before this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
|
|
|
find(self,
name=None,
attrs={},
recursive=True,
text=None,
**kwargs)
Return only the first child of this Tag matching the given criteria.
(Inherited from rosdeb.BeautifulSoup.Tag) |
source code
|
|
|
|
|
|
|
findAllNext(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns all items that match the given criteria and appear after this
Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
findAllPrevious(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns all items that match the given criteria and appear before
this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
findChild(self,
name=None,
attrs={},
recursive=True,
text=None,
**kwargs)
Return only the first child of this Tag matching the given criteria.
(Inherited from rosdeb.BeautifulSoup.Tag) |
source code
|
|
|
|
|
|
|
findNext(self,
name=None,
attrs={},
text=None,
**kwargs)
Returns the first item that matches the given criteria and appears
after this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
findNextSibling(self,
name=None,
attrs={},
text=None,
**kwargs)
Returns the closest sibling to this Tag that matches the given
criteria and appears after this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
findNextSiblings(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns the siblings of this Tag that match the given criteria and
appear after this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
|
|
|
|
|
|
findPrevious(self,
name=None,
attrs={},
text=None,
**kwargs)
Returns the first item that matches the given criteria and appears
before this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
findPreviousSibling(self,
name=None,
attrs={},
text=None,
**kwargs)
Returns the closest sibling to this Tag that matches the given
criteria and appears before this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
findPreviousSiblings(self,
name=None,
attrs={},
text=None,
limit=None,
**kwargs)
Returns the siblings of this Tag that match the given criteria and
appear before this Tag in the document.
(Inherited from rosdeb.BeautifulSoup.PageElement) |
source code
|
|
|
|
first(self,
name=None,
attrs={},
recursive=True,
text=None,
**kwargs)
Return only the first child of this Tag matching the given criteria.
(Inherited from rosdeb.BeautifulSoup.Tag) |
source code
|
|
|
|
|
|
|
get(self,
key,
default=None)
Returns the value of the 'key' attribute for the tag, or the value
given for 'default' if it doesn't have that attribute.
(Inherited from rosdeb.BeautifulSoup.Tag) |
source code
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
SELF_CLOSING_TAGS = {'base': None, 'br': None, 'frame': None, ...
|
|
|
PRESERVE_WHITESPACE_TAGS = set(['pre', 'textarea'])
|
|
|
QUOTE_TAGS = {'script': None, 'textarea': None}
|
|
|
NESTABLE_INLINE_TAGS = ['span', 'font', 'q', 'object', 'bdo', ...
|
|
|
NESTABLE_BLOCK_TAGS = ['blockquote', 'div', 'fieldset', 'ins',...
|
|
|
NESTABLE_LIST_TAGS = {'dd': ['dl'], 'dl': [], 'dt': ['dl'], 'l...
|
|
|
NESTABLE_TABLE_TAGS = {'table': [], 'tbody': ['table'], 'td': ...
|
|
|
NON_NESTABLE_BLOCK_TAGS = ['address', 'form', 'p', 'pre']
|
|
|
RESET_NESTING_TAGS = {'address': None, 'blockquote': None, 'dd...
|
|
|
NESTABLE_TAGS = {'bdo': [], 'blockquote': [], 'center': [], 'd...
|
|
|
CHARSET_RE = re.compile(r'(?m)((^|;)\s*charset=)([^;]*)')
|
|
|
ALL_ENTITIES = 'xhtml'
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
BARE_AMPERSAND_OR_BRACKET = re.compile(r'([<>]|&(?!#\d+;|#x[0-...
(Inherited from rosdeb.BeautifulSoup.Tag)
|
|
|
HTML_ENTITIES = 'html'
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
MARKUP_MASSAGE = [(re.compile('(<[^<>]*)/>'), lambda x: x.grou...
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
ROOT_TAG_NAME = u'[document]'
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
STRIP_ASCII_SPACES = {9: None, 10: None, 12: None, 13: None, 3...
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
XHTML_ENTITIES = 'xhtml'
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
XML_ENTITIES = 'xml'
(Inherited from rosdeb.BeautifulSoup.BeautifulStoneSoup)
|
|
|
XML_ENTITIES_TO_SPECIAL_CHARS = {'amp': '&', 'apos': '\'', 'gt...
(Inherited from rosdeb.BeautifulSoup.Tag)
|
|
|
XML_SPECIAL_CHARS_TO_ENTITIES = {'"': 'quot', '&': 'amp', '\''...
(Inherited from rosdeb.BeautifulSoup.Tag)
|