Foo
Bar
Baz

Foo
Bar
Baz

An H1

Some text

Some more text

An H2

Another

Bob

Another H2

me span1a1 span1a2 test span2a1

English

English UK

English US

French

""" def setUp(self): self.soup = BeautifulSoup(self.HTML, 'html.parser') def assertSelects(self, selector, expected_ids, **kwargs): el_ids = [el['id'] for el in self.soup.select(selector, **kwargs)] el_ids.sort() expected_ids.sort() self.assertEqual(expected_ids, el_ids, "Selector %s, expected [%s], got [%s]" % ( selector, ', '.join(expected_ids), ', '.join(el_ids) ) ) assertSelect = assertSelects def assertSelectMultiple(self, *tests): for selector, expected_ids in tests: self.assertSelect(selector, expected_ids) def test_one_tag_one(self): els = self.soup.select('title') self.assertEqual(len(els), 1) self.assertEqual(els[0].name, 'title') self.assertEqual(els[0].contents, ['The title']) def test_one_tag_many(self): els = self.soup.select('div') self.assertEqual(len(els), 4) for div in els: self.assertEqual(div.name, 'div') el = self.soup.select_one('div') self.assertEqual('main', el['id']) def test_select_one_returns_none_if_no_match(self): match = self.soup.select_one('nonexistenttag') self.assertEqual(None, match) def test_tag_in_tag_one(self): els = self.soup.select('div div') self.assertSelects('div div', ['inner', 'data1']) def test_tag_in_tag_many(self): for selector in ('html div', 'html body div', 'body div'): self.assertSelects(selector, ['data1', 'main', 'inner', 'footer']) def test_limit(self): self.assertSelects('html div', ['main'], limit=1) self.assertSelects('html body div', ['inner', 'main'], limit=2) self.assertSelects('body div', ['data1', 'main', 'inner', 'footer'], limit=10) def test_tag_no_match(self): self.assertEqual(len(self.soup.select('del')), 0) def test_invalid_tag(self): self.assertRaises(ValueError, self.soup.select, 'tag%t') def test_select_dashed_tag_ids(self): self.assertSelects('custom-dashed-tag', ['dash1', 'dash2']) def test_select_dashed_by_id(self): dashed = self.soup.select('custom-dashed-tag[id=\"dash2\"]') self.assertEqual(dashed[0].name, 'custom-dashed-tag') self.assertEqual(dashed[0]['id'], 'dash2') def test_dashed_tag_text(self): self.assertEqual(self.soup.select('body > custom-dashed-tag')[0].text, 'Hello there.') def test_select_dashed_matches_find_all(self): self.assertEqual(self.soup.select('custom-dashed-tag'), self.soup.find_all('custom-dashed-tag')) def test_header_tags(self): self.assertSelectMultiple( ('h1', ['header1']), ('h2', ['header2', 'header3']), ) def test_class_one(self): for selector in ('.onep', 'p.onep', 'html p.onep'): els = self.soup.select(selector) self.assertEqual(len(els), 1) self.assertEqual(els[0].name, 'p') self.assertEqual(els[0]['class'], ['onep']) def test_class_mismatched_tag(self): els = self.soup.select('div.onep') self.assertEqual(len(els), 0) def test_one_id(self): for selector in ('div#inner', '#inner', 'div div#inner'): self.assertSelects(selector, ['inner']) def test_bad_id(self): els = self.soup.select('#doesnotexist') self.assertEqual(len(els), 0) def test_items_in_id(self): els = self.soup.select('div#inner p') self.assertEqual(len(els), 3) for el in els: self.assertEqual(el.name, 'p') self.assertEqual(els[1]['class'], ['onep']) self.assertFalse(els[0].has_attr('class')) def test_a_bunch_of_emptys(self): for selector in ('div#main del', 'div#main div.oops', 'div div#main'): self.assertEqual(len(self.soup.select(selector)), 0) def test_multi_class_support(self): for selector in ('.class1', 'p.class1', '.class2', 'p.class2', '.class3', 'p.class3', 'html p.class2', 'div#inner .class2'): self.assertSelects(selector, ['pmulti']) def test_multi_class_selection(self): for selector in ('.class1.class3', '.class3.class2', '.class1.class2.class3'): self.assertSelects(selector, ['pmulti']) def test_child_selector(self): self.assertSelects('.s1 > a', ['s1a1', 's1a2']) self.assertSelects('.s1 > a span', ['s1a2s1']) def test_child_selector_id(self): self.assertSelects('.s1 > a#s1a2 span', ['s1a2s1']) def test_attribute_equals(self): self.assertSelectMultiple( ('p[class="onep"]', ['p1']), ('p[id="p1"]', ['p1']), ('[class="onep"]', ['p1']), ('[id="p1"]', ['p1']), ('link[rel="stylesheet"]', ['l1']), ('link[type="text/css"]', ['l1']), ('link[href="blah.css"]', ['l1']), ('link[href="no-blah.css"]', []), ('[rel="stylesheet"]', ['l1']), ('[type="text/css"]', ['l1']), ('[href="blah.css"]', ['l1']), ('[href="no-blah.css"]', []), ('p[href="no-blah.css"]', []), ('[href="no-blah.css"]', []), ) def test_attribute_tilde(self): self.assertSelectMultiple( ('p[class~="class1"]', ['pmulti']), ('p[class~="class2"]', ['pmulti']), ('p[class~="class3"]', ['pmulti']), ('[class~="class1"]', ['pmulti']), ('[class~="class2"]', ['pmulti']), ('[class~="class3"]', ['pmulti']), ('a[rel~="friend"]', ['bob']), ('a[rel~="met"]', ['bob']), ('[rel~="friend"]', ['bob']), ('[rel~="met"]', ['bob']), ) def test_attribute_startswith(self): self.assertSelectMultiple( ('[rel^="style"]', ['l1']), ('link[rel^="style"]', ['l1']), ('notlink[rel^="notstyle"]', []), ('[rel^="notstyle"]', []), ('link[rel^="notstyle"]', []), ('link[href^="bla"]', ['l1']), ('a[href^="http://"]', ['bob', 'me']), ('[href^="http://"]', ['bob', 'me']), ('[id^="p"]', ['pmulti', 'p1']), ('[id^="m"]', ['me', 'main']), ('div[id^="m"]', ['main']), ('a[id^="m"]', ['me']), ('div[data-tag^="dashed"]', ['data1']) ) def test_attribute_endswith(self): self.assertSelectMultiple( ('[href$=".css"]', ['l1']), ('link[href$=".css"]', ['l1']), ('link[id$="1"]', ['l1']), ('[id$="1"]', ['data1', 'l1', 'p1', 'header1', 's1a1', 's2a1', 's1a2s1', 'dash1']), ('div[id$="1"]', ['data1']), ('[id$="noending"]', []), ) def test_attribute_contains(self): self.assertSelectMultiple( # From test_attribute_startswith ('[rel*="style"]', ['l1']), ('link[rel*="style"]', ['l1']), ('notlink[rel*="notstyle"]', []), ('[rel*="notstyle"]', []), ('link[rel*="notstyle"]', []), ('link[href*="bla"]', ['l1']), ('[href*="http://"]', ['bob', 'me']), ('[id*="p"]', ['pmulti', 'p1']), ('div[id*="m"]', ['main']), ('a[id*="m"]', ['me']), # From test_attribute_endswith ('[href*=".css"]', ['l1']), ('link[href*=".css"]', ['l1']), ('link[id*="1"]', ['l1']), ('[id*="1"]', ['data1', 'l1', 'p1', 'header1', 's1a1', 's1a2', 's2a1', 's1a2s1', 'dash1']), ('div[id*="1"]', ['data1']), ('[id*="noending"]', []), # New for this test ('[href*="."]', ['bob', 'me', 'l1']), ('a[href*="."]', ['bob', 'me']), ('link[href*="."]', ['l1']), ('div[id*="n"]', ['main', 'inner']), ('div[id*="nn"]', ['inner']), ('div[data-tag*="edval"]', ['data1']) ) def test_attribute_exact_or_hypen(self): self.assertSelectMultiple( ('p[lang|="en"]', ['lang-en', 'lang-en-gb', 'lang-en-us']), ('[lang|="en"]', ['lang-en', 'lang-en-gb', 'lang-en-us']), ('p[lang|="fr"]', ['lang-fr']), ('p[lang|="gb"]', []), ) def test_attribute_exists(self): self.assertSelectMultiple( ('[rel]', ['l1', 'bob', 'me']), ('link[rel]', ['l1']), ('a[rel]', ['bob', 'me']), ('[lang]', ['lang-en', 'lang-en-gb', 'lang-en-us', 'lang-fr']), ('p[class]', ['p1', 'pmulti']), ('[blah]', []), ('p[blah]', []), ('div[data-tag]', ['data1']) ) def test_quoted_space_in_selector_name(self): html = """

nope

yes

""" soup = BeautifulSoup(html, 'html.parser') [chosen] = soup.select('div[style="display: right"]') self.assertEqual("yes", chosen.string) def test_unsupported_pseudoclass(self): self.assertRaises( NotImplementedError, self.soup.select, "a:no-such-pseudoclass") self.assertRaises( NotImplementedError, self.soup.select, "a:nth-of-type(a)") def test_nth_of_type(self): # Try to select first paragraph els = self.soup.select('div#inner p:nth-of-type(1)') self.assertEqual(len(els), 1) self.assertEqual(els[0].string, 'Some text') # Try to select third paragraph els = self.soup.select('div#inner p:nth-of-type(3)') self.assertEqual(len(els), 1) self.assertEqual(els[0].string, 'Another') # Try to select (non-existent!) fourth paragraph els = self.soup.select('div#inner p:nth-of-type(4)') self.assertEqual(len(els), 0) # Pass in an invalid value. self.assertRaises( ValueError, self.soup.select, 'div p:nth-of-type(0)') def test_nth_of_type_direct_descendant(self): els = self.soup.select('div#inner > p:nth-of-type(1)') self.assertEqual(len(els), 1) self.assertEqual(els[0].string, 'Some text') def test_id_child_selector_nth_of_type(self): self.assertSelects('#inner > p:nth-of-type(2)', ['p1']) def test_select_on_element(self): # Other tests operate on the tree; this operates on an element # within the tree. inner = self.soup.find("div", id="main") selected = inner.select("div") # The

tag was selected. The

# tag was not. self.assertSelectsIDs(selected, ['inner', 'data1']) def test_overspecified_child_id(self): self.assertSelects(".fancy #inner", ['inner']) self.assertSelects(".normal #inner", []) def test_adjacent_sibling_selector(self): self.assertSelects('#p1 + h2', ['header2']) self.assertSelects('#p1 + h2 + p', ['pmulti']) self.assertSelects('#p1 + #header2 + .class1', ['pmulti']) self.assertEqual([], self.soup.select('#p1 + p')) def test_general_sibling_selector(self): self.assertSelects('#p1 ~ h2', ['header2', 'header3']) self.assertSelects('#p1 ~ #header2', ['header2']) self.assertSelects('#p1 ~ h2 + a', ['me']) self.assertSelects('#p1 ~ h2 + [rel="me"]', ['me']) self.assertEqual([], self.soup.select('#inner ~ h2')) def test_dangling_combinator(self): self.assertRaises(ValueError, self.soup.select, 'h1 >') def test_sibling_combinator_wont_select_same_tag_twice(self): self.assertSelects('p[lang] ~ p', ['lang-en-gb', 'lang-en-us', 'lang-fr']) # Test the selector grouping operator (the comma) def test_multiple_select(self): self.assertSelects('x, y', ['xid', 'yid']) def test_multiple_select_with_no_space(self): self.assertSelects('x,y', ['xid', 'yid']) def test_multiple_select_with_more_space(self): self.assertSelects('x, y', ['xid', 'yid']) def test_multiple_select_duplicated(self): self.assertSelects('x, x', ['xid']) def test_multiple_select_sibling(self): self.assertSelects('x, y ~ p[lang=fr]', ['xid', 'lang-fr']) def test_multiple_select_tag_and_direct_descendant(self): self.assertSelects('x, y > z', ['xid', 'zidb']) def test_multiple_select_direct_descendant_and_tags(self): self.assertSelects('div > x, y, z', ['xid', 'yid', 'zida', 'zidb', 'zidab', 'zidac']) def test_multiple_select_indirect_descendant(self): self.assertSelects('div x,y, z', ['xid', 'yid', 'zida', 'zidb', 'zidab', 'zidac']) def test_invalid_multiple_select(self): self.assertRaises(ValueError, self.soup.select, ',x, y') self.assertRaises(ValueError, self.soup.select, 'x,,y') def test_multiple_select_attrs(self): self.assertSelects('p[lang=en], p[lang=en-gb]', ['lang-en', 'lang-en-gb']) def test_multiple_select_ids(self): self.assertSelects('x, y > z[id=zida], z[id=zidab], z[id=zidb]', ['xid', 'zidb', 'zidab']) def test_multiple_select_nested(self): self.assertSelects('body > div > x, y > z', ['xid', 'zidb']) def test_select_duplicate_elements(self): # When markup contains duplicate elements, a multiple select # will find all of them. markup = '

' soup = BeautifulSoup(markup, 'html.parser') selected = soup.select(".c1, .c2") self.assertEqual(3, len(selected)) # Verify that find_all finds the same elements, though because # of an implementation detail it finds them in a different # order. for element in soup.find_all(class_=['c1', 'c2']): assert element in selected PK�je[�nb++tests/test_html5lib.pynu�[��"""Tests to ensure that the html5lib tree builder generates good trees.""" import warnings try: from bs4.builder import HTML5TreeBuilder HTML5LIB_PRESENT = True except ImportError as e: HTML5LIB_PRESENT = False from bs4.element import SoupStrainer from bs4.testing import ( HTML5TreeBuilderSmokeTest, SoupTest, skipIf, ) @skipIf( not HTML5LIB_PRESENT, "html5lib seems not to be present, not testing its tree builder.") class HTML5LibBuilderSmokeTest(SoupTest, HTML5TreeBuilderSmokeTest): """See ``HTML5TreeBuilderSmokeTest``.""" @property def default_builder(self): return HTML5TreeBuilder() def test_soupstrainer(self): # The html5lib tree builder does not support SoupStrainers. strainer = SoupStrainer("b") markup = "

A bold statement.

" with warnings.catch_warnings(record=True) as w: soup = self.soup(markup, parse_only=strainer) self.assertEqual( soup.decode(), self.document_for(markup)) self.assertTrue( "the html5lib tree builder doesn't support parse_only" in str(w[0].message)) def test_correctly_nested_tables(self): """html5lib inserts tags where other parsers don't.""" markup = ('' '' "') self.assertSoupEquals( markup, '

Here's another table:" '' '' '

foo

Here\'s another table:' '

foo

' '

') self.assertSoupEquals( "" "" "

Foo
Bar
Baz

") def test_xml_declaration_followed_by_doctype(self): markup = '''

foo

''' soup = self.soup(markup) # Verify that we can reach the

tag; this means the tree is connected. self.assertEqual(b"

foo

", soup.p.encode()) def test_reparented_markup(self): markup = '

foo

bar

' soup = self.soup(markup) self.assertEqual("

foo

bar

", soup.body.decode()) self.assertEqual(2, len(soup.find_all('p'))) def test_reparented_markup_ends_with_whitespace(self): markup = '

foo

bar

\n' soup = self.soup(markup) self.assertEqual("

foo

bar

\n", soup.body.decode()) self.assertEqual(2, len(soup.find_all('p'))) def test_reparented_markup_containing_identical_whitespace_nodes(self): """Verify that we keep the two whitespace nodes in this document distinct when reparenting the adjacent tags. """ markup = '

' soup = self.soup(markup) space1, space2 = soup.find_all(string=' ') tbody1, tbody2 = soup.find_all('tbody') assert space1.next_element is tbody1 assert tbody2.next_element is space2 def test_reparented_markup_containing_children(self): markup = '

aftermath

' soup = self.soup(markup) noscript = soup.noscript self.assertEqual("target", noscript.next_element) target = soup.find(string='target') # The 'aftermath' string was duplicated; we want the second one. final_aftermath = soup.find_all(string='aftermath')[-1] # The

tag, # but the 'target' string within is still connected to the # (second) 'aftermath' string. self.assertEqual(final_aftermath, target.next_element) self.assertEqual(target, final_aftermath.previous_element) def test_processing_instruction(self): """Processing instructions become comments.""" markup = b"""""" soup = self.soup(markup) assert str(soup).startswith("") def test_cloned_multivalue_node(self): markup = b"""""" soup = self.soup(markup) a1, a2 = soup.find_all('a') self.assertEqual(a1, a2) assert a1 is not a2 def test_foster_parenting(self): markup = b"""

foo") dumped = pickle.dumps(tree, 2) loaded = pickle.loads(dumped) self.assertTrue(isinstance(loaded.builder, type(tree.builder))) def test_redundant_empty_element_closing_tags(self): self.assertSoupEquals('

', "

") self.assertSoupEquals('

', "") def test_empty_element(self): # This verifies that any buffered data present when the parser # finishes working is handled. self.assertSoupEquals("foo &# bar", "foo &# bar") class TestHTMLParserSubclass(SoupTest): def test_error(self): """Verify that our HTMLParser subclass implements error() in a way that doesn't cause a crash. """ parser = BeautifulSoupHTMLParser() parser.error("don't crash") PK��je[��+��+��tests/test_docs.pynu��[��"Test harness for doctests." # pylint: disable-msg=E0611,W0142 __metaclass__ = type __all__ = [ 'additional_tests', ] import atexit import doctest import os #from pkg_resources import ( # resource_filename, resource_exists, resource_listdir, cleanup_resources) import unittest DOCTEST_FLAGS = ( doctest.ELLIPSIS | doctest.NORMALIZE_WHITESPACE | doctest.REPORT_NDIFF) # def additional_tests(): # "Run the doc tests (README.txt and docs/*, if any exist)" # doctest_files = [ # os.path.abspath(resource_filename('bs4', 'README.txt'))] # if resource_exists('bs4', 'docs'): # for name in resource_listdir('bs4', 'docs'): # if name.endswith('.txt'): # doctest_files.append( # os.path.abspath( # resource_filename('bs4', 'docs/%s' % name))) # kwargs = dict(module_relative=False, optionflags=DOCTEST_FLAGS) # atexit.register(cleanup_resources) # return unittest.TestSuite(( # doctest.DocFileSuite(*doctest_files, **kwargs))) PK��je[��j��tests/test_builder_registry.pynu��[��"""Tests of the builder registry.""" import unittest import warnings from bs4 import BeautifulSoup from bs4.builder import ( builder_registry as registry, HTMLParserTreeBuilder, TreeBuilderRegistry, ) try: from bs4.builder import HTML5TreeBuilder HTML5LIB_PRESENT = True except ImportError: HTML5LIB_PRESENT = False try: from bs4.builder import ( LXMLTreeBuilderForXML, LXMLTreeBuilder, ) LXML_PRESENT = True except ImportError: LXML_PRESENT = False class BuiltInRegistryTest(unittest.TestCase): """Test the built-in registry with the default builders registered.""" def test_combination(self): if LXML_PRESENT: self.assertEqual(registry.lookup('fast', 'html'), LXMLTreeBuilder) if LXML_PRESENT: self.assertEqual(registry.lookup('permissive', 'xml'), LXMLTreeBuilderForXML) self.assertEqual(registry.lookup('strict', 'html'), HTMLParserTreeBuilder) if HTML5LIB_PRESENT: self.assertEqual(registry.lookup('html5lib', 'html'), HTML5TreeBuilder) def test_lookup_by_markup_type(self): if LXML_PRESENT: self.assertEqual(registry.lookup('html'), LXMLTreeBuilder) self.assertEqual(registry.lookup('xml'), LXMLTreeBuilderForXML) else: self.assertEqual(registry.lookup('xml'), None) if HTML5LIB_PRESENT: self.assertEqual(registry.lookup('html'), HTML5TreeBuilder) else: self.assertEqual(registry.lookup('html'), HTMLParserTreeBuilder) def test_named_library(self): if LXML_PRESENT: self.assertEqual(registry.lookup('lxml', 'xml'), LXMLTreeBuilderForXML) self.assertEqual(registry.lookup('lxml', 'html'), LXMLTreeBuilder) if HTML5LIB_PRESENT: self.assertEqual(registry.lookup('html5lib'), HTML5TreeBuilder) self.assertEqual(registry.lookup('html.parser'), HTMLParserTreeBuilder) def test_beautifulsoup_constructor_does_lookup(self): with warnings.catch_warnings(record=True) as w: # This will create a warning about not explicitly # specifying a parser, but we'll ignore it. # You can pass in a string. BeautifulSoup("", features="html") # Or a list of strings. BeautifulSoup("", features=["html", "fast"]) # You'll get an exception if BS can't find an appropriate # builder. self.assertRaises(ValueError, BeautifulSoup, "", features="no-such-feature") class RegistryTest(unittest.TestCase): """Test the TreeBuilderRegistry class in general.""" def setUp(self): self.registry = TreeBuilderRegistry() def builder_for_features(self, *feature_list): cls = type('Builder_' + '_'.join(feature_list), (object,), {'features' : feature_list}) self.registry.register(cls) return cls def test_register_with_no_features(self): builder = self.builder_for_features() # Since the builder advertises no features, you can't find it # by looking up features. self.assertEqual(self.registry.lookup('foo'), None) # But you can find it by doing a lookup with no features, if # this happens to be the only registered builder. self.assertEqual(self.registry.lookup(), builder) def test_register_with_features_makes_lookup_succeed(self): builder = self.builder_for_features('foo', 'bar') self.assertEqual(self.registry.lookup('foo'), builder) self.assertEqual(self.registry.lookup('bar'), builder) def test_lookup_fails_when_no_builder_implements_feature(self): builder = self.builder_for_features('foo', 'bar') self.assertEqual(self.registry.lookup('baz'), None) def test_lookup_gets_most_recent_registration_when_no_feature_specified(self): builder1 = self.builder_for_features('foo') builder2 = self.builder_for_features('bar') self.assertEqual(self.registry.lookup(), builder2) def test_lookup_fails_when_no_tree_builders_registered(self): self.assertEqual(self.registry.lookup(), None) def test_lookup_gets_most_recent_builder_supporting_all_features(self): has_one = self.builder_for_features('foo') has_the_other = self.builder_for_features('bar') has_both_early = self.builder_for_features('foo', 'bar', 'baz') has_both_late = self.builder_for_features('foo', 'bar', 'quux') lacks_one = self.builder_for_features('bar') has_the_other = self.builder_for_features('foo') # There are two builders featuring 'foo' and 'bar', but # the one that also features 'quux' was registered later. self.assertEqual(self.registry.lookup('foo', 'bar'), has_both_late) # There is only one builder featuring 'foo', 'bar', and 'baz'. self.assertEqual(self.registry.lookup('foo', 'bar', 'baz'), has_both_early) def test_lookup_fails_when_cannot_reconcile_requested_features(self): builder1 = self.builder_for_features('foo', 'bar') builder2 = self.builder_for_features('foo', 'baz') self.assertEqual(self.registry.lookup('bar', 'baz'), None) PK��je[ʮ�s8U��8U��0��tests/__pycache__/test_soup.cpython-36.opt-1.pycnu��[��3 *6]dO��@��s~��d�Z�ddlmZ�ddlZddlZddlZddlZddlmZm Z �ddl mZmZm Z mZ�ddlZddlmZmZmZ�ddlmZmZ�ddlZyddlmZmZ�d ZW�n&�ek r��Z�z d ZW�Y�ddZ[X�nX�ejd�dko�ejdk�ZG�d d��de�ZG�dd��de�Z G�dd��de�Z G�dd��de�Z!G�dd��dej"�Z#G�dd��de�Z$G�dd��dej"�Z%G�dd��de�Z&G�dd��dej"�Z'dS�)z#Tests of Beautiful Soup as a whole.��)� set_traceN)� BeautifulSoup�BeautifulStoneSoup)�CharsetMetaAttributeValue�ContentMetaAttributeValue�SoupStrainer�NamespacedAttribute)�EntitySubstitution� UnicodeDammit�EncodingDetector)�SoupTest�skipIf)�LXMLTreeBuilder�LXMLTreeBuilderForXMLTF��c��@��s$��e�Zd�Zdd��Zdd��Zdd��ZdS�)�TestConstructorc��C��s"��d}|�j�|�}|�jd|jj��d�S�)Nu ��

éé

u��éé)�soup�assertEqual�h1�string)�self�datar��r��/usr/lib/python3.6/test_soup.py�test_short_unicode_input*��s�� z(TestConstructor.test_short_unicode_inputc��C��s"��d}|�j�|�}|�jd|jj��d�S�)Nz

foo�bar

r<��)r��r��Zdivr��)r��rR��r��r��r��1test_attribute_name_containing_unicode_characters��s��zHTestEncodingConversion.test_attribute_name_containing_unicode_characters)r"��r#��r$��rV��rx��r{��r|��r}��r ��PYTHON_3_PRE_3_2r~�� __classcell__r��r��)rk��r��rh��s�� rh��c��@��s��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��Zdd��Zdd��Zd d!��Zd"d#��Zd$S�)%�TestUnicodeDammitz"Standalone tests of UnicodeDammit.c��C��s��d}t�|�}|�j|j|��d�S�)Nu��I'm already Unicode! ☃)r ��r��unicode_markup)r��rR��rY��r��r��r��test_unicode_input"��s��z$TestUnicodeDammit.test_unicode_inputc��C��s��d}t�|�}|�j|jd��d�S�)Ns��z#\u2018\u2019\u201c\u201d)r ��r��r��)r��rR��rY��r��r��r��test_smart_quotes_to_unicode'��s��z.TestUnicodeDammit.test_smart_quotes_to_unicodec��C��s"��d}t�|dd�}|�j|jd��d�S�)Ns��Zxml)�smart_quotes_toz+‘’“”)r ��r��r��)r��rR��rY��r��r��r��!test_smart_quotes_to_xml_entities-��s��z3TestUnicodeDammit.test_smart_quotes_to_xml_entitiesc��C��s"��d}t�|dd�}|�j|jd��d�S�)Ns��r5��)r��z'‘’“”)r ��r��r��)r��rR��rY��r��r��r��"test_smart_quotes_to_html_entities3��s��z4TestUnicodeDammit.test_smart_quotes_to_html_entitiesc��C��s"��d}t�|dd�}|�j|jd��d�S�)Ns��rw��)r��z''"")r ��r��r��)r��rR��rY��r��r��r��test_smart_quotes_to_ascii9��s��z,TestUnicodeDammit.test_smart_quotes_to_asciic��C��s0��d}t�|�}|�j|jj��d��|�j|jd��d�S�)Ns��Sacré bleu! ☃zutf-8u��Sacré bleu! ☃)r ��r��r��rt��r��)r��r<��rY��r��r��r��test_detect_utf8?��s��z"TestUnicodeDammit.test_detect_utf8c��C��s4��d}t�|dg�}|�j|jj��d��|�j|jd��d�S�)Ns��z iso-8859-8z\u05dd\u05d5\u05dc\u05e9)r ��r��r��rt��r��)r��hebrewrY��r��r��r��test_convert_hebrewF��s��z%TestUnicodeDammit.test_convert_hebrewc��C��s6��d}t�|�}|�j|jj��d��|�j|jjd�|��d�S�)Ns��ケータイ Watchzutf-8)r ��r��r��rt��r��r��)r��utf_8rY��r��r��r��/test_dont_see_smart_quotes_where_there_are_noneL��s��zATestUnicodeDammit.test_dont_see_smart_quotes_where_there_are_nonec��C��s,��dj�d�}t|dg�}|�j|jj��d��d�S�)Nu ��Räksmörgåszutf-8z iso-8859-8)r��r ��r��r��rt��)r��r ��rY��r��r��r�� test_ignore_inappropriate_codecsR��s�� z2TestUnicodeDammit.test_ignore_inappropriate_codecsc��C��s:��dj�d�}x*dD�]"}t||g�}|�j|jj��d��qW�d�S�)Nu ��Räksmörgåszutf-8�.utf8�...� utF---16.!)r��r��r��)r��r ��r��r��rt��)r��r ��Zbad_encodingrY��r��r��r��test_ignore_invalid_codecsW��s�� z,TestUnicodeDammit.test_ignore_invalid_codecsc��C��sL��dj�d�}t|dgd�}|�j|jj��d��t|ddgd�}|�j|jd��d�S�)Nu ��Räksmörgåszutf-8)r��zwindows-1252)r��r ��r��r��rt��)r��r ��rY��r��r��r��r!��]��s�� z(TestUnicodeDammit.test_exclude_encodingsc��C��s��t�d�}t|j�}d�S�)Ns'��)r��list� encodings)r��Zdetectedr��r��r��r��Ptest_encoding_detector_replaces_junk_in_encoding_name_with_replacement_characterk��s�� zbTestUnicodeDammit.test_encoding_detector_replaces_junk_in_encoding_name_with_replacement_characterc��C��s,��x&dD�]}t�|dd�}|�jd|j��qW�d�S�) N�&��&��$��#��T)Zis_htmlzeuc-jp)r��r��r��r��)r ��r��r��)r��r��rY��r��r��r�� test_detect_html5_style_meta_tagq��s��z2TestUnicodeDammit.test_detect_html5_style_meta_tagc��C��s��d}t�jj}tjtj��zPdd��}|t�j_t|�}|�jd|j��|�j d|j k��t|d�}|�j |j��W�d�tjtj��|t�j_X�d�S�)NsT�� بتر ��ѐ��c��S��s��d�S�)Nr��)r/��r��r��r��rl��s��zBTestUnicodeDammit.test_last_ditch_entity_replacement..noopTz\ufffdzhtml.parser) rm��rY��rn��ro��rp��rq��r ��r��Zcontains_replacement_charactersr(��r��r��ru��)r��docrv��rl��rY��r��r��r��r��"test_last_ditch_entity_replacement|��s�� z4TestUnicodeDammit.test_last_ditch_entity_replacementc��C��s,��d}t�|�}|�jd|j��|�jd|j��d�S�)Ns��<�a�>��<�/�a�>�u��áézutf-16le)r ��r��r��r��)r��r��rY��r��r��r��test_byte_order_mark_removed��s��z.TestUnicodeDammit.test_byte_order_mark_removedc��C��sP��dj�d�}dj�d�}||�|�}|�jt|jd��tj|�}|�jd|jd��d�S�)Nu��☃r��r<��u��“Hi, I like Windows!”�windows_1252u+��☃☃☃“Hi, I like Windows!”☃☃☃u ��☃☃☃)r��r?��UnicodeDecodeErrorrr��r �� detwingler��)r��r<��r��r��Zfixedr��r��r��test_detwingle��s�� z TestUnicodeDammit.test_detwinglec��C��sB��x��s6��,/ E<�/PK��je[]_@u� �� 0��tests/__pycache__/test_htmlparser.cpython-36.pycnu��[��3 Y=K[��@��sf��d�Z�ddlmZ�ddlZddlmZmZ�ddlmZ�ddl m Z �G�dd��dee�ZG�d d ��d e�ZdS�)zGTests to ensure that the html.parser tree builder generates good trees.��)� set_traceN)�SoupTest�HTMLTreeBuilderSmokeTest)�HTMLParserTreeBuilder)�BeautifulSoupHTMLParserc��@��s@��e�Zd�Zedd��Zdd��Zdd��Zdd��Zd d ��Zdd��Z d S�)�HTMLParserTreeBuilderSmokeTestc��C��s��t��S�)N)r��)�self��r ��%/usr/lib/python3.6/test_htmlparser.py�default_builder��s��z.HTMLParserTreeBuilderSmokeTest.default_builderc��C��s��d�S�)Nr ��)r��r ��r ��r ��test_namespaced_system_doctype��s��z=HTMLParserTreeBuilderSmokeTest.test_namespaced_system_doctypec��C��s��d�S�)Nr ��)r��r ��r ��r ��test_namespaced_public_doctype��s��z=HTMLParserTreeBuilderSmokeTest.test_namespaced_public_doctypec��C��s<��|�j�d�}tj|d�}tj|�}|�jt|jt|j��dS�)zfUnlike most tree builders, HTMLParserTreeBuilder and will be restored after pickling. z foo��N)Zsoup�pickle�dumps�loadsZ assertTrue� isinstanceZbuilder�type)r��ZtreeZdumpedZloadedr ��r ��r ��test_builder_is_pickled��s�� z6HTMLParserTreeBuilderSmokeTest.test_builder_is_pickledc��C��s��|�j�dd��|�j�dd��d�S�)Nz

z

z

��)�assertSoupEquals)r��r ��r ��r ��)test_redundant_empty_element_closing_tags!��s��zHHTMLParserTreeBuilderSmokeTest.test_redundant_empty_element_closing_tagsc��C��s��|�j�dd��d�S�)Nz foo &# barzfoo &# bar)r��)r��r ��r ��r ��test_empty_element%��s��z1HTMLParserTreeBuilderSmokeTest.test_empty_elementN) �__name__� __module__�__qualname__�propertyr��r��r ��r��r��r��r ��r ��r ��r ��r�� s�� r��c��@��s��e�Zd�Zdd��ZdS�)�TestHTMLParserSubclassc��C��s��t��}|jd��dS�)zlVerify that our HTMLParser subclass implements error() in a way that doesn't cause a crash. zdon't crashN)r��error)r��parserr ��r ��r �� test_error,��s��z!TestHTMLParserSubclass.test_errorN)r��r��r��r ��r ��r ��r ��r ��r��+��s��r��) �__doc__Zpdbr��r��Zbs4.testingr��r��Zbs4.builderr��Zbs4.builder._htmlparserr��r��r��r ��r ��r ��r ��s��!PK��je[��ٺ��0��tests/__pycache__/test_lxml.cpython-36.opt-1.pycnu��[��3 6]U ��@��s��d�Z�ddlZddlZyddlZdZejjZW�n*�ek rV�Z �zdZdZW�Y�ddZ [ X�nX�erlddl mZmZ�ddl mZmZ�ddlmZmZmZ�ddlmZ�dd lmZ�dd lmZmZmZmZ�ee�d�G�dd ��d ee��Zee�d�G�dd��dee��ZdS�)z@Tests to ensure that the lxml tree builder generates good trees.��NTF)�LXMLTreeBuilder�LXMLTreeBuilderForXML)� BeautifulSoup�BeautifulStoneSoup)�Comment�Doctype�SoupStrainer)�skipIf)�test_htmlparser)�HTMLTreeBuilderSmokeTest�XMLTreeBuilderSmokeTest�SoupTestr ��z;lxml seems not to be present, not testing its tree builder.c��@��sP��e�Zd�ZdZedd��Zdd��Zdd��Zee �p6e dk�d�d d��Zdd��ZdS�)�LXMLTreeBuilderSmokeTestz!See ``HTMLTreeBuilderSmokeTest``.c��C��s��t��S�)N)r��)�self��r��/usr/lib/python3.6/test_lxml.py�default_builder%��s��z(LXMLTreeBuilderSmokeTest.default_builderc��C��s(��|�j�dd��|�j�dd��|�j�dd��d�S�)Nz
foo�bar
z
foobar
z
foo�bar
z
foo�bar
)ZassertSoupEquals)r��r��r��r��test_out_of_range_entity)��s��z1LXMLTreeBuilderSmokeTest.test_out_of_range_entityc��C��s��d�S�)Nr��)r��r��r��r��*test_entities_in_foreign_document_encoding1��s��zCLXMLTreeBuilderSmokeTest.test_entities_in_foreign_document_encoding��r��z@Skipping doctype test for old version of lxml to avoid segfault.c��C��s(��|�j�d�}|jd�}|�jd|j��d�S�)Nz r��)�soup�contents�assertEqual�strip)r��r��Zdoctyper��r��r��test_empty_doctype:��s�� z+LXMLTreeBuilderSmokeTest.test_empty_doctypec��C��sN��t�jdd��}td�}W�d�Q�R�X�|�jdt|j��|�jdt|d�j�k��d�S�)NT)�recordzzz&BeautifulStoneSoup class is deprecatedr��)�warnings�catch_warningsr��r��str�bZ assertTrue�message)r��wr��r��r��r��%test_beautifulstonesoup_is_xml_parserB��s��z>LXMLTreeBuilderSmokeTest.test_beautifulstonesoup_is_xml_parserN)r��r��r��r��) �__name__� __module__�__qualname__�__doc__�propertyr��r��r��r ��LXML_PRESENT�LXML_VERSIONr��r%��r��r��r��r��r��s�� r��z?lxml seems not to be present, not testing its XML tree builder.c��@��s��e�Zd�ZdZedd��ZdS�)�LXMLXMLTreeBuilderSmokeTestz!See ``HTMLTreeBuilderSmokeTest``.c��C��s��t��S�)N)r��)r��r��r��r��r��P��s��z+LXMLXMLTreeBuilderSmokeTest.default_builderN)r&��r'��r(��r)��r*��r��r��r��r��r��r-��J��s��r-��)r��)r)��rer��Z lxml.etreeZlxmlr+��Zetreer,��ImportError�eZbs4.builderr��r��Zbs4r��r��Zbs4.elementr��r��r��Zbs4.testingr ��Z bs4.testsr ��r��r��r ��r��r-��r��r��r��r��s0�� (PK��je[� ,k��k��6��tests/__pycache__/test_builder_registry.cpython-36.pycnu��[��3 c�T��@��s��d�Z�ddlZddlZddlmZ�ddlmZmZm Z �yddlm Z �dZW�n�ek r`��dZY�nX�yddlm Z mZ�dZW�n�ek r��dZY�nX�G�d d ��d ej�ZG�dd��dej�ZdS�) zTests of the builder registry.��N)� BeautifulSoup)�builder_registry�HTMLParserTreeBuilder�TreeBuilderRegistry)�HTML5TreeBuilderTF)�LXMLTreeBuilderForXML�LXMLTreeBuilderc��@��s0��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd S�)�BuiltInRegistryTestz@Test the built-in registry with the default builders registered.c��C��s`��t�r|�jtjdd�t��t�r0|�jtjdd�t��|�jtjdd�t��tr\|�jtjdd�t��d�S�)N�fast�htmlZ permissive�xml�strict�html5lib) �LXML_PRESENT�assertEqual�registry�lookupr��r��r��HTML5LIB_PRESENTr��)�self��r��+/usr/lib/python3.6/test_builder_registry.py�test_combination ��s��z$BuiltInRegistryTest.test_combinationc��C��sj��t�r*|�jtjd�t��|�jtjd�t��n<|�jtjd�d��trT|�jtjd�t��n|�jtjd�t��d�S�)Nr��r��) r��r��r��r��r��r��r��r��r��)r��r��r��r��test_lookup_by_markup_type.��s��z.BuiltInRegistryTest.test_lookup_by_markup_typec��C��sX��t�r,|�jtjdd�t��|�jtjdd�t��trB|�jtjd�t��|�jtjd�t��d�S�)NZlxmlr��r��r��zhtml.parser) r��r��r��r��r��r��r��r��r��)r��r��r��r��test_named_library9��s��z&BuiltInRegistryTest.test_named_libraryc�� C��sJ��t�jdd��"}tddd��tdddgd��W�d�Q�R�X�|�jttddd��d�S�)NT)�record��r��)�featuresr ��zno-such-feature)�warnings�catch_warningsr��ZassertRaises� ValueError)r��wr��r��r��*test_beautifulsoup_constructor_does_lookupF��s ��z>BuiltInRegistryTest.test_beautifulsoup_constructor_does_lookupN)�__name__� __module__�__qualname__�__doc__r��r��r��r!��r��r��r��r��r ��s �� r ��c��@��sX��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��ZdS�)�RegistryTestz.Test the TreeBuilderRegistry class in general.c��C��s��t��|�_d�S�)N)r��r��)r��r��r��r��setUpY��s��zRegistryTest.setUpc��G��s,��t�ddj|��tfd|i�}|�jj|��|S�)NZBuilder_�_r��)�type�join�objectr��register)r��Zfeature_list�clsr��r��r��builder_for_features\��s��z!RegistryTest.builder_for_featuresc��C��s2��|�j��}|�j|�jjd�d��|�j|�jj��|��d�S�)N�foo)r.��r��r��r��)r��builderr��r��r��test_register_with_no_featuresc��s��z+RegistryTest.test_register_with_no_featuresc��C��s8��|�j�dd�}|�j|�jjd�|��|�j|�jjd�|��d�S�)Nr/��bar)r.��r��r��r��)r��r0��r��r��r��0test_register_with_features_makes_lookup_succeedn��s��z=RegistryTest.test_register_with_features_makes_lookup_succeedc��C��s$��|�j�dd�}|�j|�jjd�d��d�S�)Nr/��r2��baz)r.��r��r��r��)r��r0��r��r��r��4test_lookup_fails_when_no_builder_implements_features��s��zARegistryTest.test_lookup_fails_when_no_builder_implements_featurec��C��s*��|�j�d�}|�j�d�}|�j|�jj��|��d�S�)Nr/��r2��)r.��r��r��r��)r��builder1�builder2r��r��r��Ctest_lookup_gets_most_recent_registration_when_no_feature_specifiedw��s�� zPRegistryTest.test_lookup_gets_most_recent_registration_when_no_feature_specifiedc��C��s��|�j�|�jj��d��d�S�)N)r��r��r��)r��r��r��r��2test_lookup_fails_when_no_tree_builders_registered|��s��z?RegistryTest.test_lookup_fails_when_no_tree_builders_registeredc��C��sv��|�j�d�}|�j�d�}|�j�ddd�}|�j�ddd�}|�j�d�}|�j�d�}|�j|�jjdd�|��|�j|�jjddd�|��d�S�)Nr/��r2��r4��Zquux)r.��r��r��r��)r��Zhas_oneZ has_the_otherZhas_both_earlyZ has_both_lateZ lacks_oner��r��r��s �� 9PK��je[��)��tests/__pycache__/__init__.cpython-36.pycnu��[��3 ��CN��@��s��d�Z�dS�)zThe beautifulsoup tests.N)�__doc__��r��r��/usr/lib/python3.6/__init__.py��s��PK��je[��/��tests/__pycache__/__init__.cpython-36.opt-1.pycnu��[��3 ��CN��@��s��d�Z�dS�)zThe beautifulsoup tests.N)�__doc__��r��r��/usr/lib/python3.6/__init__.py��s��PK��je[� ,k��k��<��tests/__pycache__/test_builder_registry.cpython-36.opt-1.pycnu��[��3 c�T��@��s��d�Z�ddlZddlZddlmZ�ddlmZmZm Z �yddlm Z �dZW�n�ek r`��dZY�nX�yddlm Z mZ�dZW�n�ek r��dZY�nX�G�d d ��d ej�ZG�dd��dej�ZdS�) zTests of the builder registry.��N)� BeautifulSoup)�builder_registry�HTMLParserTreeBuilder�TreeBuilderRegistry)�HTML5TreeBuilderTF)�LXMLTreeBuilderForXML�LXMLTreeBuilderc��@��s0��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd S�)�BuiltInRegistryTestz@Test the built-in registry with the default builders registered.c��C��s`��t�r|�jtjdd�t��t�r0|�jtjdd�t��|�jtjdd�t��tr\|�jtjdd�t��d�S�)N�fast�htmlZ permissive�xml�strict�html5lib) �LXML_PRESENT�assertEqual�registry�lookupr��r��r��HTML5LIB_PRESENTr��)�self��r��+/usr/lib/python3.6/test_builder_registry.py�test_combination ��s��z$BuiltInRegistryTest.test_combinationc��C��sj��t�r*|�jtjd�t��|�jtjd�t��n<|�jtjd�d��trT|�jtjd�t��n|�jtjd�t��d�S�)Nr��r��) r��r��r��r��r��r��r��r��r��)r��r��r��r��test_lookup_by_markup_type.��s��z.BuiltInRegistryTest.test_lookup_by_markup_typec��C��sX��t�r,|�jtjdd�t��|�jtjdd�t��trB|�jtjd�t��|�jtjd�t��d�S�)NZlxmlr��r��r��zhtml.parser) r��r��r��r��r��r��r��r��r��)r��r��r��r��test_named_library9��s��z&BuiltInRegistryTest.test_named_libraryc�� C��sJ��t�jdd��"}tddd��tdddgd��W�d�Q�R�X�|�jttddd��d�S�)NT)�record��r��)�featuresr ��zno-such-feature)�warnings�catch_warningsr��ZassertRaises� ValueError)r��wr��r��r��*test_beautifulsoup_constructor_does_lookupF��s ��z>BuiltInRegistryTest.test_beautifulsoup_constructor_does_lookupN)�__name__� __module__�__qualname__�__doc__r��r��r��r!��r��r��r��r��r ��s �� r ��c��@��sX��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��ZdS�)�RegistryTestz.Test the TreeBuilderRegistry class in general.c��C��s��t��|�_d�S�)N)r��r��)r��r��r��r��setUpY��s��zRegistryTest.setUpc��G��s,��t�ddj|��tfd|i�}|�jj|��|S�)NZBuilder_�_r��)�type�join�objectr��register)r��Zfeature_list�clsr��r��r��builder_for_features\��s��z!RegistryTest.builder_for_featuresc��C��s2��|�j��}|�j|�jjd�d��|�j|�jj��|��d�S�)N�foo)r.��r��r��r��)r��builderr��r��r��test_register_with_no_featuresc��s��z+RegistryTest.test_register_with_no_featuresc��C��s8��|�j�dd�}|�j|�jjd�|��|�j|�jjd�|��d�S�)Nr/��bar)r.��r��r��r��)r��r0��r��r��r��0test_register_with_features_makes_lookup_succeedn��s��z=RegistryTest.test_register_with_features_makes_lookup_succeedc��C��s$��|�j�dd�}|�j|�jjd�d��d�S�)Nr/��r2��baz)r.��r��r��r��)r��r0��r��r��r��4test_lookup_fails_when_no_builder_implements_features��s��zARegistryTest.test_lookup_fails_when_no_builder_implements_featurec��C��s*��|�j�d�}|�j�d�}|�j|�jj��|��d�S�)Nr/��r2��)r.��r��r��r��)r��builder1�builder2r��r��r��Ctest_lookup_gets_most_recent_registration_when_no_feature_specifiedw��s�� zPRegistryTest.test_lookup_gets_most_recent_registration_when_no_feature_specifiedc��C��s��|�j�|�jj��d��d�S�)N)r��r��r��)r��r��r��r��2test_lookup_fails_when_no_tree_builders_registered|��s��z?RegistryTest.test_lookup_fails_when_no_tree_builders_registeredc��C��sv��|�j�d�}|�j�d�}|�j�ddd�}|�j�ddd�}|�j�d�}|�j�d�}|�j|�jjdd�|��|�j|�jjddd�|��d�S�)Nr/��r2��r4��Zquux)r.��r��r��r��)r��Zhas_oneZ has_the_otherZhas_both_earlyZ has_both_lateZ lacks_oner��r��r��s �� 9PK��je[�)p�W��W�0��tests/__pycache__/test_tree.cpython-36.opt-1.pycnu��[��3 6]�8��@��s��d�Z�ddlmZ�ddlZddlZddlZddlZddlmZ�ddl m Z mZ�ddlm Z mZmZmZmZmZmZmZ�ddlmZmZ�e jd�dk Ze jd �dk ZG�d d��de�ZG�dd ��d e�ZG�dd��de�ZG�dd��de�ZG�dd��de�ZG�dd��de�Z G�dd��de�Z!G�dd��de�Z"G�dd��de�Z#G�dd��de#�Z$G�dd��de#�Z%G�d d!��d!e�Z&G�d"d#��d#e&�Z'G�d$d%��d%e&�Z(G�d&d'��d'e�Z)G�d(d)��d)e�Z*G�d*d+��d+e�Z+G�d,d-��d-e�Z,G�d.d/��d/e�Z-G�d0d1��d1e�Z.G�d2d3��d3e�Z/G�d4d5��d5e�Z0G�d6d7��d7e�Z1dS�)8a8��Tests for Beautiful Soup's tree traversal methods. The tree traversal methods are the main advantage of using Beautiful Soup over just using a parser. Different parsers will build different Beautiful Soup trees given the same markup, but all Beautiful Soup trees can be traversed with the methods tested here. ��)� set_traceN)� BeautifulSoup)�builder_registry�HTMLParserTreeBuilder)�PY3K�CData�Comment�Declaration�Doctype�NavigableString�SoupStrainer�Tag)�SoupTest�skipIfZxmlZlxmlc��@��s��e�Zd�Zdd��Zdd��ZdS�)�TreeTestc��C��s��|�j�dd��|D��|��dS�)z�Make sure that the given tags have the correct text. This is used in tests that define a bunch of tags, each containing a single string, and then select certain strings by some mechanism. c��S��s��g�|�] }|j��qS��)�string)�.0�tagr��r��/usr/lib/python3.6/test_tree.py� 2��s��z*TreeTest.assertSelects..N)�assertEqual)�self�tags�should_matchr��r��r�� assertSelects+��s��zTreeTest.assertSelectsc��C��s��|�j�dd��|D��|��dS�)z�Make sure that the given tags have the correct IDs. This is used in tests that define a bunch of tags, each containing a single string, and then select certain strings by some mechanism. c��S��s��g�|�]}|d��qS�)�idr��)r��r��r��r��r��r��;��s��z-TreeTest.assertSelectsIDs..N)r��)r��r��r��r��r��r��assertSelectsIDs4��s��zTreeTest.assertSelectsIDsN)�__name__� __module__�__qualname__r��r��r��r��r��r��r��)��s�� r��c��@��s8��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��ZdS�) �TestFindz�Basic tests of the find() method. find() just calls find_all() with limit=1, so it's not tested all that thouroughly here. c��C��s"��|�j�d�}|�j|jd�jd��d�S�)Nz 1234�b�2)�soupr��findr��)r��r$��r��r��r�� test_find_tagE��s�� zTestFind.test_find_tagc��C��s"��|�j�d�}|�j|jdd�d��d�S�)Nu��
Räksmörgås
u ��Räksmörgås)r��)r$��r��r%��)r��r$��r��r��r��test_unicode_text_findI��s�� zTestFind.test_unicode_text_findc��C��s,��|�j�d�}t|��|�jd|jdd�j��d�S�)Nu&��
here it is
z here it isu ��Räksmörgås)r��)r$��strr��r%��text)r��r$��r��r��r��test_unicode_attribute_findM��s�� z$TestFind.test_unicode_attribute_findc��C��s"��|�j�d�}|�jdt|j��dS�)z)Test an optimization that finds all tags.zfoobar��N)r$��r��len�find_all)r��r$��r��r��r��test_find_everythingS��s�� zTestFind.test_find_everythingc��C��s$��|�j�d�}|�jdt|jd��dS�)z;Test an optimization that finds all tags with a given name.zfoobarbazr+��aN)r$��r��r,��r-��)r��r$��r��r��r��test_find_everything_with_nameX��s�� z'TestFind.test_find_everything_with_nameN) r��r��r ��__doc__r&��r'��r*��r.��r0��r��r��r��r��r!��>��s��r!��c��@��s8��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��ZdS�) �TestFindAllz%Basic tests of the find_all() method.c��C��s��|�j�d�}|�j|jdd�dg��|�j|jdd�dg��|�j|jddgd�ddg��|�j|jtjd�d�dddg��|�j|jdd�dddg��d S�) z'You can search the tree for text nodes.u��Foobar»�bar)r��)r)��Fooz.*��»TN)r$��r��r-��re�compile)r��r$��r��r��r��test_find_all_text_nodes`��s�� z$TestFindAll.test_find_all_text_nodesc��C��s��|�j�d�}|�j|jddd�dddg��|�j|jddd�dg��|�j|jdd d�dddd dg��|�j|jddd�dddd dg��d S�)z7You can limit the number of items returned by find_all.z(1 2 3 4 5r/��)�limit�1r#��3�� 4�5r��N)r$��r��r-��)r��r$��r��r��r��test_find_all_limitp��s�� zTestFindAll.test_find_all_limitc��C��s:��|�j�d�}|�j|ddd�dg��|�j|jdd�dg��d�S�) Nz!123r/��r=��)r:��r;��foo)r��r<��)r$��r��r"��)r��r$��r��r��r��%test_calling_a_tag_is_calling_findall|��s�� z1TestFindAll.test_calling_a_tag_is_calling_findallc��C��s.��|�j�d�}g�}|j|��|�jg�|j|��d�S�)Nz)r$��appendr��r-��)r��r$��lr��r��r��Ttest_find_all_with_self_referential_data_structure_does_not_cause_infinite_recursion��s�� z`TestFindAll.test_find_all_with_self_referential_data_structure_does_not_cause_infinite_recursionc��C��s^��|�j�d�}|jd�}|�jt|d��|jd�}|�jt|d��|jdd�}|�jt|d��dS�)z%All find_all calls return a ResultSetzr/��sourceTrB��)r)��N)r$��r-�� assertTrue�hasattr)r��r$��resultr��r��r��test_find_all_resultset��s�� z#TestFindAll.test_find_all_resultsetN) r��r��r ��r1��r8��rA��rC��rF��rK��r��r��r��r��r2��]��s�� r2��c��@��s��e�Zd�Zdd��ZdS�)�TestFindAllBasicNamespacesc��C��s<��|�j�d�}|�jd|jd�j��|�jd|jddid�j��d�S�)Nz04r?��zmathml:msqrtr/��zsvg:fillZred)�attrs)r$��r��r%��r��name)r��r$��r��r��r��test_find_by_namespaced_name��s�� z7TestFindAllBasicNamespaces.test_find_by_namespaced_nameN)r��r��r ��rO��r��r��r��r��rL��s��rL��c��sp��e�Zd�ZdZ��fdd�Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Zdd��Z dd��Z��ZS�)�TestFindAllByNamez&Test ways of finding tags by tag name.c��s��t�t|��j��|�jd�|�_d�S�)Nz�First tag. Second tag. Third Nested tag. tag.)�superr��setUpr$��tree)r��)� __class__r��r��rR��s��zTestFindAllByName.setUpc��C��s��|�j�|�jjd�ddg��d�S�)Nr/��z First tag.zNested tag.)r��rS��r-��)r��r��r��r��test_find_all_by_tag_name��s��z+TestFindAllByName.test_find_all_by_tag_namec��C��s\��|�j�|�jjddd�dg��|�j�|�jjddd�ddg��|�j�|�jjdtjd�d�ddg��d�S�)Nr/��z First tag.)r)��TzNested tag.r��)r��rS��r-��r6��r7��)r��r��r��r��test_find_all_by_name_and_text��s��z0TestFindAllByName.test_find_all_by_name_and_textc��C��s��|�j�|�jjjd�dg��d�S�)Nr/��zNested tag.)r��rS��cr-��)r��r��r��r��!test_find_all_on_non_root_element��s��z3TestFindAllByName.test_find_all_on_non_root_elementc��C��s��|�j�|�jd�ddg��d�S�)Nr/��z First tag.zNested tag.)r��rS��)r��r��r��r��%test_calling_element_invokes_find_all��s��z7TestFindAllByName.test_calling_element_invokes_find_allc��C��s ��|�j�|�jjtd��ddg��d�S�)Nr/��z First tag.zNested tag.)r��rS��r-��r��)r��r��r��r��test_find_all_by_tag_strainer��s��z/TestFindAllByName.test_find_all_by_tag_strainerc��C��s"��|�j�|�jjddg�dddg��d�S�)Nr/��r"��z First tag.zSecond tag.zNested tag.)r��rS��r-��)r��r��r��r��test_find_all_by_tag_names��s��z,TestFindAllByName.test_find_all_by_tag_namesc��C��s$��|�j�|�jjddd��dddg��d�S�)NT)r/��r"��z First tag.zSecond tag.zNested tag.)r��rS��r-��)r��r��r��r��test_find_all_by_tag_dict��s��z+TestFindAllByName.test_find_all_by_tag_dictc��C��s$��|�j�|�jjtjd��dddg��d�S�)Nz^[ab]$z First tag.zSecond tag.zNested tag.)r��rS��r-��r6��r7��)r��r��r��r��test_find_all_by_tag_re��s��z)TestFindAllByName.test_find_all_by_tag_rec��C��s,��dd��}|�j�d�}|�j|j|�ddg��d�S�)Nc��S��s��|�j�|�jd�kS�)Nr��)rN��get)r��r��r��r��id_matches_name��s��zRTestFindAllByName.test_find_all_with_tags_matching_method..id_matches_namez�Match 1. Does not match. Match 2.zMatch 1.zMatch 2.)r$��r��r-��)r��r_��rS��r��r��r��'test_find_all_with_tags_matching_method��s ��z9TestFindAllByName.test_find_all_with_tags_matching_methodc��C��sx��|�j�d�}|jdd�}|jdtjd��}|jdddg�\}}|�jd|j��|�jd|j��|�jd|j��|�jd|j��d�S�)NzH
1
2
3
�divza dza br<��r;��)r$��r%��r6��r7��r-��r��r��)r��r$��Zr1Zr2Zr3Zr4r��r��r��%test_find_with_multi_valued_attribute��s��z7TestFindAllByName.test_find_with_multi_valued_attribute)r��r��r ��r1��rR��rU��rV��rX��rY��rZ��r[��r\��r]��r`��rb�� __classcell__r��r��)rT��r��rP��s�� rP��c��@��s��e�Zd�Zdd��Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��Zdd��Zdd ��Zd!S�)"�TestFindAllByAttributec��C��s&��|�j�d�}|�j|jdd�ddg��d�S�)Nz� Matching a. Non-matching Matching b.a. �first)r��zMatching a.zMatching b.)r$��r��r-��)r��rS��r��r��r��test_find_all_by_attribute_name��s��z6TestFindAllByAttribute.test_find_all_by_attribute_namec��C��st��dj�d�}dj�d�}|�j|�}|�j|jg|j|d��|�j|jg|j|jd�d��|�j|jg|j|dgd��d�S�)Nu��םולש�utf8u��)�titlezsomething else)�encoder$��r��r/��r-��decode)r��Zpeace�datar$��r��r��r��%test_find_all_by_utf8_attribute_value��s�� zName match. Class match. Non-match. A tag called 'name1'. Zname1)rN��zA tag called 'name1'.rN��)rM��zName match.�classZclass2zClass match.)r$��r��r-��)r��rS��r��r��r��test_find_all_by_attribute_dict��s��z6TestFindAllByAttribute.test_find_all_by_attribute_dictc��C��s��|�j�d�}|�j|jddd�dg��|�j|jddd�dg��|�j|jdd d�dg��|�j|jdd�dg��|�j|jdd �ddg��|�j|jdd�dg��|�j|jdd �dg��d�S�)Nz� Class 1. Class 2. Class 1. Class 3 and 4. r/��r;��)�class_zClass 1.rW��r<��zClass 3 and 4.r?��)rM��)r$��r��r-��)r��rS��r��r��r��test_find_all_by_class��s��z-TestFindAllByAttribute.test_find_all_by_classc��C��st��|�j�d�}|jdtjd�d�}|�j|dg��|jdtjd�d�}|�j|dg��|jdtjd�d�}|�j|dg��d�S�)Nz#Found itZgar�o)ro��zFound itr/��zo b)r$��r-��r6��r7��r��)r��rS��fr��r��r��0test_find_by_class_when_multiple_classes_present-��s�� zGTestFindAllByAttribute.test_find_by_class_when_multiple_classes_presentc��C��sd��|�j�d�}|�j|jdtjd��dg��dd��}|�j|jd|�g��dd��}|�j|jd|�dg��d�S�) NzFound itr/��ZbazFound itc��S��s��t�|��dkS�)Nr9��)r,��)�valuer��r��r��big_attribute_value@��s��znTestFindAllByAttribute.test_find_all_with_non_dictionary_for_attrs_finds_by_class..big_attribute_valuec��S��s��t�|��dkS�)Nr9��)r,��)rt��r��r��r��small_attribute_valueE��s��zpTestFindAllByAttribute.test_find_all_with_non_dictionary_for_attrs_finds_by_class..small_attribute_value)r$��r��r-��r6��r7��)r��r$��ru��rv��r��r��r��:test_find_all_with_non_dictionary_for_attrs_finds_by_class;��s�� zQTestFindAllByAttribute.test_find_all_with_non_dictionary_for_attrs_finds_by_classc��C��s��|�j�d�}|jd�\}}|�j||g|jdd��|�j|g|jdd��|�j|g|jddd��|�j|g|jdd��|�jg�|jdd��d�S�)Nz*r/��rB��r3��zfoo bar)ro��zbar foo)r$��r-��r��)r��r$��r/��Za2r��r��r��:test_find_all_with_string_for_attrs_finds_multiple_classesK��s�� zQTestFindAllByAttribute.test_find_all_with_string_for_attrs_finds_multiple_classesc��C��s0��|�j�d�}tddid�}|�j|j|�dg��d�S�)Nzi Match. Non-match.r��re��)rM��zMatch.)r$��r��r��r-��)r��rS��strainerr��r��r��'test_find_all_by_attribute_soupstrainerW��s��z>TestFindAllByAttribute.test_find_all_by_attribute_soupstrainerc��C��s&��|�j�d�}|�j|jdd�d�dg��d�S�)Nz�ID present. No ID present. ID is empty.r/��)r��zNo ID present.)r$��r��r-��)r��rS��r��r��r��$test_find_all_with_missing_attribute_��s��z;TestFindAllByAttribute.test_find_all_with_missing_attributec��C��s&��|�j�d�}|�j|jdd�ddg��d�S�)Nz�ID present. No ID present. ID is empty.T)r��zID present.zID is empty.)r$��r��r-��)r��rS��r��r��r��$test_find_all_with_defined_attributeg��s��z;TestFindAllByAttribute.test_find_all_with_defined_attributec��C��s>��|�j�d�}ddg}|�j|jdd�|��|�j|jdd�|��d�S�)Nz[Unquoted attribute. Quoted attribute.zUnquoted attribute.zQuoted attribute.r=��)r��r;��)r$��r��r-��)r��rS��Zexpectedr��r��r��$test_find_all_with_numeric_attributep��s ��z;TestFindAllByAttribute.test_find_all_with_numeric_attributec��C��s,��|�j�d�}|�j|jdddgd�ddg��d�S�)Nz�1 2 3 No ID.r;��r<��r?��)r��)r$��r��r-��)r��rS��r��r��r��(test_find_all_with_list_attribute_valuesy��s��z?TestFindAllByAttribute.test_find_all_with_list_attribute_valuesc��C��s,��|�j�d�}|�j|jtjd�d�ddg��d�S�)Nz�One a. Two as. Mixed as and bs. One b. No ID.z^a+$)r��zOne a.zTwo as.)r$��r��r-��r6��r7��)r��rS��r��r��r��5test_find_all_with_regular_expression_attribute_value��s��zLTestFindAllByAttribute.test_find_all_with_regular_expression_attribute_valuec��C��sX��|�j�d�}|j}|�j|g|jddd��|�jg�|jddd��|�jg�|jddd��d�S�)Nzfoobarfoor/��rB��)r)��r3��)r$��r/��r��r-��)r��r$��r/��r��r��r��'test_find_by_name_and_containing_string��s �� z>TestFindAllByAttribute.test_find_by_name_and_containing_stringc��C��s*��|�j�d�}|�j|jd�|jddd��d�S�)Nz"foo foor/��rB��)r)��)r$��r��r-��)r��r$��r��r��r��=test_find_by_name_and_containing_string_when_string_is_buried��s�� zTTestFindAllByAttribute.test_find_by_name_and_containing_string_when_string_is_buriedc��C��sB��|�j�d�}|j}|�j|g|jddd��|�jg�|jddd��d�S�)Nz"foofoor+��rB��)r��r)��r=��r3��)r$��r/��r��r-��)r��r$��r/��r��r��r��,test_find_by_attribute_and_containing_string��s�� zCTestFindAllByAttribute.test_find_by_attribute_and_containing_stringN)r��r��r ��rf��rl��rn��rp��rs��rw��rx��rz��r{��r|��r}��r~��r��r��r��r��r��r��r��r��rd��s �� rd��c��@��s��e�Zd�ZdZdd��ZdS�)� TestIndexzTest Tag.indexc��C��sN��|�j�d�}|j}x(t|j�D�]\}}|�j||j|��qW�|�jt|jd��d�S�)Nah��
Identical Not identical Identical Identical with child Also not identical Identical with child
r=��)r$��ra�� enumerate�contentsr��index�assertRaises� ValueError)r��rS��ra��i�elementr��r��r�� test_index��s��zTestIndex.test_indexN)r��r��r ��r1��r��r��r��r��r��r��s��r��c��s`��e�Zd�ZdZ��fdd�Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Z��Z S�)�TestParentOperationsz;Test navigation and searching through an element's parents.c��s(��t�t|��j��|�jd�|�_|�jj|�_d�S�)Na1��

Start here

)rQ��r��rR��r$��rS��r"��start)r��)rT��r��r��rR��s��zTestParentOperations.setUpc��C��sF��|�j�|�jjd�d��|�j�|�jjjd�d��|�j�|�jjjjd�d��d�S�)Nr��bottom�middle�top)r��r��parent)r��r��r��r��test_parent��s��z TestParentOperations.test_parentc��C��s ��|�j�jd�}|�j|j|�j��d�S�)Nr��)rS��r��r��r��)r��Ztop_tagr��r��r��%test_parent_of_top_tag_is_soup_object��s��z:TestParentOperations.test_parent_of_top_tag_is_soup_objectc��C��s��|�j�d�|�jj��d�S�)N)r��rS��r��)r��r��r��r��test_soup_object_has_no_parent��s��z3TestParentOperations.test_soup_object_has_no_parentc��C��s8��|�j�|�jjd�dddg��|�j�|�jjddd�dg��d�S�)N�ulr��r��r��)r��)r��r��Zfind_parents)r��r��r��r��test_find_parents��s��z&TestParentOperations.test_find_parentsc��C��s8��|�j�|�jjd�d�d��|�j�|�jjddd�d�d��d�S�)Nr��r��r��r��)r��)r��r��find_parent)r��r��r��r��test_find_parent��s��z%TestParentOperations.test_find_parentc��C��s"��|�j�jdd�}|�j|jjd��d�S�)Nz Start here)r)��r"��)rS��r%��r��r��rN��)r��r)��r��r��r��test_parent_of_text_element��s��z0TestParentOperations.test_parent_of_text_elementc��C��s(��|�j�jdd�}|�j|jd�d�d��d�S�)Nz Start here)r)��r��r��r��)rS��r%��r��r��)r��r)��r��r��r��test_text_element_find_parent��s��z2TestParentOperations.test_text_element_find_parentc��C��s(��dd��|�j�jD��}|�j|dddg��d�S�)Nc��S��s&��g�|�]}|d�k rd|j�kr|d��qS�)Nr��)rM��)r��r��r��r��r��r��s��z>TestParentOperations.test_parent_generator..r��r��r��)r��parentsr��)r��r��r��r��r��test_parent_generator��s��z*TestParentOperations.test_parent_generator)r��r��r ��r1��rR��r��r��r��r��r��r��r��r��rc��r��r��)rT��r��r��s��r��c��s��e�Zd�Z��fdd�Z��ZS�)� ProximityTestc��s��t�t|��j��|�jd�|�_d�S�)NzgOneTwoThree)rQ��r��rR��r$��rS��)r��)rT��r��r��rR��s��zProximityTest.setUp)r��r��r ��rR��rc��r��r��)rT��r��r��s��r��c��sT��e�Zd�Z��fdd�Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z dd��Z ��ZS�)�TestNextOperationsc��s��t�t|��j��|�jj|�_d�S�)N)rQ��r��rR��rS��r"��r��)r��)rT��r��r��rR��s��zTestNextOperations.setUpc��C��s*��|�j�|�jjd��|�j�|�jjjd�d��d�S�)N�Oner��r#��)r��r��next_element)r��r��r��r�� test_next��s��zTestNextOperations.test_nextc��C��s ��|�j�jdd�}|�j|jd��d�S�)N�Three)r)��)rS��r%��r��r��)r��Zlastr��r��r��test_next_of_last_item_is_none��s��z1TestNextOperations.test_next_of_last_item_is_nonec��C��s��|�j�|�jjd��d�S�)N)r��rS��r��)r��r��r��r��test_next_of_root_is_none��s��z,TestNextOperations.test_next_of_root_is_nonec��C��sB��|�j�|�jjd�ddg��|�jjdd��|�j�|�jjdd�dg��d�S�)Nr"��Twor��r9��)r��)r��r�� find_all_next)r��r��r��r��test_find_all_next��s��z%TestNextOperations.test_find_all_nextc��C��s2��|�j�|�jjd�d�d��|�j�|�jjdd�d��d�S�)Nr"��r��r#��r��)r)��)r��r�� find_next)r��r��r��r��test_find_next ��s��z!TestNextOperations.test_find_nextc��C��s<��|�j�jdd�}|�j|jd�jd��|�j|jd�ddg��d�S�)Nr��)r)��r"��r��r��)rS��r%��r��r��r��r��r��)r��r)��r��r��r��test_find_next_for_text_element��s��z2TestNextOperations.test_find_next_for_text_elementc��C��sF��|�j�jdd�}dd��|jD��}|\}}|�j|d�d��|�j|d��d�S�)Nr��)r)��c��S��s��g�|�]}|�qS�r��r��)r��noder��r��r��r��s��z:TestNextOperations.test_next_generator..r��r<��r��)rS��r%��Z next_elementsr��)r��r��Z successorsr��r��r��r��r��test_next_generator��s ��z&TestNextOperations.test_next_generator)r��r��r ��rR��r��r��r��r��r��r��r��rc��r��r��)rT��r��r��s��r��c��sT��e�Zd�Z��fdd�Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z dd��Z ��ZS�)�TestPreviousOperationsc��s"��t�t|��j��|�jjdd�|�_d�S�)Nr��)r)��)rQ��r��rR��rS��r%��end)r��)rT��r��r��rR��s��zTestPreviousOperations.setUpc��C��s*��|�j�|�jjd�d��|�j�|�jjjd��d�S�)Nr��r<��r��)r��r��previous_element)r��r��r��r�� test_previous!��s��z$TestPreviousOperations.test_previousc��C��s��|�j�jd�}|�j|jd��d�S�)N�html)rS��r%��r��r��)r��re��r��r��r��#test_previous_of_first_item_is_none%��s��z:TestPreviousOperations.test_previous_of_first_item_is_nonec��C��s��d�S�)Nr��)r��r��r��r��test_previous_of_root_is_none)��s��z4TestPreviousOperations.test_previous_of_root_is_nonec��C��s6��|�j�|�jjd�dddg��|�j�|�jjdd�dg��d�S�)Nr"��r��r��r��r=��)r��)r��r��find_all_previous)r��r��r��r��test_find_all_previous/��s��z-TestPreviousOperations.test_find_all_previousc��C��s2��|�j�|�jjd�d�d��|�j�|�jjdd�d��d�S�)Nr"��r��r<��r��)r)��)r��r�� find_previous)r��r��r��r��test_find_previous7��s��z)TestPreviousOperations.test_find_previousc��C��s>��|�j�jdd�}|�j|jd�jd��|�j|jd�dddg��d�S�)Nr��)r)��r"��r��r��)rS��r%��r��r��r��r��r��)r��r)��r��r��r��#test_find_previous_for_text_element;��s��z:TestPreviousOperations.test_find_previous_for_text_elementc��C��sh��|�j�jdd�}dd��|jD��}|\}}}}|�j|d�d��|�j|jd��|�j|jd��|�j|jd ��d�S�) Nr��)r)��c��S��s��g�|�]}|�qS�r��r��)r��r��r��r��r��r��C��s��zBTestPreviousOperations.test_previous_generator..r��r;��body�headr��)rS��r%��Zprevious_elementsr��rN��)r��r��Zpredecessorsr"��r��r��r��r��r��r��test_previous_generatorA��s��z.TestPreviousOperations.test_previous_generator)r��r��r ��rR��r��r��r��r��r��r��r��rc��r��r��)rT��r��r��s��r��c��s��e�Zd�Z��fdd�Z��ZS�)�SiblingTestc��s4��t�t|��j��d}tjd�jd|�}|�j|�|�_d�S�)Na�� z\n\s*��)rQ��r��rR��r6��r7��subr$��rS��)r��markup)rT��r��r��rR��P��s��zSiblingTest.setUp)r��r��r ��rR��rc��r��r��)rT��r��r��N��s��r��c��sL��e�Zd�Z��fdd�Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z ��Z S�)�TestNextSiblingc��s"��t�t|��j��|�jjdd�|�_d�S�)Nr;��)r��)rQ��r��rR��rS��r%��r��)r��)rT��r��r��rR��f��s��zTestNextSibling.setUpc��C��s��|�j�|�jjd��d�S�)N)r��rS��next_sibling)r��r��r��r��!test_next_sibling_of_root_is_nonej��s��z1TestNextSibling.test_next_sibling_of_root_is_nonec��C��sB��|�j�|�jjd�d��|�j�|�jjjd�d��|�j�|�jjd�d��d�S�)Nr��r#��r<��z1.1)r��r��r��r��)r��r��r��r��test_next_siblingm��s��z!TestNextSibling.test_next_siblingc��C��sN��|�j�|�jjjd��|�jjdd�}|�j�|jd��|�jjdd�}|�j�|jd��d�S�)Nz1.1)r��r?��)r��rS��r��r��r%��)r��nested_spanZ last_spanr��r��r��test_next_sibling_may_not_existt��s ��z/TestNextSibling.test_next_sibling_may_not_existc��C��s��|�j�|�jjd�d�d��d�S�)N�spanr��r#��)r��r��find_next_sibling)r��r��r��r��test_find_next_sibling}��s��z&TestNextSibling.test_find_next_siblingc��C��s6��|�j�|�jjd�dddg��|�j�|�jjdd�dg��d�S�)Nr��r#��r<��r?��)r��)r��r��find_next_siblings)r��r��r��r��test_next_siblings��s��z"TestNextSibling.test_next_siblingsc��C��sv��|�j�d�}|jdd�}|�j|jjd��|�j|jjd��|�j|jd�dg��|�j|jdd�d��|�j|jdd�d��d�S�)NzFoobarbazr4��)r)��r"��bazr3��nonesuch)r$��r%��r��r��rN��r��r��r��)r��r$��r��r��r��r��"test_next_sibling_for_text_element��s�� z2TestNextSibling.test_next_sibling_for_text_element)r��r��r ��rR��r��r��r��r��r��r��rc��r��r��)rT��r��r��d��s�� r��c��sL��e�Zd�Z��fdd�Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z ��Z S�)�TestPreviousSiblingc��s"��t�t|��j��|�jjdd�|�_d�S�)Nr?��)r��)rQ��r��rR��rS��r%��r��)r��)rT��r��r��rR��s��zTestPreviousSibling.setUpc��C��s��|�j�|�jjd��d�S�)N)r��rS��previous_sibling)r��r��r��r��%test_previous_sibling_of_root_is_none��s��z9TestPreviousSibling.test_previous_sibling_of_root_is_nonec��C��sB��|�j�|�jjd�d��|�j�|�jjjd�d��|�j�|�jjd�d��d�S�)Nr��r<��r#��z3.1)r��r��r��r��)r��r��r��r��test_previous_sibling��s��z)TestPreviousSibling.test_previous_siblingc��C��sN��|�j�|�jjjd��|�jjdd�}|�j�|jd��|�jjdd�}|�j�|jd��d�S�)Nz1.1)r��r;��)r��rS��r��r��r%��)r��r��Z first_spanr��r��r��#test_previous_sibling_may_not_exist��s ��z7TestPreviousSibling.test_previous_sibling_may_not_existc��C��s��|�j�|�jjd�d�d��d�S�)Nr��r��r<��)r��r��find_previous_sibling)r��r��r��r��test_find_previous_sibling��s��z.TestPreviousSibling.test_find_previous_siblingc��C��s6��|�j�|�jjd�dddg��|�j�|�jjdd�dg��d�S�)Nr��r<��r#��r;��)r��)r��r��find_previous_siblings)r��r��r��r��test_previous_siblings��s��z*TestPreviousSibling.test_previous_siblingsc��C��sv��|�j�d�}|jdd�}|�j|jjd��|�j|jjd��|�j|jd�dg��|�j|jdd�d��|�j|jdd�d��d�S�)NzFoobarbazr��)r)��r"��r4��r3��r��)r$��r%��r��r��rN��r��r��r��)r��r$��r��r��r��r��&test_previous_sibling_for_text_element��s�� z:TestPreviousSibling.test_previous_sibling_for_text_element)r��r��r ��rR��r��r��r��r��r��r��rc��r��r��)rT��r��r��s�� r��c��@��s0��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd S�)�TestTagCreationz$Test the ability to create new tags.c��C��sd��|�j�d�}|jddddid�}|�jt|t��|�jd|j��|�jtddd�|j��|�jd�|j ��d�S�)Nr��rB��r��rN��za name)r3��rM��)r3��rN��) r$��new_tagrH�� isinstancer ��r��rN��dictrM��r��)r��r$��r��r��r��r��test_new_tag��s�� zTestTagCreation.test_new_tagc��C��s��t�rBtdd�}|jd�}|jd�}|�jd|j��|�jd|j��tdd�}|jd�}|jd�}|�jd|j��|�jd|j��d�S�) Nr��zlxml-xml�br�ps��
s��
zhtml.parsers��
)�XML_BUILDER_PRESENTr��r��r��ri��)r��Zxml_soupZxml_brZxml_pZ html_soupZhtml_brZhtml_pr��r��r��1test_tag_inherits_self_closing_rules_from_builder��s�� zATestTagCreation.test_tag_inherits_self_closing_rules_from_builderc��C��s4��|�j�d�}|jd�}|�jd|��|�jt|t��d�S�)Nr��rB��)r$�� new_stringr��rH��r��r��)r��r$��sr��r��r��'test_new_string_creates_navigablestring��s�� z7TestTagCreation.test_new_string_creates_navigablestringc��C��s6��|�j�d�}|jdt�}|�jd|��|�jt|t��d�S�)Nr��rB��)r$��r��r��r��rH��r��)r��r$��r��r��r��r��3test_new_string_can_create_navigablestring_subclass��s�� zCTestTagCreation.test_new_string_can_create_navigablestring_subclassN)r��r��r ��r1��r��r��r��r��r��r��r��r��r��s ��r��c��@��s<��e�Zd�Zdd��Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��Zdd��Zdd ��Zd!d"��Zd#d$��Zd%d&��Zd'd(��Zd)d*��Zd+d,��Zd-d.��Zd/d0��Zd1d2��Zd3d4��Zd5d6��Zd7d8��Zd9d:��Zd;d<��Z d=d>��Z!d?d@��Z"dAdB��Z#dCdD��Z$dEdF��Z%dGdH��Z&dIdJ��Z'dKdL��Z(dMS�)N�TestTreeModificationc��C��sl��|�j�d�}d|jd<�|�j|j��|�jd��|jd=�|�j|j��|�jd��d|jd<�|�j|j��|�jd��d�S�) Nzr+��r��zzrB��Zid2z)r$��r/��r��rj��document_for)r��r$��r��r��r��test_attribute_modification��s�� z0TestTreeModification.test_attribute_modificationc��C��sl��t�jd��}|�jd|d�}t||d�}t||d�}d|d<�|jjd|��|jjd |��|�j|jj��d ��d�S�)Nr��z )�builderr/��olzhttp://foo.com/Zhrefr��r=��s4��
)r��lookupr$��r ��r��insertr��ri��)r��r��r$��r/��r��r��r��r��test_new_tag_creation��s��z*TestTreeModification.test_new_tag_creationc��C��s\��d}|�j�|�}|jdd�}|j}|jdd�j|j��|�j|j|��|�j|j��|�jd��d�S�)NzT
Don't leave me here.

Don't leave!
r#��)r��zD
Don't leave me .

Don't leave!here
)r$��r%��r"��rD��r��r��rj��r��)r��docr$��Zsecond_paraZboldr��r��r��!test_append_to_contents_moves_tag��s�� z6TestTreeModification.test_append_to_contents_moves_tagc��C��s0��d}|�j�|�}|j}|j|j�}|�j||��d�S�)Nz)r$��r/��replace_withrW��r��)r��r)��r$��r/��new_ar��r��r��1test_replace_with_returns_thing_that_was_replaced��s �� zFTestTreeModification.test_replace_with_returns_thing_that_was_replacedc��C��s,��d}|�j�|�}|j}|j��}|�j||��d�S�)Nz)r$��r/��unwrapr��)r��r)��r$��r/��r��r��r��r��+test_unwrap_returns_thing_that_was_replaced��s �� z@TestTreeModification.test_unwrap_returns_thing_that_was_replacedc��C��sJ��|�j�d�}|j}|j��|�jd�|j��|�jt|j��|�jt|j|j ��d�S�)NzFooBar) r$��r/��extractr��r��r��r��r��r��rW��)r��r$��r/��r��r��r��Itest_replace_with_and_unwrap_give_useful_exception_when_tag_has_no_parent��s�� z^TestTreeModification.test_replace_with_and_unwrap_give_useful_exception_when_tag_has_no_parentc��C��s:��d}|�j�|�}|j}|jj|��|�j|j��|�j|��d�S�)Nz-Foo )r$��rW��r��r��rj��r��)r��r)��r$��rW��r��r��r��test_replace_tag_with_itself'��s �� z1TestTreeModification.test_replace_tag_with_itselfc��C��s&��d}|�j�|�}|�jt|jj|j��d�S�)Nz)r$��r��r��r"��r��r/��)r��r)��r$��r��r��r��1test_replace_tag_with_its_parent_raises_exception.��s�� zFTestTreeModification.test_replace_tag_with_its_parent_raises_exceptionc��C��s(��d}|�j�|�}|�jt|jjd|j��d�S�)Nzr��)r$��r��r��r/��r��)r��r)��r$��r��r��r��,test_insert_tag_into_itself_raises_exception3��s�� zATestTreeModification.test_insert_tag_into_itself_raises_exceptionc�� C��s��|�j�d�}d}|�j�|�}|jd|��x|jD�]}q,W�t|j�\}}}}|�jd|j��|�jd|j��|�jd|j��|�jd|j��dS�) z�Inserting one BeautifulSoup object into another actually inserts all of its children -- you'll never combine BeautifulSoup objects. z-
And now, a word:
And we're back.
z
p2
p3
r=��zAnd now, a word:�p2�p3zAnd we're back.N)r$��r��Zdescendants�listZchildrenr��r��) r��r$��r)��Z to_insertr��p1r��r��Zp4r��r��r��1test_insert_beautifulsoup_object_inserts_children8��s�� zFTestTreeModification.test_insert_beautifulsoup_object_inserts_childrenc��C��sX��|�j�d�}|j}|jd�}|jdd��|j\}}|jd��|jd��|�jd|jj��d�S�)Nz
onethree
r��r=��Ztwor��Zthree)r$��r/��r��r��ZreplaceWithr��r"��r��)r��r$��r/��r"��left�rightr��r��r��3test_replace_with_maintains_next_element_throughoutL��s�� zHTestTreeModification.test_replace_with_maintains_next_element_throughoutc��C��sl��|�j�d�}|jdd�jd��|jdd�}|j}|�j|j|��|�j|j|��|�j|jj|��|�j|jd��d�S�)NzArgh!zArgh!)r)��zHooray!)r$��r%��r��r"��r��r��r��r��)r��r$��new_textr"��r��r��r��test_replace_final_node[��s�� z,TestTreeModification.test_replace_final_nodec��C��s��|�j�d�}|jjdd��|�j|j��|�jd��|jdd�}|�j|jd��|�j|jj|��|�j|j d��|�j|j j |��|�j|j d��|�j|j|j��d�S�)NzArgh!r=��zHooray!z!Argh!Hooray!)r)��zArgh!)r$��r"��r��r��rj��r��r%��r��r��r��r��rW��)r��r$��r��r��r��r��test_consecutive_text_nodese��s�� z0TestTreeModification.test_consecutive_text_nodesc��C��sT��|�j�d�}|jjdd��|jjdd��|�jddg|jj��|�j|jjd�jd��d�S�)Nzr��r3��rB��)r$��r/��r��r��r��r��)r��r$��r��r��r��test_insert_stringz��s �� z'TestTreeModification.test_insert_stringc��C��s��|�j�}|�jd|d�}t||d�}|jdd��|jjd|��|�j|j��|�jd��|j}|�j|j |��|�j|j |��|jdd �}|�j|j|��|�j|j |��|j}|�j|j |��|�j|j |��|jdd �}|�j|j|��|�j|j|��|�j|j |��d�S�) Nz%Findlady!)r��Zmagictagr��ther=��z=Findthelady!ZFind)r)��)Zdefault_builderr$��r ��r��r/��r��rj��r��r"��r��r��r%��r��r��rW��r��)r��r��r$��Z magic_tagZb_tagr%��Zc_tagr��r��r��r��test_insert_tag��s,�� z$TestTreeModification.test_insert_tagc��C��s0��d}|�j�|�}|jj|j��|�j||j��d�S�)Nz)r$��r/��rD��r"��r��rj��)r��rk��r$��r��r��r��*test_append_child_thats_already_at_the_end��s�� z?TestTreeModification.test_append_child_thats_already_at_the_endc��C��s2��d}|�j�|�}|jjd|j��|�jd|j��d�S�)Nzr��z)r$��r/��r��dr��rj��)r��rk��r$��r��r��r��$test_move_tag_to_beginning_of_parent��s�� z9TestTreeModification.test_move_tag_to_beginning_of_parentc��C��s.��|�j�d�}|jjdd��|�jt|j�d��d�S�)Nz
r=��ZContentsz
Contents
)r$��r��r��r��r(��)r��r$��r��r��r��&test_insert_works_on_empty_element_tag��s�� z;TestTreeModification.test_insert_works_on_empty_element_tagc��C��s`��|�j�d�}|jjd��|jjd��|�j|j��|�jd��|jj|j��|�j|j��|�jd��d�S�)Nzfoobar�BAZ�QUUXzQUUXfooBAZbarzQUUXbarfooBAZ)r$��r"�� insert_beforer/��r��rj��r��)r��r$��r��r��r��test_insert_before��s�� z'TestTreeModification.test_insert_beforec��C��s`��|�j�d�}|jjd��|jjd��|�j|j��|�jd��|jj|j��|�j|j��|�jd��d�S�)Nzfoobarr��r��zfooQUUXbarBAZzQUUXbarfooBAZ)r$��r"��insert_afterr/��r��rj��r��)r��r$��r��r��r��test_insert_after��s�� z&TestTreeModification.test_insert_afterc��C��sR��|�j�d�}|jd�}|jd�}|�jt|j|��|�jt|j|��|�jt|j|��d�S�)Nr��r/��)r$��r��r��r��r��r��NotImplementedError)r��r$��r��r��r��r��r��:test_insert_after_raises_exception_if_after_has_no_meaning��s�� zOTestTreeModification.test_insert_after_raises_exception_if_after_has_no_meaningc��C��sR��|�j�d�}|jd�}|jd�}|�jt|j|��|�jt|j|��|�jt|j|��d�S�)Nr��r/��)r$��r��r��r��r��r ��r��)r��r$��r��r��r��r��r��Ftest_insert_before_raises_notimplementederror_if_before_has_no_meaning��s�� z[TestTreeModification.test_insert_before_raises_notimplementederror_if_before_has_no_meaningc��C��sv��|�j�d�}|jd�\}}|j|��|�j|j��|�jd��|�j|jd��|�j|j|j��|�j|jd��|�j|j d��d�S�)Nz;
There's no business like show business
r"��z0
There's business like no business
�noz business) r$��r-��r��r��rj��r��r��r��r��r��)r��r$��r��Zshowr��r��r��test_replace_with��s�� z&TestTreeModification.test_replace_withc��C��s0��d}|�j�|�}|jj|j��|�jd|j��d�S�)Nzz)r$��r"��r��rW��r��rj��)r��rk��r$��r��r��r��test_replace_first_child��s�� z-TestTreeModification.test_replace_first_childc��C��s0��d}|�j�|�}|jj|j��|�jd|j��d�S�)Nzz)r$��rW��r��r"��r��rj��)r��rk��r$��r��r��r��test_replace_last_child��s�� z,TestTreeModification.test_replace_last_childc��C��s��|�j�d�}|j}|j}|j|��|�j|j��|�jd��|�j|jd��|�j|jdd�j d��|�j|j d��|�j|jd��|�j|jd��|�j|j|j ��|�j|j d��|�j|j j |j��|�j|jd��|jdd�}|j}|�j|j |��|�j|j|��|�j|j |��|�j|j|��d�S�)NzQWereservetherighttorefuseservicez-Werefusetoservicer��)r)��ZWeZto)r$��r"��rr��r��r��rj��r��r��r%��r��r��r��r��r/��e�g)r��r$��Z remove_tagZmove_tagZto_textZg_tagr��r��r��test_nested_tag_replace_with��s.�� z1TestTreeModification.test_nested_tag_replace_withc��C��s6��|�j�d�}|jj��|�j|jd��|�j|jjd��d�S�)NzI
Unneeded formatting is unneeded
zUnneeded formatting is unneeded)r$��emr��r��r��r)��)r��rS��r��r��r��test_unwrap��s �� z TestTreeModification.test_unwrapc��C��sF��|�j�d�}|jj|jd��}|�j|j��d��|�j|j��|�jd��d�S�)NzI wish I was bold.r"��zI wish I was bold.)r$��r��wrapr��r��rj��r��)r��r$��rt��r��r��r�� test_wrap"��s �� zTestTreeModification.test_wrapc��C��s4��|�j�d�}|jjj|j��|�j|j��|�jd��d�S�)NzI wish I was bold.zI wish I was bold.)r$��r"��r��r��r��rj��r��)r��r$��r��r��r��%test_wrap_extracts_tag_from_elsewhere)��s�� z:TestTreeModification.test_wrap_extracts_tag_from_elsewherec��C��sH��|�j�d�}|jjj|j��|�jdt|jj��|�j|j��|�jd��d�S�)Nz+I like being bold.I wish I was bold.r+��z+I like being bold.I wish I was bold.) r$��r"��r��r��r��r,��r��rj��r��)r��r$��r��r��r��&test_wrap_puts_new_contents_at_the_end/��s�� z;TestTreeModification.test_wrap_puts_new_contents_at_the_endc��C��s��|�j�d�}|�jt|jj�d��|jdd�j��}|�j|j��d��|�j|j��d��|�jt|jj�d��|�j|jd��|�j|j d��|�j|j j d��|jdd �}|jd d �}|�j|j |��|�j|j|��|�j|j |��|�j|j|��d�S�)NzRSome content.
Nav crap
More content.r9��Znav)r��z6Some content. More content.z
Nav crap
r+��zSome content. )r)��z More content.) r$��r��r,��r��r��r%��r��rj��r��r��r��r��r��)r��r$��Z extractedZ content_1Z content_2r��r��r��test_extract7��s"��z!TestTreeModification.test_extractc��C��sz��|�j�d�}|jj}|jj}|jd�}|jd�}|jj|��|jj|��|j��|j��|�j||jj��|�j||jj��d�S�)NzfoobarrB��r3��)r$��r/��r��r"��r��rD��r��r��)r��r$��Zfoo_1Zbar_1Zfoo_2Zbar_2r��r��r��4test_extract_distinguishes_between_identical_stringsP��s�� zITestTreeModification.test_extract_distinguishes_between_identical_stringsc��s8��|�j�d��fdd��jd�D��|�jdt��j��d�S�)Nzv c��s��g�|�]}��j�j��qS�r��)�scriptr��)r��r��)r$��r��r��r��m��s��zKTestTreeModification.test_extract_multiples_of_same_tag..r#��z )r$��r-��r��r(��r��)r��r��)r$��r��"test_extract_multiples_of_same_taga��s�� z7TestTreeModification.test_extract_multiples_of_same_tagc��C��s.��|�j�d�}|jd�j��|�jd�|jd��d�S�)Nz hi r��)r$��r%��r��r��)r��r$��r��r��r��Btest_extract_works_when_element_is_surrounded_by_identical_stringsq��s��zWTestTreeModification.test_extract_works_when_element_is_surrounded_by_identical_stringsc��C��sf��|�j�d�}|j}|jj��|�jt|jj�d��|�jt|d��|j }|jdd��|�jdt|j��dS�)zTag.clear()z4
String Italicized and another
r��r��T)Z decomposeN) r$��r/��r��clearr��r,��r��rH��rI��r��)r��r$��r/��r��r��r��r�� test_clearz��s�� zTestTreeModification.test_clearc��C��sB��|�j�d�}d|j_|�j|jjdg��d|j_|�j|jjdg��dS�)zTag.string = 'string'z rB��r3��N)r$��r/��r��r��r��r"��)r��r$��r��r��r��test_string_set��s �� z$TestTreeModification.test_string_setc��C��s,��|�j�d�}|jj|j_|�j|jj��d��d�S�)Nzfoobars��barbar)r$��rW��r��r"��r��r/��ri��)r��r$��r��r��r��/test_string_set_does_not_affect_original_string��s�� zDTestTreeModification.test_string_set_does_not_affect_original_stringc��C��s2��|�j�d�}td�}||j_|�jt|jjt��d�S�)NzrB��)r$��r��r/��r��rH��r��)r��r$��cdatar��r��r��)test_set_string_preserves_class_of_string��s�� z>TestTreeModification.test_set_string_preserves_class_of_stringN))r��r��r ��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r ��r ��r��r��r��r��r��r��r��r��r��r��r��r ��r!��r"��r$��r%��r'��r(��r)��r+��r��r��r��r��r��sL�� $ r��c��@��sx��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��ZdS�)�TestElementObjectsz)Test various features of element objects.c��C��sV��|�j�d�}|�jt|j�d��|�jt|�d��|�jt|j�d��|�jt|jj�d��dS�)z3The length of an element is its number of children.z123r=��r9��N)r$��r��r,��r��r��)r��r$��r��r��r��test_len��s �� zTestElementObjects.test_lenc��C��sL��|�j�d�}|�j|j|jd��|�j|jj|jd�jd��|�j|jd��dS�)z2Accessing a Python member .foo invokes find('foo')zr"��r��N)r$��r��r"��r%��r��r/��)r��r$��r��r��r��test_member_access_invokes_find��s�� z2TestElementObjects.test_member_access_invokes_findc��C��sP��|�j�d�}tjdd��}|j}W�d�Q�R�X�|�j|j|��|�jdt|d�j��d�S�)NzT)�recordzp.bTag is deprecated, use .find("b") instead. If you really were looking for a tag called bTag, use .find("bTag")r��)r$��warnings�catch_warningsZbTagr��r"��r(��message)r��r$��wr��r��r��r��test_deprecated_member_access��s�� z0TestElementObjects.test_deprecated_member_accessc��C��s2��|�j�d�}|�j|jjd��|�j|jjd��dS�)z�has_attr() checks for the presence of an attribute. Please note note: has_attr() is different from __in__. has_attr() checks the tag's attributes and __in__ checks the tag's chidlren. z�attrZattr2N)r$��rH��rB��has_attr�assertFalse)r��r$��r��r��r�� test_has_attr��s�� z TestElementObjects.test_has_attrc��C��s��d}|�j�|d��d�S�)Nz%z%)ZassertSoupEquals)r��r��r��r��r��.test_attributes_come_out_in_alphabetical_order��s��zATestElementObjects.test_attributes_come_out_in_alphabetical_orderc��C��s��|�j�d�}|�j|jjd��d�S�)Nz foorB��)r$��r��r"��r��)r��r$��r��r��r��test_string��s�� zTestElementObjects.test_stringc��C��s��|�j�d�}|�j|jjd��d�S�)Nz)r$��r��r"��r��)r��r$��r��r��r��test_empty_tag_has_no_string��s�� z/TestElementObjects.test_empty_tag_has_no_stringc��C��s`��|�j�d�}|�j|jjd��|�j�d�}|�j|jjd��|�j�d�}|jjdd��|�j|jjd��d�S�)Nzfoozfoobarz foor=��r3��)r$��r��r"��r��r/��r��)r��r$��r��r��r��-test_tag_with_multiple_children_has_no_string��s�� z@TestElementObjects.test_tag_with_multiple_children_has_no_stringc��C��s,��|�j�d�}|�j|jjd��|�j|jd��d�S�)NzfoorB��)r$��r��r/��r��)r��r$��r��r��r��)test_tag_with_recursive_string_has_string��s�� zfeozN)r$��r7��r"��r��)r��r$��r��r��r��test_lack_of_string��s�� z&TestElementObjects.test_lack_of_stringc��C��s`��|�j�d�}|�j|jjd��|�j|jjdd�d��|�j|jjd�d��|�j|jjddd�d��d S�) zBTag.text and Tag.get_text(sep=u"") -> all child text, concatenatedzar t zar t T)�stripZart�,z a,r, , t za,r,tN)r$��r��r/��r)��get_text)r��r$��r��r��r�� test_all_text��s �� z TestElementObjects.test_all_textc��C��sJ��|�j�d�}|�j|j��d��|�j|jttfd�d��|�j|jd�d�d��d�S�)NzfoobarZfoobar)�typesZfooIGNOREbar)r$��r��rA��r��r��)r��r$��r��r��r��test_get_text_ignores_comments��s�� z1TestElementObjects.test_get_text_ignores_commentsc��C��s$��|�j�d�}|�jddgt|j��d�S�)NzfoobarrB��r3��)r$��r��r��Zstrings)r��r$��r��r��r��!test_all_strings_ignores_comments��s�� z4TestElementObjects.test_all_strings_ignores_commentsN)r��r��r ��r1��r-��r.��r4��r8��r9��r:��r;��r<��r=��r>��rB��rD��rE��r��r��r��r��r,��s�� r,��c��@��sP��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��ZdS�)�TestCDAtaListAttributesz0Testing cdata-list attributes like 'class'. c��C��s"��|�j�d�}|�jdg|jd��d�S�)NzrB��rm��)r$��r��r/��)r��r$��r��r��r��test_single_value_becomes_list ��s�� z6TestCDAtaListAttributes.test_single_value_becomes_listc��C��s$��|�j�d�}|�jddg|jd��d�S�)NzrB��r3��rm��)r$��r��r/��)r��r$��r��r��r��!test_multiple_values_becomes_list��s�� z9TestCDAtaListAttributes.test_multiple_values_becomes_listc��C��s&��|�j�d�}|�jdddg|jd��d�S�)NzrB��r3��r��rm��)r$��r��r/��)r��r$��r��r��r��2test_multiple_values_separated_by_weird_whitespace��s�� zJTestCDAtaListAttributes.test_multiple_values_separated_by_weird_whitespacec��C��s ��|�j�d�}|�jd|jj��d�S�)Nzs��)r$��r��r/��ri��)r��r$��r��r��r��,test_attributes_joined_into_string_on_output��s�� zDTestCDAtaListAttributes.test_attributes_joined_into_string_on_outputc��C��s$��|�j�d�}|�jdg|jjd��d�S�)Nzzabc defr��)r$��r��r/��Zget_attribute_list)r��r$��r��r��r��test_get_attribute_list��s�� z/TestCDAtaListAttributes.test_get_attribute_listc��C��s$��|�j�d�}|�jddg|jd��d�S�)Nz(
z ISO-8859-1zUTF-8zaccept-charset)r$��r��Zform)r��r$��r��r��r��test_accept_charset!��s�� z+TestCDAtaListAttributes.test_accept_charsetc��C��s$��d}|�j�|�}|�jd|jd��d�S�)Nz)zISO-8859-1 UTF-8zaccept-charset)r$��r��r/��)r��rk��r$��r��r��r��-test_cdata_attribute_applying_only_to_one_tag%��s�� zETestCDAtaListAttributes.test_cdata_attribute_applying_only_to_one_tagc��s6��|�j�d�j��|�jd��j��fdd�}|�jt|��d�S�)Nr��c��s ��d��_�d�S�)NrB��)rN��r��)r��r��r��t0��s��zJTestCDAtaListAttributes.test_string_has_immutable_name_property..t)r$��r��r��rN��r��AttributeError)r��rN��r��)r��r��'test_string_has_immutable_name_property-��s��z?TestCDAtaListAttributes.test_string_has_immutable_name_propertyN)r��r��r ��r1��rG��rH��rI��rJ��rK��rL��rM��rP��r��r��r��r��rF�� s��rF��c��s`��e�Zd�ZdZ��fdd�Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Z��Z S�)�TestPersistencez*Testing features like pickle and deepcopy.c��s&��t�t|��j��d|�_|�j|�j�|�_d�S�)Nay�� Beautiful Soup: We called him Tortoise because he taught us. foo bar )rQ��rQ��rR��Zpager$��rS��)r��)rT��r��r��rR��7��s��zTestPersistence.setUpc��C��s@��t�j|�jd�}t�j|�}|�j|jt��|�j|j��|�jj��d�S�)Nr+��)�pickle�dumpsrS��loadsr��rT��r��rj��)r��dumped�loadedr��r��r��!test_pickle_and_unpickle_identityK��s�� z1TestPersistence.test_pickle_and_unpickle_identityc��C��s&��t�j|�j�}|�j|j��|�jj��d�S�)N)�copy�deepcopyrS��r��rj��)r��Zcopiedr��r��r��test_deepcopy_identityS��s��z&TestPersistence.test_deepcopy_identityc��C��s:��t�dd�}|j}|j��}|�jdt|��|�j||j��d�S�)Ns ��

zhtml.parseru ��

)r��Zoriginal_encoding�__copy__r��r(��)r��r$��encodingrX��r��r��r��test_copy_preserves_encodingX��s �� z,TestPersistence.test_copy_preserves_encodingc��C��s>��d}|�j�|�}tj|tj�}tj|�}|�j|j��|j��d�S�)Nu ��☃)r$��rR��rS��ZHIGHEST_PROTOCOLrT��r��rj��)r��r��r$��rU��rV��r��r��r��test_unicode_pickle_��s �� z#TestPersistence.test_unicode_picklec��C��sz��d}|�j�|�}|jdd�}tj|�}|�j||��|�jd�|j��|�jd�|j��|�jd�|j��|�jd�|j��|�jd�|j��d�S�)NzFooBarr4��)r��) r$��r%��rX��r��r��r��assertNotEqualr��r��)r��r��r$��s1�s2r��r��r��1test_copy_navigablestring_is_not_attached_to_treeg��s�� zATestPersistence.test_copy_navigablestring_is_not_attached_to_treec��C��s>��d}|�j�|�}|j}tj|�}|�j||��|�jt|t��d�S�)Nz)r$��r��rX��r��rH��r��r��)r��r��r$��r`��ra��r��r��r��0test_copy_navigablestring_subclass_has_same_types��s�� z@TestPersistence.test_copy_navigablestring_subclass_has_same_typec��C��s(��d}|�j�|�}tj|�}|�j||��d�S�)Nz)
FooBar
end)r$��rX��r��)r��r��r$��Z soup_copyr��r��r��test_copy_entire_soup{��s�� z%TestPersistence.test_copy_entire_soupc��C��s��d}|�j�|�}|j}tj|�}|�jt|�t|��|�j||��|�j||k��|�jd�|j��|�jd�|j��|�jd�|jdd�j ��|�j d�|jdd�j ��d�S�)Nz)
FooBar
endZBar)r��)r$��ra��rX��r��r(��r7��r��r��r%��r��r_��)r��r��r$��ra��Zdiv_copyr��r��r��test_copy_tag_copies_contents��s�� z-TestPersistence.test_copy_tag_copies_contents)r��r��r ��r1��rR��rW��rZ��r]��r^��rb��rc��rd��re��rc��r��r��)rT��r��rQ��4��s��rQ��c��@��s��e�Zd�Zdd��Zdd��Zdd��Zdd��Zd d ��Zdd��Zd d��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��Zdd��Zdd ��Zd!S�)"�TestSubstitutionsc��C��s0��d}|�j�|�}|jdd�}|�j||�jd��d�S�)Nu#��<<Sacré bleu!>>�minimal)� formatter)r$��rj��r��r��)r��r��r$��decodedr��r��r��!test_default_formatter_is_minimal��s�� z3TestSubstitutions.test_default_formatter_is_minimalc��C��s0��d}|�j�|�}|jdd�}|�j||�jd��d�S�)Nu'��
<<Sacré bleu!>>r��)rh��z.
<<Sacré bleu!>>)r$��rj��r��r��)r��r��r$��ri��r��r��r��test_formatter_html��s�� z%TestSubstitutions.test_formatter_htmlc��C��s0��d}|�j�|�}|jdd�}|�j||�jd��d�S�)Nu'��
<<Sacré bleu!>>Zhtml5)rh��z-
<<Sacré bleu!>>)r$��rj��r��r��)r��r��r$��ri��r��r��r��test_formatter_html5��s�� z&TestSubstitutions.test_formatter_html5c��C��s0��d}|�j�|�}|jdd�}|�j||�jd��d�S�)Nu#��<<Sacré bleu!>>rg��)rh��)r$��rj��r��r��)r��r��r$��ri��r��r��r��test_formatter_minimal��s�� z(TestSubstitutions.test_formatter_minimalc��C��s0��d}|�j�|�}|jd�d�}|�j||�jd��d�S�)Nu#��<<Sacré bleu!>>)rh��u��<>)r$��rj��r��r��)r��r��r$��ri��r��r��r��test_formatter_null��s �� z%TestSubstitutions.test_formatter_nullc��C��s4��d}|�j�|�}|jdd��d�}|�j||�jd��d�S�)Nz!<foo>bar
c��S��s��|�j��S�)N)�upper)�xr��r��r��s��z9TestSubstitutions.test_formatter_custom..)rh��zBAR
)r$��rj��r��r��)r��r��r$��ri��r��r��r��test_formatter_custom��s�� z'TestSubstitutions.test_formatter_customc��C��s��d}|�j�|�}|j}d}|�j||j��|�j||jdd��d}|�j||jdd��|�j||jd�d��d}|�j||jdd ��d��d�S�) Nu%��eu)��erg��)rh��z/er��u%��Ec��S��s��|�j��S�)N)ro��)rp��r��r��r��rq��s��zMTestSubstitutions.test_formatter_is_run_on_attribute_values..)r$��r/��r��rj��)r��r��r$��r/��Zexpect_minimalZexpect_htmlZexpect_upperr��r��r��)test_formatter_is_run_on_attribute_values��s�� z;TestSubstitutions.test_formatter_is_run_on_attribute_valuesc��C��s$��d}t�|d�j��}|�jd|k��d�S�)NzO zhtml.parsers��< < hey > >)r��ri��rH��)r��r��encodedr��r��r��2test_formatter_skips_script_tag_for_html_documents��s��zDTestSubstitutions.test_formatter_skips_script_tag_for_html_documentsc��C��s$��d}t�|d�j��}|�jd|k��d�S�)NzF zhtml.parsers��< < hey > >)r��ri��rH��)r��r��rt��r��r��r��1test_formatter_skips_style_tag_for_html_documents��s��zCTestSubstitutions.test_formatter_skips_style_tag_for_html_documentsc��C��s ��|�j�d�}|�jd|jj��d�S�)Nz*
foo
bar
baz z/
foo
bar
baz
)r$��r��ra��prettify)r��r$��r��r��r��,test_prettify_leaves_preformatted_text_alone��s�� z>TestSubstitutions.test_prettify_leaves_preformatted_text_alonec��C��s,��t�dd�}|jdd��d�}|�jd|k��d�S�)Nzfoozhtml.parserc��S��s��|�j��S�)N)ro��)rp��r��r��r��rq��s��zLTestSubstitutions.test_prettify_accepts_formatter_function..)rh��ZFOO)r��rw��rH��)r��r$��Zprettyr��r��r��(test_prettify_accepts_formatter_function��s�� z:TestSubstitutions.test_prettify_accepts_formatter_functionc��C��s"��|�j�d�}|�jtt|j��d�S�)Nz)r$��r��r(��typerw��)r��r$��r��r��r��(test_prettify_outputs_unicode_by_default��s�� z:TestSubstitutions.test_prettify_outputs_unicode_by_defaultc��C��s$��|�j�d�}|�jtt|jd��d�S�)Nzzutf-8)r$��r��bytesrz��rw��)r��r$��r��r��r��test_prettify_can_encode_data��s�� z/TestSubstitutions.test_prettify_can_encode_datac��C��s0��d}|�j�|�}|jjd�}|�j||jd��d�S�)Nu��Sacré bleu!zutf-8)r$��r"��ri��r��)r��r��r$��rt��r��r��r��,test_html_entity_substitution_off_by_default��s�� z>TestSubstitutions.test_html_entity_substitution_off_by_defaultc��C��s��d}|�j�|�}|�j|jd�d��|jd�}|�jd|k��|jd�}|�jd|k��|jd�}|�jd |k��|jd �jd �}|�jd|k��d�S�)NzEZcontentztext/html; charset=x-sjiszutf-8s ��charset=utf-8�euc_jps��charset=euc_jpz shift-jiss��charset=shift-jiszutf-16zcharset=utf-16)r$��r��metari��rH��rj��)r��Zmeta_tagr$��utf_8r�� shift_jisZutf_16_ur��r��r��test_encoding_substitution��s�� z,TestSubstitutions.test_encoding_substitutionc��C��s2��d}t�d�}|�j||d�}|�j|jd�jd��d�S�)Nz`
foo
Zpre)Z parse_onlyr��)r��r$��r��r��rN��)r��r��ry��r$��r��r��r��;test_encoding_substitution_doesnt_happen_if_tag_is_strained$��s��zMTestSubstitutions.test_encoding_substitution_doesnt_happen_if_tag_is_strainedN)r��r��r ��rj��rk��rl��rm��rn��rr��rs��ru��rv��rx��ry��r{��r}��r~��r��r��r��r��r��r��rf��s �� rf��c��@��sP��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��ZdS�)�TestEncodingz0Test the ability to encode objects into strings.c��C��s.��d}|�j�|�}|�j|jjjd�djd��d�S�)Nu ��☃zutf-8u��☃)r$��r��r"��r��ri��)r��r��r$��r��r��r��"test_unicode_string_can_be_encoded2��s�� z/TestEncoding.test_unicode_string_can_be_encodedc��C��s,��d}|�j�|�}|�j|jjd�|jd��d�S�)Nu ��☃zutf-8)r$��r��r"��ri��)r��r��r$��r��r��r��1test_tag_containing_unicode_string_can_be_encoded8��s�� z>TestEncoding.test_tag_containing_unicode_string_can_be_encodedc��C��s&��d}|�j�|�}|�j|jjd�d��d�S�)Nu ��☃�asciis��☃)r$��r��r"��ri��)r��r��r$��r��r��r��s�� zITestEncoding.test_encoding_substitutes_unrecognized_characters_by_defaultc��C��s&��d}|�j�|�}|�jt|jddd��d�S�)Nu ��☃r��strict)�errors)r$��r��UnicodeEncodeErrorri��)r��r��r$��r��r��r�� test_encoding_can_be_made_strictC��s�� z-TestEncoding.test_encoding_can_be_made_strictc��C��s$��d}|�j�|�}|�jd|jj��d�S�)Nu ��☃u��☃)r$��r��r"��Zdecode_contents)r��r��r$��r��r��r��test_decode_contentsI��s�� z!TestEncoding.test_decode_contentsc��C��s.��d}|�j�|�}|�jdjd�|jjdd��d�S�)Nu ��☃u��☃rg��)r\��)r$��r��ri��r"��Zencode_contents)r��r��r$��r��r��r��test_encode_contentsN��s �� z!TestEncoding.test_encode_contentsc��C��s*��d}|�j�|�}|�jdjd�|jj��d�S�)Nu ��☃u��☃rg��)r$��r��ri��r"��ZrenderContents)r��r��r$��r��r��r��test_deprecated_renderContentsU��s�� z+TestEncoding.test_deprecated_renderContentsc��C��s8��d}|�j�|�}tr$|�j|t|��n|�jdt|��d�S�)Nu ��☃s ��\u2603)r$��r��r��repr)r��r��r$��r��r��r�� test_repr[��s �� zTestEncoding.test_reprN)r��r��r ��r1��r��r��r��r��r��r��r��r��r��r��r��r��r��/��s��r��c��@��s,��e�Zd�Zdd��Zdd��Zdd��Zdd��Zd S�) �TestNavigableStringSubclassesc��C��sX��|�j�d�}td�}|jd|��|�jt|�d��|�j|jdd�d��|�j|jd�d��d�S�)Nr��rB��r=��z)r)��r��)r$��r��r��r��r(��r%��r��)r��r$��r*��r��r��r�� test_cdatae��s�� z(TestNavigableStringSubclasses.test_cdatac��sV��d��_��fdd�}��jd�}td�}|jd|��jd|j|d��jd��j��d S�) zkText inside a CData object is passed into the formatter. But the return value is ignored. r��c��s��j�d7��_�dS�)Nr=��zBITTER FAILURE)�count)�args)r��r��r�� incrementv��s��zNTestNavigableStringSubclasses.test_cdata_is_never_formatted..incrementr��z<><><>r=��s��<><>]]>)rh��N)r��r$��r��r��r��ri��)r��r��r$��r*��r��)r��r��test_cdata_is_never_formattedo��s�� z;TestNavigableStringSubclasses.test_cdata_is_never_formattedc��C��s2��t�d�}|�jd�}|jd|��|�j|j��d��d�S�)NrB��r��r=��s�� )r ��r$��r��r��ri��)r��Zdoctyper$��r��r��r��test_doctype_ends_in_newline��s�� z:TestNavigableStringSubclasses.test_doctype_ends_in_newlinec��C��s��t�d�}|�jd|j��d�S�)NrB��z)r ��r��Zoutput_ready)r��r��r��r��r��test_declaration��s��z.TestNavigableStringSubclasses.test_declarationN)r��r��r ��r��r��r��r��r��r��r��r��r��c��s�� r��c��@��s��e�Zd�ZdZdd��Zdd��ZeZdd��Zdd ��Zd d��Z dd ��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��Zdd��Zdd��Zdd��Zd d!��Zd"d#��Zd$d%��Zd&d'��Zd(d)��Zd*d+��Zd,d-��Zd.d/��Zd0d1��Zd2d3��Zd4d5��Zd6d7��Zd8d9��Z d:d;��Z!dd?��Z#d@dA��Z$dBdC��Z%dDdE��Z&dFdG��Z'dHdI��Z(dJdK��Z)dLdM��Z*dNdO��Z+dPdQ��Z,dRdS��Z-dTdU��Z.dVdW��Z/dXdY��Z0dZd[��Z1d\d]��Z2d^d_��Z3d`da��Z4dbdc��Z5ddde��Z6dfdg��Z7dhdi��Z8djdk��Z9dldm��Z:dndo��Z;dpdq��Z The title Hello there.

An H1

Some text

Some more text

An H2

Another
Bob
Another H2
me span1a1 span1a2 test span2a1

English

English UK

English US

French

c��C��s��t�|�jd�|�_d�S�)Nzhtml.parser)r��HTMLr$��)r��r��r��r��rR��s��zTestSoupSelector.setUpc��K��sR��dd��|�j�j|f|�D��}|j��|j��|�j||d|dj|�dj|�f��d�S�)Nc��S��s��g�|�]}|d��qS�)r��r��)r��elr��r��r��r��s��z2TestSoupSelector.assertSelects..z$Selector %s, expected [%s], got [%s]z, )r$��select�sortr��join)r��selector�expected_ids�kwargsZel_idsr��r��r��r��s��zTestSoupSelector.assertSelectsc��G��s"��x|D�]\}}|�j�||��qW�d�S�)N)�assertSelect)r��Ztestsr��r��r��r��r��assertSelectMultiple��s��z%TestSoupSelector.assertSelectMultiplec��C��sF��|�j�jd�}|�jt|�d��|�j|d�jd��|�j|d�jdg��d�S�)Nrh��r=��r��z The title)r$��r��r��r,��rN��r��)r��elsr��r��r��test_one_tag_one��s��z!TestSoupSelector.test_one_tag_onec��C��sX��|�j�jd�}|�jt|�d��x|D�]}|�j|jd��q"W�|�j�jd�}|�jd|d��d�S�)Nra��mainr��)r$��r��r��r,��rN�� select_one)r��r��ra��r��r��r��r��test_one_tag_many��s�� z"TestSoupSelector.test_one_tag_manyc��C��s��|�j�jd�}|�jd�|��d�S�)NZnonexistenttag)r$��r��r��)r��matchr��r��r��(test_select_one_returns_none_if_no_match��s��z9TestSoupSelector.test_select_one_returns_none_if_no_matchc��C��s ��|�j�jd�}|�jdddg��d�S�)Nzdiv div�inner�data1)r$��r��r��)r��r��r��r��r��test_tag_in_tag_one��s��z$TestSoupSelector.test_tag_in_tag_onec��C��s&��x dD�]}|�j�|ddddg��qW�d�S�) N�html div� html body div�body divr��r��r��footer)r��r��r��)r��)r��r��r��r��r��test_tag_in_tag_many��s�� z%TestSoupSelector.test_tag_in_tag_manyc��C��sB��|�j�ddgdd��|�j�dddgdd��|�j�dd ddd gdd��d�S�)Nzhtml divr��r=��)r:��z html body divr��r+��zbody divr��r��r>��)r��)r��r��r��r�� test_limit��s��zTestSoupSelector.test_limitc��C��s��|�j�t|�jjd��d��d�S�)N�delr��)r��r,��r$��r��)r��r��r��r��test_tag_no_match��s��z"TestSoupSelector.test_tag_no_matchc��C��s��|�j�t|�jjd��d�S�)Nztag%t)r��r��r$��r��)r��r��r��r��test_invalid_tag��s��z!TestSoupSelector.test_invalid_tagc��C��s��|�j�dddg��d�S�)Nzcustom-dashed-tag�dash1�dash2)r��)r��r��r��r��test_select_dashed_tag_ids��s��z+TestSoupSelector.test_select_dashed_tag_idsc��C��s6��|�j�jd�}|�j|d�jd��|�j|d�d�d��d�S�)Nzcustom-dashed-tag[id="dash2"]r��zcustom-dashed-tagr��r��)r$��r��r��rN��)r��Zdashedr��r��r��test_select_dashed_by_id��s��z)TestSoupSelector.test_select_dashed_by_idc��C��s��|�j�|�jjd�d�jd��d�S�)Nzbody > custom-dashed-tagr��zHello there.)r��r$��r��r)��)r��r��r��r��test_dashed_tag_text��s��z%TestSoupSelector.test_dashed_tag_textc��C��s ��|�j�|�jjd�|�jjd��d�S�)Nzcustom-dashed-tag)r��r$��r��r-��)r��r��r��r��#test_select_dashed_matches_find_all��s��z4TestSoupSelector.test_select_dashed_matches_find_allc��C��s��|�j�ddgfdddgf��d�S�)NZh1�header1Zh2�header2�header3)r��)r��r��r��r��test_header_tags ��s��z!TestSoupSelector.test_header_tagsc��C��sV��xPd D�]H}|�j�j|�}|�jt|�d��|�j|d�jd��|�j|d�d�dg��qW�d�S�) N�.onep�p.onep�html p.onepr=��r��r��rm��onep)r��r��r��)r$��r��r��r,��rN��)r��r��r��r��r��r��test_class_one��s �� zTestSoupSelector.test_class_onec��C��s ��|�j�jd�}|�jt|�d��d�S�)Nzdiv.onepr��)r$��r��r��r,��)r��r��r��r��r��test_class_mismatched_tag��s��z*TestSoupSelector.test_class_mismatched_tagc��C��s ��xdD�]}|�j�|dg��qW�d�S�)N� div#inner�#inner� div div#innerr��)r��r��r��)r��)r��r��r��r��r��test_one_id��s�� zTestSoupSelector.test_one_idc��C��s ��|�j�jd�}|�jt|�d��d�S�)Nz #doesnotexistr��)r$��r��r��r,��)r��r��r��r��r��test_bad_id��s��zTestSoupSelector.test_bad_idc��C��sf��|�j�jd�}|�jt|�d��x|D�]}|�j|jd��q"W�|�j|d�d�dg��|�j|d�jd��d�S�)Nzdiv#inner pr9��r��r=��rm��r��r��)r$��r��r��r,��rN��r7��r6��)r��r��r��r��r��r��test_items_in_id#��s�� z!TestSoupSelector.test_items_in_idc��C��s*��x$dD�]}|�j�t|�jj|��d��qW�d�S�)N�div#main del�div#main div.oops�div div#mainr��)r��r��r��)r��r,��r$��r��)r��r��r��r��r��test_a_bunch_of_emptys+��s�� z'TestSoupSelector.test_a_bunch_of_emptysc��C��s ��xd D�]}|�j�|d g��qW�d�S�)N�.class1�p.class1�.class2�p.class2�.class3�p.class3� html p.class2�div#inner .class2�pmulti)r��r��r��r��r��r��r��r��)r��)r��r��r��r��r��test_multi_class_support/��s��z)TestSoupSelector.test_multi_class_supportc��C��s ��xdD�]}|�j�|dg��qW�d�S�)N�.class1.class3�.class3.class2�.class1.class2.class3r��)r��r��r��)r��)r��r��r��r��r��test_multi_class_selection4��s��z+TestSoupSelector.test_multi_class_selectionc��C��s"��|�j�dddg��|�j�ddg��d�S�)Nz.s1 > a�s1a1�s1a2z.s1 > a span�s1a2s1)r��)r��r��r��r��test_child_selector9��s��z$TestSoupSelector.test_child_selectorc��C��s��|�j�ddg��d�S�)Nz.s1 > a#s1a2 spanr��)r��)r��r��r��r��test_child_selector_id=��s��z'TestSoupSelector.test_child_selector_idc��C��st��|�j�ddgfddgfddgfddgfddgfddgfd dgfd g�fddgfddgfd dgfdg�fdg�fdg�f��d�S�)Nzp[class="onep"]r��z p[id="p1"]z[class="onep"]z [id="p1"]zlink[rel="stylesheet"]�l1zlink[type="text/css"]zlink[href="blah.css"]zlink[href="no-blah.css"]z[rel="stylesheet"]z[type="text/css"]z[href="blah.css"]z[href="no-blah.css"]zp[href="no-blah.css"])r��)r��r��r��r��test_attribute_equals@��s��z&TestSoupSelector.test_attribute_equalsc��C��s\��|�j�ddgfddgfddgfddgfddgfddgfdd gfd d gfdd gfdd gf� �d�S�) Nzp[class~="class1"]r��zp[class~="class2"]zp[class~="class3"]z[class~="class1"]z[class~="class2"]z[class~="class3"]za[rel~="friend"]�bobz a[rel~="met"]z[rel~="friend"]z[rel~="met"])r��)r��r��r��r��test_attribute_tildeR��s��z%TestSoupSelector.test_attribute_tildec��C��sv��|�j�ddgfddgfdg�fdg�fdg�fddgfdd d gfdd d gfdd dgfdd dgfddgfdd gfddgf� �d�S�)Nz[rel^="style"]r��zlink[rel^="style"]znotlink[rel^="notstyle"]z[rel^="notstyle"]zlink[rel^="notstyle"]zlink[href^="bla"]za[href^="http://"]r��mez[href^="http://"]z [id^="p"]r��r��z [id^="m"]r��zdiv[id^="m"]z a[id^="m"]zdiv[data-tag^="dashed"]r��)r��)r��r��r��r��test_attribute_startswith`��s�� z*TestSoupSelector.test_attribute_startswithc�� C��sH��|�j�ddgfddgfddgfdddddd d ddgfd dgfdg�f��d�S�)Nz[href$=".css"]r��zlink[href$=".css"]z link[id$="1"]z [id$="1"]r��r��r��r��s2a1r��r��zdiv[id$="1"]z[id$="noending"])r��)r��r��r��r��test_attribute_endswithq��s��z(TestSoupSelector.test_attribute_endswithc��C��s��|�j�ddgfddgfdg�fdg�fdg�fddgfdd d gfddd gfddgfdd gfddgfddgfddgfdddd ddddddg fddgfdg�fdd d dgfdd d gfd dgfd!dd"gfd#d"gfd$dgf��d�S�)%Nz[rel*="style"]r��zlink[rel*="style"]znotlink[rel*="notstyle"]z[rel*="notstyle"]zlink[rel*="notstyle"]zlink[href*="bla"]z[href*="http://"]r��r��z [id*="p"]r��r��zdiv[id*="m"]r��z a[id*="m"]z[href*=".css"]zlink[href*=".css"]z link[id*="1"]z [id*="1"]r��r��r��r��r��r��r��zdiv[id*="1"]z[id*="noending"]z[href*="."]za[href*="."]zlink[href*="."]zdiv[id*="n"]r��z div[id*="nn"]zdiv[data-tag*="edval"])r��)r��r��r��r��test_attribute_contains{��s.�� z(TestSoupSelector.test_attribute_containsc��C��s2��|�j�ddddgfddddgfddgfdg�f��d�S�) Nz p[lang|="en"]zlang-enz lang-en-gbz lang-en-usz[lang|="en"]z p[lang|="fr"]zlang-frz p[lang|="gb"])r��)r��r��r��r��test_attribute_exact_or_hypen��s ��z.TestSoupSelector.test_attribute_exact_or_hypenc�� C��sV��|�j�ddddgfddgfdddgfddd d dgfdd dgfdg�fdg�fddgf��d�S�)Nz[rel]r��r��r��z link[rel]za[rel]z[lang]zlang-enz lang-en-gbz lang-en-uszlang-frzp[class]r��r��z[blah]zp[blah]z div[data-tag]r��)r��)r��r��r��r��test_attribute_exists��s�� z&TestSoupSelector.test_attribute_existsc��C��s,��d}t�|d�}|jd�\}|�jd|j��d�S�)Nz]
nope

yes
zhtml.parserzdiv[style="display: right"]�yes)r��r��r��r��)r��r��r$��Zchosenr��r��r��"test_quoted_space_in_selector_name��s�� z3TestSoupSelector.test_quoted_space_in_selector_namec��C��s(��|�j�t|�jjd��|�j�t|�jjd��d�S�)Nza:no-such-pseudoclassza:nth-of-type(a))r��r��r$��r��)r��r��r��r��test_unsupported_pseudoclass��s��z-TestSoupSelector.test_unsupported_pseudoclassc��C��s��|�j�jd�}|�jt|�d��|�j|d�jd��|�j�jd�}|�jt|�d��|�j|d�jd��|�j�jd�}|�jt|�d��|�jt|�j�jd��d�S�) Nzdiv#inner p:nth-of-type(1)r=��r��z Some textzdiv#inner p:nth-of-type(3)ZAnotherzdiv#inner p:nth-of-type(4)zdiv p:nth-of-type(0))r$��r��r��r,��r��r��r��)r��r��r��r��r��test_nth_of_type��s��z!TestSoupSelector.test_nth_of_typec��C��s2��|�j�jd�}|�jt|�d��|�j|d�jd��d�S�)Nzdiv#inner > p:nth-of-type(1)r=��r��z Some text)r$��r��r��r,��r��)r��r��r��r��r��"test_nth_of_type_direct_descendant��s��z3TestSoupSelector.test_nth_of_type_direct_descendantc��C��s��|�j�ddg��d�S�)Nz#inner > p:nth-of-type(2)r��)r��)r��r��r��r��"test_id_child_selector_nth_of_type��s��z3TestSoupSelector.test_id_child_selector_nth_of_typec��C��s.��|�j�jddd�}|jd�}|�j|ddg��d�S�)Nra��r��)r��r��r��)r$��r%��r��r��)r��r��selectedr��r��r��test_select_on_element��s�� z'TestSoupSelector.test_select_on_elementc��C��s��|�j�ddg��|�j�dg��d�S�)Nz .fancy #innerr��z.normal #inner)r��)r��r��r��r��test_overspecified_child_id��s��z,TestSoupSelector.test_overspecified_child_idc��C��sB��|�j�ddg��|�j�ddg��|�j�ddg��|�jg�|�jjd��d�S�)Nz#p1 + h2r��z#p1 + h2 + pr��z#p1 + #header2 + .class1z#p1 + p)r��r��r$��r��)r��r��r��r��test_adjacent_sibling_selector��s��z/TestSoupSelector.test_adjacent_sibling_selectorc��C��sR��|�j�dddg��|�j�ddg��|�j�ddg��|�j�ddg��|�jg�|�jjd��d�S�) Nz#p1 ~ h2r��r��z#p1 ~ #header2z#p1 ~ h2 + ar��z#p1 ~ h2 + [rel="me"]z#inner ~ h2)r��r��r$��r��)r��r��r��r��test_general_sibling_selector��s ��z.TestSoupSelector.test_general_sibling_selectorc��C��s��|�j�t|�jjd��d�S�)Nzh1 >)r��r��r$��r��)r��r��r��r��test_dangling_combinator��s��z)TestSoupSelector.test_dangling_combinatorc��C��s��|�j�ddddg��d�S�)Nzp[lang] ~ pz lang-en-gbz lang-en-uszlang-fr)r��)r��r��r��r��2test_sibling_combinator_wont_select_same_tag_twice��s��zCTestSoupSelector.test_sibling_combinator_wont_select_same_tag_twicec��C��s��|�j�dddg��d�S�)Nzx, y�xid�yid)r��)r��r��r��r��test_multiple_select��s��z%TestSoupSelector.test_multiple_selectc��C��s��|�j�dddg��d�S�)Nzx,yr��r��)r��)r��r��r��r��"test_multiple_select_with_no_space��s��z3TestSoupSelector.test_multiple_select_with_no_spacec��C��s��|�j�dddg��d�S�)Nzx, yr��r��)r��)r��r��r��r��$test_multiple_select_with_more_space��s��z5TestSoupSelector.test_multiple_select_with_more_spacec��C��s��|�j�ddg��d�S�)Nzx, xr��)r��)r��r��r��r��test_multiple_select_duplicated��s��z0TestSoupSelector.test_multiple_select_duplicatedc��C��s��|�j�dddg��d�S�)Nzx, y ~ p[lang=fr]r��zlang-fr)r��)r��r��r��r��test_multiple_select_sibling��s��z-TestSoupSelector.test_multiple_select_siblingc��C��s��|�j�dddg��d�S�)Nzx, y > zr��zidb)r��)r��r��r��r��.test_multiple_select_tag_and_direct_descendant��s��z?TestSoupSelector.test_multiple_select_tag_and_direct_descendantc��C��s��|�j�dddddddg��d�S�)Nz div > x, y, zr��r��zidar��zidab�zidac)r��)r��r��r��r��/test_multiple_select_direct_descendant_and_tags ��s��z@TestSoupSelector.test_multiple_select_direct_descendant_and_tagsc��C��s��|�j�dddddddg��d�S�)Nzdiv x,y, zr��r��r��r��r ��r ��)r��)r��r��r��r��(test_multiple_select_indirect_descendant ��s��z9TestSoupSelector.test_multiple_select_indirect_descendantc��C��s(��|�j�t|�jjd��|�j�t|�jjd��d�S�)Nz,x, yzx,,y)r��r��r$��r��)r��r��r��r��test_invalid_multiple_select��s��z-TestSoupSelector.test_invalid_multiple_selectc��C��s��|�j�dddg��d�S�)Nzp[lang=en], p[lang=en-gb]zlang-enz lang-en-gb)r��)r��r��r��r��test_multiple_select_attrs��s��z+TestSoupSelector.test_multiple_select_attrsc��C��s��|�j�ddddg��d�S�)Nz*x, y > z[id=zida], z[id=zidab], z[id=zidb]r��r��r ��)r��)r��r��r��r��test_multiple_select_ids��s��z)TestSoupSelector.test_multiple_select_idsc��C��s��|�j�dddg��d�S�)Nzbody > div > x, y > zr��r��)r��)r��r��r��r��test_multiple_select_nested��s��z,TestSoupSelector.test_multiple_select_nestedc��C��sF��d}t�|d�}|jd�}|�jdt|��x|jddgd�D�]}q:W�d�S�)Nz3
zhtml.parserz.c1, .c2r9��Zc1Zc2)ro��)r��r��r��r,��r-��)r��r��r$��r��r��r��r��r��test_select_duplicate_elements��s�� z/TestSoupSelector.test_select_duplicate_elementsN)>r��r��r ��r��rR��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r��r ��r��r��r��r��r��r��r��r��r��sv��1 r��)2r1��Zpdbr��rX��rR��r6��r0��Zbs4r��Zbs4.builderr��r��Zbs4.elementr��r��r��r ��r ��r��r��r ��Zbs4.testingr��r��r��r��ZLXML_PRESENTr��r!��r2��rL��rP��rd��r��r��r��r��r��r��r��r��r��r��r,��rF��rQ��rf��r��r��r��r��r��r��r��sN��( ;O�83(3--*��6n+a�4*PK��je[= �u��u��0��tests/__pycache__/test_docs.cpython-36.opt-1.pycnu��[��3 ��O+��@��sD��d�Z�eZdgZddlZddlZddlZddlZejej B�ej B�ZdS�)zTest harness for doctests.Zadditional_tests��N)�__doc__�typeZ __metaclass__�__all__�atexitZdoctest�osZunittest�ELLIPSISZNORMALIZE_WHITESPACEZREPORT_NDIFFZ DOCTEST_FLAGS��r��r��/usr/lib/python3.6/test_docs.py��s�� PK��je[��ٺ��*��tests/__pycache__/test_lxml.cpython-36.pycnu��[��3 6]U ��@��s��d�Z�ddlZddlZyddlZdZejjZW�n*�ek rV�Z �zdZdZW�Y�ddZ [ X�nX�erlddl mZmZ�ddl mZmZ�ddlmZmZmZ�ddlmZ�dd lmZ�dd lmZmZmZmZ�ee�d�G�dd ��d ee��Zee�d�G�dd��dee��ZdS�)z@Tests to ensure that the lxml tree builder generates good trees.��NTF)�LXMLTreeBuilder�LXMLTreeBuilderForXML)� BeautifulSoup�BeautifulStoneSoup)�Comment�Doctype�SoupStrainer)�skipIf)�test_htmlparser)�HTMLTreeBuilderSmokeTest�XMLTreeBuilderSmokeTest�SoupTestr ��z;lxml seems not to be present, not testing its tree builder.c��@��sP��e�Zd�ZdZedd��Zdd��Zdd��Zee �p6e dk�d�d d��Zdd��ZdS�)�LXMLTreeBuilderSmokeTestz!See ``HTMLTreeBuilderSmokeTest``.c��C��s��t��S�)N)r��)�self��r��/usr/lib/python3.6/test_lxml.py�default_builder%��s��z(LXMLTreeBuilderSmokeTest.default_builderc��C��s(��|�j�dd��|�j�dd��|�j�dd��d�S�)Nz
foo�bar
z
foobar
z
foo�bar
z
foo�bar
)ZassertSoupEquals)r��r��r��r��test_out_of_range_entity)��s��z1LXMLTreeBuilderSmokeTest.test_out_of_range_entityc��C��s��d�S�)Nr��)r��r��r��r��*test_entities_in_foreign_document_encoding1��s��zCLXMLTreeBuilderSmokeTest.test_entities_in_foreign_document_encoding��r��z@Skipping doctype test for old version of lxml to avoid segfault.c��C��s(��|�j�d�}|jd�}|�jd|j��d�S�)Nz r��)�soup�contents�assertEqual�strip)r��r��Zdoctyper��r��r��test_empty_doctype:��s�� z+LXMLTreeBuilderSmokeTest.test_empty_doctypec��C��sN��t�jdd��}td�}W�d�Q�R�X�|�jdt|j��|�jdt|d�j�k��d�S�)NT)�recordzzz&BeautifulStoneSoup class is deprecatedr��)�warnings�catch_warningsr��r��str�bZ assertTrue�message)r��wr��r��r��r��%test_beautifulstonesoup_is_xml_parserB��s��z>LXMLTreeBuilderSmokeTest.test_beautifulstonesoup_is_xml_parserN)r��r��r��r��) �__name__� __module__�__qualname__�__doc__�propertyr��r��r��r ��LXML_PRESENT�LXML_VERSIONr��r%��r��r��r��r��r��s�� r��z?lxml seems not to be present, not testing its XML tree builder.c��@��s��e�Zd�ZdZedd��ZdS�)�LXMLXMLTreeBuilderSmokeTestz!See ``HTMLTreeBuilderSmokeTest``.c��C��s��t��S�)N)r��)r��r��r��r��r��P��s��z+LXMLXMLTreeBuilderSmokeTest.default_builderN)r&��r'��r(��r)��r*��r��r��r��r��r��r-��J��s��r-��)r��)r)��rer��Z lxml.etreeZlxmlr+��Zetreer,��ImportError�eZbs4.builderr��r��Zbs4r��r��Zbs4.elementr��r��r��Zbs4.testingr ��Z bs4.testsr ��r��r��r ��r��r-��r��r��r��r��s0�� (PK��je[�>��`U��`U��*��tests/__pycache__/test_soup.cpython-36.pycnu��[��3 *6]dO��@��s~��d�Z�ddlmZ�ddlZddlZddlZddlZddlmZm Z �ddl mZmZm Z mZ�ddlZddlmZmZmZ�ddlmZmZ�ddlZyddlmZmZ�d ZW�n&�ek r��Z�z d ZW�Y�ddZ[X�nX�ejd�dko�ejdk�ZG�d d��de�ZG�dd��de�Z G�dd��de�Z G�dd��de�Z!G�dd��dej"�Z#G�dd��de�Z$G�dd��dej"�Z%G�dd��de�Z&G�dd��dej"�Z'dS�)z#Tests of Beautiful Soup as a whole.��)� set_traceN)� BeautifulSoup�BeautifulStoneSoup)�CharsetMetaAttributeValue�ContentMetaAttributeValue�SoupStrainer�NamespacedAttribute)�EntitySubstitution� UnicodeDammit�EncodingDetector)�SoupTest�skipIf)�LXMLTreeBuilder�LXMLTreeBuilderForXMLTF��c��@��s$��e�Zd�Zdd��Zdd��Zdd��ZdS�)�TestConstructorc��C��s"��d}|�j�|�}|�jd|jj��d�S�)Nu ��
éé
u��éé)�soup�assertEqual�h1�string)�self�datar��r��/usr/lib/python3.6/test_soup.py�test_short_unicode_input*��s�� z(TestConstructor.test_short_unicode_inputc��C��s"��d}|�j�|�}|�jd|jj��d�S�)Nz
foo�bar
zfoo�bar)r��r��r��r��)r��r��r��r��r��r��test_embedded_null/��s�� z"TestConstructor.test_embedded_nullc��C��s,��dj�d�}|�j|dgd�}|�jd|j��d�S�)Nu ��Räksmörgåszutf-8)�exclude_encodingszwindows-1252)�encoder��r��original_encoding)r�� utf8_datar��r��r��r��test_exclude_encodings4��s�� z&TestConstructor.test_exclude_encodingsN)�__name__� __module__�__qualname__r��r��r!��r��r��r��r��r��(��s��r��c��@��sF��e�Zd�Zddd�Zdd��Zdd��Zdd ��Zd d��Zdd ��Zdd��Z dS�)�TestWarningsTc��C��s"��|j�tjd�d��}|�j|��d�S�)N�P��)� startswithr��ZNO_PARSER_SPECIFIED_WARNING� assertTrue)r��sZis_there�vr��r��r��_no_parser_specified<��s��z!TestWarnings._no_parser_specifiedc�� C��s>��t�jdd��}|�jd�}W�d�Q�R�X�t|d�j�}|�j|��d�S�)NT)�recordzr��)�warnings�catch_warningsr��str�message�_assert_no_parser_specified)r��wr��msgr��r��r��#test_warning_if_no_parser_specified@��s��z0TestWarnings.test_warning_if_no_parser_specifiedc�� C��s@��t�jdd��}|�jdd�}W�d�Q�R�X�t|d�j�}|�j|��d�S�)NT)r,��z�htmlr��)r-��r.��r��r/��r0��r1��)r��r2��r��r3��r��r��r��*test_warning_if_parser_specified_too_vagueF��s��z7TestWarnings.test_warning_if_parser_specified_too_vaguec�� C��s4��t�jdd��}|�jdd�}W�d�Q�R�X�|�jg�|��d�S�)NT)r,��zzhtml.parser)r-��r.��r��r��)r��r2��r��r��r��r��,test_no_warning_if_explicit_parser_specifiedL��s��z9TestWarnings.test_no_warning_if_explicit_parser_specifiedc��C��sh��t�jdd��}|�jdtd�d�}W�d�Q�R�X�t|d�j�}|�jd|k��|�jd|k��|�jd |j��d�S�) NT)r,��z�b)�parseOnlyTheser��r9�� parse_onlys��) r-��r.��r��r��r/��r0��r(��r��r��)r��r2��r��r3��r��r��r��)test_parseOnlyThese_renamed_to_parse_onlyQ��s��z6TestWarnings.test_parseOnlyThese_renamed_to_parse_onlyc��C��sf��t�jdd��}d}|�j|dd�}W�d�Q�R�X�t|d�j�}|�jd|k��|�jd|k��|�jd|j��d�S�) NT)r,��s��é�utf8)�fromEncodingr��r=��Z from_encoding)r-��r.��r��r/��r0��r(��r��r��)r��r2��r<��r��r3��r��r��r��*test_fromEncoding_renamed_to_from_encodingY��s��z7TestWarnings.test_fromEncoding_renamed_to_from_encodingc��C��s��|�j�t|�jddd��d�S�)NzT)Zno_such_argument)�assertRaises� TypeErrorr��)r��r��r��r��"test_unrecognized_keyword_argumentb��s��z/TestWarnings.test_unrecognized_keyword_argumentN)T) r"��r#��r$��r+��r4��r6��r7��r;��r>��rA��r��r��r��r��r%��:��s�� r%��c��@��s4��e�Zd�Zdd��Zdd��Zdd��Zdd��Zd d ��ZdS�)r%��c��C��s��t�j��}|j}zBtjdd��}|�j|�}W�d�Q�R�X�t|d�j�}|�jd|k��W�d�|j ��X�tjdd��}|�j|�}W�d�Q�R�X�|�j dt|��d�S�)NT)r,��r��zlooks like a filename)�tempfileZNamedTemporaryFile�namer-��r.��r��r/��r0��r(��closer��len)r��Z filehandle�filenamer2��r��r3��r��r��r��test_disk_file_warningh��s�� z#TestWarnings.test_disk_file_warningc��C��s>��t�jdd��}|�jd�}W�d�Q�R�X�|�jtdd��|D��d�S�)NT)r,��s��http://www.crummybytes.com/c��s��s��|�]}d�t�|j�kV��qdS�)zlooks like a URLN)r/��r0��)�.0r2��r��r��r�� }��s��z?TestWarnings.test_url_warning_with_bytes_url..)r-��r.��r��r(��any)r��warning_listr��r��r��r��test_url_warning_with_bytes_urlx��s��z,TestWarnings.test_url_warning_with_bytes_urlc��C��s>��t�jdd��}|�jd�}W�d�Q�R�X�|�jtdd��|D��d�S�)NT)r,��zhttp://www.crummyunicode.com/c��s��s��|�]}d�t�|j�kV��qdS�)zlooks like a URLN)r/��r0��)rH��r2��r��r��r��rI��s��zATestWarnings.test_url_warning_with_unicode_url..)r-��r.��r��r(��rJ��)r��rK��r��r��r��r��!test_url_warning_with_unicode_url��s��z.TestWarnings.test_url_warning_with_unicode_urlc��C��s>��t�jdd��}|�jd�}W�d�Q�R�X�|�jtdd��|D��d�S�)NT)r,��s$��http://www.crummybytes.com/ is greatc��s��s��|�]}d�t�|j�kV��qdS�)zlooks like a URLN)r/��r0��)rH��r2��r��r��r��rI��s��zETestWarnings.test_url_warning_with_bytes_and_space..)r-��r.��r��assertFalserJ��)r��rK��r��r��r��r��%test_url_warning_with_bytes_and_space��s��z2TestWarnings.test_url_warning_with_bytes_and_spacec��C��s>��t�jdd��}|�jd�}W�d�Q�R�X�|�jtdd��|D��d�S�)NT)r,��z%http://www.crummyuncode.com/ is greatc��s��s��|�]}d�t�|j�kV��qdS�)zlooks like a URLN)r/��r0��)rH��r2��r��r��r��rI��s��zGTestWarnings.test_url_warning_with_unicode_and_space..)r-��r.��r��rN��rJ��)r��rK��r��r��r��r��'test_url_warning_with_unicode_and_space��s��z4TestWarnings.test_url_warning_with_unicode_and_spaceN)r"��r#��r$��rG��rL��rM��rO��rP��r��r��r��r��r%��f��s ��c��@��s��e�Zd�Zdd��ZdS�)�TestSelectiveParsingc��C��s.��d}t�d�}|�j||d�}|�j|j��d��d�S�)Nz&NoYes NoYes Yesr8��)r:��s��YesYes Yes)r��r��r��r��)r��markupZstrainerr��r��r��r��test_parse_with_soupstrainer��s��z1TestSelectiveParsing.test_parse_with_soupstrainerN)r"��r#��r$��rS��r��r��r��r��rQ��s��rQ��c��@��sx��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��ZdS�)�TestEntitySubstitutionz1Standalone tests of the EntitySubstitution class.c��C��s ��t�|�_d�S�)N)r ��sub)r��r��r��r��setUp��s��zTestEntitySubstitution.setUpc��C��s��d}|�j�|�jj|�d��d�S�)Nu��foo\u2200☃\u00f5baru��foo∀☃õbar)r��rU��substitute_html)r��r)��r��r��r��test_simple_html_substitution��s��z4TestEntitySubstitution.test_simple_html_substitutionc��C��s&��d}t�|�}|�j|�jj|j�d��d�S�)Ns��foo��z‘’foo“”)r ��r��rU��rW��rR��)r��Zquotes�dammitr��r��r��test_smart_quote_substitution��s��z4TestEntitySubstitution.test_smart_quote_substitutionc��C��s��d}|�j�|�jj|d�|��d�S�)NzWelcome to "my bar"F)r��rU��substitute_xml)r��r)��r��r��r��Itest_xml_converstion_includes_no_quotes_if_make_quoted_attribute_is_false��s��z`TestEntitySubstitution.test_xml_converstion_includes_no_quotes_if_make_quoted_attribute_is_falsec��C��s0��|�j�|�jjdd�d��|�j�|�jjdd�d��d�S�)NZWelcomeTz "Welcome"z Bob's Barz"Bob's Bar")r��rU��r[��)r��r��r��r��6test_xml_attribute_quoting_normally_uses_double_quotes��s��zMTestEntitySubstitution.test_xml_attribute_quoting_normally_uses_double_quotesc��C��s��d}|�j�|�jj|d�d��d�S�)NzWelcome to "my bar"Tz'Welcome to "my bar"')r��rU��r[��)r��r)��r��r��r��Otest_xml_attribute_quoting_uses_single_quotes_when_value_contains_double_quotes��s��zfTestEntitySubstitution.test_xml_attribute_quoting_uses_single_quotes_when_value_contains_double_quotesc��C��s��d}|�j�|�jj|d�d��d�S�)NzWelcome to "Bob's Bar"Tz""Welcome to "Bob's Bar"")r��rU��r[��)r��r)��r��r��r��btest_xml_attribute_quoting_escapes_single_quotes_when_value_contains_both_single_and_double_quotes��s��zyTestEntitySubstitution.test_xml_attribute_quoting_escapes_single_quotes_when_value_contains_both_single_and_double_quotesc��C��s��d}|�j�|�jj|�|��d�S�)NzWelcome to "Bob's Bar")r��rU��r[��)r��Zquotedr��r��r��zfoo<bar>)r��rU��r[��)r��r��r��r��'test_xml_quoting_handles_angle_brackets��s�� z>TestEntitySubstitution.test_xml_quoting_handles_angle_bracketsc��C��s��|�j�|�jjd�d��d�S�)NzAT&TzAT&T)r��rU��r[��)r��r��r��r��#test_xml_quoting_handles_ampersands��s��z:TestEntitySubstitution.test_xml_quoting_handles_ampersandsc��C��s��|�j�|�jjd�d��d�S�)NzÁT&TzÁT&T)r��rU��r[��)r��r��r��r��Etest_xml_quoting_including_ampersands_when_they_are_part_of_an_entity��s�� z\TestEntitySubstitution.test_xml_quoting_including_ampersands_when_they_are_part_of_an_entityc��C��s��|�j�|�jjd�d��d�S�)NzÁT&TzÁT&T)r��rU��Z"substitute_xml_containing_entities)r��r��r��r��Dtest_xml_quoting_ignoring_ampersands_when_they_are_part_of_an_entity��s�� z[TestEntitySubstitution.test_xml_quoting_ignoring_ampersands_when_they_are_part_of_an_entityc��C��s��d}|�j�|�jj|�|��dS�)z:There's no need to do this except inside attribute values.zBob's "bar"N)r��rU��rW��)r��textr��r��r�� test_quotes_not_html_substituted��s��z7TestEntitySubstitution.test_quotes_not_html_substitutedN)r"��r#��r$��__doc__rV��rX��rZ��r\��r]��r^��r_��r`��ra��rb��rc��rd��rf��r��r��r��r��rT��s��rT��c��sN��e�Zd�Z��fdd�Zdd��Zdd��Zdd��Zd d ��Zee d�dd ��Z ��ZS�)�TestEncodingConversionc��s4��t�t|��j��d|�_|�jjd�|�_|�j|�jd��d�S�)NuU��Sacré bleu!zutf-8sU��Sacré bleu!)�superrh��rV��unicode_datar��r ��r��)r��)� __class__r��r��rV��s��zTestEncodingConversion.setUpc��C��s��t�jj}tjtj��zbdd��}|t�j_d}|�j|�}|j��}|�jt |t ��|�j||�j|j��|�j|j j��d��W�d�tjtj��|t�j_X�d�S�)Nc��S��s��d�S�)Nr��)r/��r��r��r��noop��s��z>TestEncodingConversion.test_ascii_in_unicode_out..noops��azutf-8)�bs4rY��chardet_dammit�logging�disable�WARNINGr��decoder(�� isinstancer/��r��Zdocument_forr��lower�NOTSET)r��chardetrl��asciiZsoup_from_asciiZunicode_outputr��r��r��test_ascii_in_unicode_out��s�� z0TestEncodingConversion.test_ascii_in_unicode_outc��C��s@��|�j�|�j�}|�j|j��|�j��|�j|jjd��|�j|jd��d�S�)Nu��Sacré bleu!)r��rj��r��rr��foor��r��)r��soup_from_unicoder��r��r��test_unicode_in_unicode_out��s��z2TestEncodingConversion.test_unicode_in_unicode_outc��C��s2��|�j�|�j�}|�j|j��|�j��|�j|jjd��d�S�)Nu��Sacré bleu!)r��r ��r��rr��rj��ry��r��)r��Zsoup_from_utf8r��r��r��test_utf8_in_unicode_out��s��z/TestEncodingConversion.test_utf8_in_unicode_outc��C��s$��|�j�|�j�}|�j|jd�|�j��d�S�)Nzutf-8)r��rj��r��r��r ��)r��rz��r��r��r�� test_utf8_out��s��z$TestEncodingConversion.test_utf8_outzQBad HTMLParser detected; skipping test of non-ASCII characters in attribute name.c��C��s(��d}|�j�|�j|�jjd�|jd��d�S�)Nu ��
r<��)r��r��Zdivr��)r��rR��r��r��r��1test_attribute_name_containing_unicode_characters��s��zHTestEncodingConversion.test_attribute_name_containing_unicode_characters)r"��r#��r$��rV��rx��r{��r|��r}��r ��PYTHON_3_PRE_3_2r~�� __classcell__r��r��)rk��r��rh��s�� rh��c��@��s��e�Zd�ZdZdd��Zdd��Zdd��Zdd ��Zd d��Zdd ��Z dd��Z dd��Zdd��Zdd��Z dd��Zdd��Zdd��Zdd��Zdd��Zd d!��Zd"d#��Zd$S�)%�TestUnicodeDammitz"Standalone tests of UnicodeDammit.c��C��s��d}t�|�}|�j|j|��d�S�)Nu��I'm already Unicode! ☃)r ��r��unicode_markup)r��rR��rY��r��r��r��test_unicode_input"��s��z$TestUnicodeDammit.test_unicode_inputc��C��s��d}t�|�}|�j|jd��d�S�)Ns��z#\u2018\u2019\u201c\u201d)r ��r��r��)r��rR��rY��r��r��r��test_smart_quotes_to_unicode'��s��z.TestUnicodeDammit.test_smart_quotes_to_unicodec��C��s"��d}t�|dd�}|�j|jd��d�S�)Ns��Zxml)�smart_quotes_toz+‘’“”)r ��r��r��)r��rR��rY��r��r��r��!test_smart_quotes_to_xml_entities-��s��z3TestUnicodeDammit.test_smart_quotes_to_xml_entitiesc��C��s"��d}t�|dd�}|�j|jd��d�S�)Ns��r5��)r��z'‘’“”)r ��r��r��)r��rR��rY��r��r��r��"test_smart_quotes_to_html_entities3��s��z4TestUnicodeDammit.test_smart_quotes_to_html_entitiesc��C��s"��d}t�|dd�}|�j|jd��d�S�)Ns��rw��)r��z''"")r ��r��r��)r��rR��rY��r��r��r��test_smart_quotes_to_ascii9��s��z,TestUnicodeDammit.test_smart_quotes_to_asciic��C��s0��d}t�|�}|�j|jj��d��|�j|jd��d�S�)Ns��Sacré bleu! ☃zutf-8u��Sacré bleu! ☃)r ��r��r��rt��r��)r��r<��rY��r��r��r��test_detect_utf8?��s��z"TestUnicodeDammit.test_detect_utf8c��C��s4��d}t�|dg�}|�j|jj��d��|�j|jd��d�S�)Ns��z iso-8859-8z\u05dd\u05d5\u05dc\u05e9)r ��r��r��rt��r��)r��hebrewrY��r��r��r��test_convert_hebrewF��s��z%TestUnicodeDammit.test_convert_hebrewc��C��s6��d}t�|�}|�j|jj��d��|�j|jjd�|��d�S�)Ns��ケータイ Watchzutf-8)r ��r��r��rt��r��r��)r��utf_8rY��r��r��r��/test_dont_see_smart_quotes_where_there_are_noneL��s��zATestUnicodeDammit.test_dont_see_smart_quotes_where_there_are_nonec��C��s,��dj�d�}t|dg�}|�j|jj��d��d�S�)Nu ��Räksmörgåszutf-8z iso-8859-8)r��r ��r��r��rt��)r��r ��rY��r��r��r�� test_ignore_inappropriate_codecsR��s�� z2TestUnicodeDammit.test_ignore_inappropriate_codecsc��C��s:��dj�d�}x*dD�]"}t||g�}|�j|jj��d��qW�d�S�)Nu ��Räksmörgåszutf-8�.utf8�...� utF---16.!)r��r��r��)r��r ��r��r��rt��)r��r ��Zbad_encodingrY��r��r��r��test_ignore_invalid_codecsW��s�� z,TestUnicodeDammit.test_ignore_invalid_codecsc��C��sL��dj�d�}t|dgd�}|�j|jj��d��t|ddgd�}|�j|jd��d�S�)Nu ��Räksmörgåszutf-8)r��zwindows-1252)r��r ��r��r��rt��)r��r ��rY��r��r��r��r!��]��s�� z(TestUnicodeDammit.test_exclude_encodingsc��C��s"��t�d�}t|j�}d|kst�d�S�)Ns'��u��utf-�)r��list� encodings�AssertionError)r��Zdetectedr��r��r��r��Ptest_encoding_detector_replaces_junk_in_encoding_name_with_replacement_characterk��s�� zbTestUnicodeDammit.test_encoding_detector_replaces_junk_in_encoding_name_with_replacement_characterc��C��s,��x&dD�]}t�|dd�}|�jd|j��qW�d�S�) N�&��&��$��#��T)Zis_htmlzeuc-jp)r��r��r��r��)r ��r��r��)r��r��rY��r��r��r�� test_detect_html5_style_meta_tagq��s��z2TestUnicodeDammit.test_detect_html5_style_meta_tagc��C��s��d}t�jj}tjtj��zPdd��}|t�j_t|�}|�jd|j��|�j d|j k��t|d�}|�j |j��W�d�tjtj��|t�j_X�d�S�)NsT�� بتر ��ѐ��c��S��s��d�S�)Nr��)r/��r��r��r��rl��s��zBTestUnicodeDammit.test_last_ditch_entity_replacement..noopTz\ufffdzhtml.parser) rm��rY��rn��ro��rp��rq��r ��r��Zcontains_replacement_charactersr(��r��r��ru��)r��docrv��rl��rY��r��r��r��r��"test_last_ditch_entity_replacement|��s�� z4TestUnicodeDammit.test_last_ditch_entity_replacementc��C��s,��d}t�|�}|�jd|j��|�jd|j��d�S�)Ns��<�a�>��<�/�a�>�u��áézutf-16le)r ��r��r��r��)r��r��rY��r��r��r��test_byte_order_mark_removed��s��z.TestUnicodeDammit.test_byte_order_mark_removedc��C��sP��dj�d�}dj�d�}||�|�}|�jt|jd��tj|�}|�jd|jd��d�S�)Nu��☃r��r<��u��“Hi, I like Windows!”�windows_1252u+��☃☃☃“Hi, I like Windows!”☃☃☃u ��☃☃☃)r��r?��UnicodeDecodeErrorrr��r �� detwingler��)r��r<��r��r��Zfixedr��r��r��test_detwingle��s�� z TestUnicodeDammit.test_detwinglec��C��sB��x��s6��,/ E<�/PK��je[= �u��u��*��tests/__pycache__/test_docs.cpython-36.pycnu��[��3 ��O+��@��sD��d�Z�eZdgZddlZddlZddlZddlZejej B�ej B�ZdS�)zTest harness for doctests.Zadditional_tests��N)�__doc__�typeZ __metaclass__�__all__�atexitZdoctest�osZunittest�ELLIPSISZNORMALIZE_WHITESPACEZREPORT_NDIFFZ DOCTEST_FLAGS��r��r��/usr/lib/python3.6/test_docs.py��s�� PK��je[��Z��Z��4��tests/__pycache__/test_html5lib.cpython-36.opt-1.pycnu��[��3 6]+��@��s��d�Z�ddlZyddlmZ�dZW�n&�ek rF�Z�z dZW�Y�ddZ[X�nX�ddlmZ�ddl m Z mZmZ�ee�d�G�d d ��d ee ��Z dS�)zDTests to ensure that the html5lib tree builder generates good trees.��N)�HTML5TreeBuilderTF)�SoupStrainer)�HTML5TreeBuilderSmokeTest�SoupTest�skipIfz?html5lib seems not to be present, not testing its tree builder.c��@��sl��e�Zd�ZdZedd��Zdd��Zdd��Zdd ��Zd d��Z dd ��Z dd��Zdd��Zdd��Z dd��Zdd��ZdS�)�HTML5LibBuilderSmokeTestz"See ``HTML5TreeBuilderSmokeTest``.c��C��s��t��S�)N)r��)�self��r ��#/usr/lib/python3.6/test_html5lib.py�default_builder��s��z(HTML5LibBuilderSmokeTest.default_builderc��C��sd��t�d�}d}tjdd��}|�j||d�}W�d�Q�R�X�|�j|j��|�j|��|�jdt|d�j �k��d�S�)N�bz
A bold statement.
T)�record)Z parse_onlyz4the html5lib tree builder doesn't support parse_onlyr��) r��warnings�catch_warnings�soup�assertEqual�decodeZdocument_forZ assertTrue�str�message)r��Zstrainer�markup�wr��r ��r ��r ��test_soupstrainer��s��z*HTML5LibBuilderSmokeTest.test_soupstrainerc��C��s��d}|�j�|d��|�j�d��dS�)z8html5lib inserts tags where other parsers don't.z[z�
Here's another table:
foo
Here's another table:
foo
z{
Foo
Bar
Baz
N)ZassertSoupEquals)r��r��r ��r ��r ��test_correctly_nested_tables(��s��z5HTML5LibBuilderSmokeTest.test_correctly_nested_tablesc��C��s$��d}|�j�|�}|�jd|jj��d�S�)Nzy
foo
s ��
foo
)r��r��p�encode)r��r��r��r ��r ��r ��(test_xml_declaration_followed_by_doctype<��s�� zAHTML5LibBuilderSmokeTest.test_xml_declaration_followed_by_doctypec��C��s:��d}|�j�|�}|�jd|jj��|�jdt|jd��d�S�)Nz%
foo

bar
zD
foo

bar
��r��)r��r��bodyr��len�find_all)r��r��r��r ��r ��r ��test_reparented_markupJ��s�� z/HTML5LibBuilderSmokeTest.test_reparented_markupc��C��s:��d}|�j�|�}|�jd|jj��|�jdt|jd��d�S�)Nz&
foo

bar
zE
foo

bar
r��r��)r��r��r��r��r��r��)r��r��r��r ��r ��r ��+test_reparented_markup_ends_with_whitespaceQ��s�� zDHTML5LibBuilderSmokeTest.test_reparented_markup_ends_with_whitespacec��C��s0��d}|�j�|�}|jdd�\}}|jd�\}}dS�)z�Verify that we keep the two whitespace nodes in this document distinct when reparenting the adjacent tags. z,

� )�stringZtbodyN)r��r��)r��r��r��Zspace1Zspace2Ztbody1Ztbody2r ��r ��r ��aftermath

aftermath

�target)r#Z aftermath��)r�noscriptrZnext_element�findrZprevious_element)rrrr(r%Zfinal_aftermathr r r �*test_reparented_markup_containing_childrenbs zCHTML5LibBuilderSmokeTest.test_reparented_markup_containing_childrencCsd}|j|�}dS)z(Processing instructions become comments.sN)r)rrrr r r �test_processing_instructionrs z4HTML5LibBuilderSmokeTest.test_processing_instructioncCs,d}|j|�}|jd�\}}|j||�dS)Ns

�a)rrr)rrrZa1Za2r r r �test_cloned_multivalue_nodexs z4HTML5LibBuilderSmokeTest.test_cloned_multivalue_nodecCs$d}|j|�}|jd|jj��dS)NsAz>A
)rrrr)rrrr r r �test_foster_parentings z.HTML5LibBuilderSmokeTest.test_foster_parentingN)�__name__� __module__�__qualname__�__doc__�propertyrrrrr r!r$r*r+r-r.r r r r rs r)r2rZbs4.builderrZHTML5LIB_PRESENT�ImportError�eZbs4.elementrZbs4.testingrrrrr r r r �sPK�je[]_@u� � 6tests/__pycache__/test_htmlparser.cpython-36.opt-1.pycnu�[��3 Y=K[��@sfdZddlmZddlZddlmZmZddlmZddl m Z Gdd�dee�ZGd d �d e�ZdS)zGTests to ensure that the html.parser tree builder generates good trees.�)� set_traceN)�SoupTest�HTMLTreeBuilderSmokeTest)�HTMLParserTreeBuilder)�BeautifulSoupHTMLParserc@s@eZdZedd��Zdd�Zdd�Zdd�Zd d �Zdd�Z d S)�HTMLParserTreeBuilderSmokeTestcCst�S)N)r)�self�r �%/usr/lib/python3.6/test_htmlparser.py�default_buildersz.HTMLParserTreeBuilderSmokeTest.default_buildercCsdS)Nr )rr r r �test_namespaced_system_doctypesz=HTMLParserTreeBuilderSmokeTest.test_namespaced_system_doctypecCsdS)Nr )rr r r �test_namespaced_public_doctypesz=HTMLParserTreeBuilderSmokeTest.test_namespaced_public_doctypecCs<|jd�}tj|d�}tj|�}|jt|jt|j��dS)zfUnlike most tree builders, HTMLParserTreeBuilder and will be restored after pickling. z foo�N)Zsoup�pickle�dumps�loadsZ assertTrue� isinstanceZbuilder�type)rZtreeZdumpedZloadedr r r �test_builder_is_pickleds z6HTMLParserTreeBuilderSmokeTest.test_builder_is_pickledcCs|jdd�|jdd�dS)Nz

z

z

�)�assertSoupEquals)rr r r �)test_redundant_empty_element_closing_tags!szHHTMLParserTreeBuilderSmokeTest.test_redundant_empty_element_closing_tagscCs|jdd�dS)Nz foo &# barzfoo &# bar)r)rr r r �test_empty_element%sz1HTMLParserTreeBuilderSmokeTest.test_empty_elementN) �__name__� __module__�__qualname__�propertyrrr rrrr r r r r s rc@seZdZdd�ZdS)�TestHTMLParserSubclasscCst�}|jd�dS)zlVerify that our HTMLParser subclass implements error() in a way that doesn't cause a crash. zdon't crashN)r�error)r�parserr r r � test_error,sz!TestHTMLParserSubclass.test_errorN)rrrr r r r r r+sr) �__doc__ZpdbrrZbs4.testingrrZbs4.builderrZbs4.builder._htmlparserrrrr r r r �s!PK�je[0�iWXX*tests/__pycache__/test_tree.cpython-36.pycnu�[��3 6]�8�@sdZddlmZddlZddlZddlZddlZddlmZddl m Z mZddlm Z mZmZmZmZmZmZmZddlmZmZe jd�dk Ze jd �dk ZGd d�de�ZGdd �d e�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�Z Gdd�de�Z!Gdd�de�Z"Gdd�de�Z#Gdd�de#�Z$Gdd�de#�Z%Gd d!�d!e�Z&Gd"d#�d#e&�Z'Gd$d%�d%e&�Z(Gd&d'�d'e�Z)Gd(d)�d)e�Z*Gd*d+�d+e�Z+Gd,d-�d-e�Z,Gd.d/�d/e�Z-Gd0d1�d1e�Z.Gd2d3�d3e�Z/Gd4d5�d5e�Z0Gd6d7�d7e�Z1dS)8a8Tests for Beautiful Soup's tree traversal methods. The tree traversal methods are the main advantage of using Beautiful Soup over just using a parser. Different parsers will build different Beautiful Soup trees given the same markup, but all Beautiful Soup trees can be traversed with the methods tested here. �)� set_traceN)� BeautifulSoup)�builder_registry�HTMLParserTreeBuilder)�PY3K�CData�Comment�Declaration�Doctype�NavigableString�SoupStrainer�Tag)�SoupTest�skipIfZxmlZlxmlc@seZdZdd�Zdd�ZdS)�TreeTestcCs|jdd�|D�|�dS)z�Make sure that the given tags have the correct text. This is used in tests that define a bunch of tags, each containing a single string, and then select certain strings by some mechanism. cSsg|] }|j�qS�)�string)�.0�tagrr�/usr/lib/python3.6/test_tree.py� 2sz*TreeTest.assertSelects..N)�assertEqual)�self�tags�should_matchrrr� assertSelects+szTreeTest.assertSelectscCs|jdd�|D�|�dS)z�Make sure that the given tags have the correct IDs. This is used in tests that define a bunch of tags, each containing a single string, and then select certain strings by some mechanism. cSsg|]}|d�qS)�idr)rrrrrr;sz-TreeTest.assertSelectsIDs..N)r)rrrrrr�assertSelectsIDs4szTreeTest.assertSelectsIDsN)�__name__� __module__�__qualname__rrrrrrr)s rc@s8eZdZdZdd�Zdd�Zdd�Zdd �Zd d�ZdS) �TestFindz�Basic tests of the find() method. find() just calls find_all() with limit=1, so it's not tested all that thouroughly here. cCs"|jd�}|j|jd�jd�dS)Nz 1234�b�2)�soupr�findr)rr$rrr� test_find_tagEs zTestFind.test_find_tagcCs"|jd�}|j|jdd�d�dS)Nu

Räksmörgås

u Räksmörgås)r)r$rr%)rr$rrr�test_unicode_text_findIs zTestFind.test_unicode_text_findcCs,|jd�}t|�|jd|jdd�j�dS)Nu&
here it is
z here it isu Räksmörgås)r)r$�strrr%�text)rr$rrr�test_unicode_attribute_findMs z$TestFind.test_unicode_attribute_findcCs"|jd�}|jdt|j��dS)z)Test an optimization that finds all tags.zfoobar�N)r$r�len�find_all)rr$rrr�test_find_everythingSs zTestFind.test_find_everythingcCs$|jd�}|jdt|jd��dS)z;Test an optimization that finds all tags with a given name.zfoobarbazr+�aN)r$rr,r-)rr$rrr�test_find_everything_with_nameXs z'TestFind.test_find_everything_with_nameN) rrr �__doc__r&r'r*r.r0rrrrr!>sr!c@s8eZdZdZdd�Zdd�Zdd�Zdd �Zd d�ZdS) �TestFindAllz%Basic tests of the find_all() method.cCs�|jd�}|j|jdd�dg�|j|jdd�dg�|j|jddgd�ddg�|j|jtjd�d�dddg�|j|jdd�dddg�d S) z'You can search the tree for text nodes.uFoobar»�bar)r)r)�Fooz.*�»TN)r$rr-�re�compile)rr$rrr�test_find_all_text_nodes`s z$TestFindAll.test_find_all_text_nodescCs�|jd�}|j|jddd�dddg�|j|jddd�dg�|j|jdd d�dddd dg�|j|jddd�dddd dg�d S)z7You can limit the number of items returned by find_all.z(1 2 3 4 5r/�)�limit�1r#�3�� 4�5rN)r$rr-)rr$rrr�test_find_all_limitps zTestFindAll.test_find_all_limitcCs:|jd�}|j|ddd�dg�|j|jdd�dg�dS) Nz!123r/r=)r:r;�foo)rr<)r$rr")rr$rrr�%test_calling_a_tag_is_calling_findall|s z1TestFindAll.test_calling_a_tag_is_calling_findallcCs.|jd�}g}|j|�|jg|j|��dS)Nz)r$�appendrr-)rr$�lrrr�Ttest_find_all_with_self_referential_data_structure_does_not_cause_infinite_recursion�s z`TestFindAll.test_find_all_with_self_referential_data_structure_does_not_cause_infinite_recursioncCs^|jd�}|jd�}|jt|d��|jd�}|jt|d��|jdd�}|jt|d��dS)z%All find_all calls return a ResultSetzr/�sourceTrB)r)N)r$r-� assertTrue�hasattr)rr$�resultrrr�test_find_all_resultset�s z#TestFindAll.test_find_all_resultsetN) rrr r1r8rArCrFrKrrrrr2]s r2c@seZdZdd�ZdS)�TestFindAllBasicNamespacescCs<|jd�}|jd|jd�j�|jd|jddid�j�dS)Nz04r?zmathml:msqrtr/zsvg:fillZred)�attrs)r$rr%r�name)rr$rrr�test_find_by_namespaced_name�s z7TestFindAllBasicNamespaces.test_find_by_namespaced_nameN)rrr rOrrrrrL�srLcspeZdZdZ�fdd�Zdd�Zdd�Zdd �Zd d�Zdd �Z dd�Z dd�Zdd�Zdd�Z dd�Z�ZS)�TestFindAllByNamez&Test ways of finding tags by tag name.cstt|�j�|jd�|_dS)Nz�First tag. Second tag. Third Nested tag. tag.)�superr�setUpr$�tree)r)� __class__rrrR�szTestFindAllByName.setUpcCs|j|jjd�ddg�dS)Nr/z First tag.zNested tag.)rrSr-)rrrr�test_find_all_by_tag_name�sz+TestFindAllByName.test_find_all_by_tag_namecCs\|j|jjddd�dg�|j|jjddd�ddg�|j|jjdtjd�d�ddg�dS)Nr/z First tag.)r)TzNested tag.r)rrSr-r6r7)rrrr�test_find_all_by_name_and_text�sz0TestFindAllByName.test_find_all_by_name_and_textcCs|j|jjjd�dg�dS)Nr/zNested tag.)rrS�cr-)rrrr�!test_find_all_on_non_root_element�sz3TestFindAllByName.test_find_all_on_non_root_elementcCs|j|jd�ddg�dS)Nr/z First tag.zNested tag.)rrS)rrrr�%test_calling_element_invokes_find_all�sz7TestFindAllByName.test_calling_element_invokes_find_allcCs |j|jjtd��ddg�dS)Nr/z First tag.zNested tag.)rrSr-r)rrrr�test_find_all_by_tag_strainer�sz/TestFindAllByName.test_find_all_by_tag_strainercCs"|j|jjddg�dddg�dS)Nr/r"z First tag.zSecond tag.zNested tag.)rrSr-)rrrr�test_find_all_by_tag_names�sz,TestFindAllByName.test_find_all_by_tag_namescCs$|j|jjddd��dddg�dS)NT)r/r"z First tag.zSecond tag.zNested tag.)rrSr-)rrrr�test_find_all_by_tag_dict�sz+TestFindAllByName.test_find_all_by_tag_dictcCs$|j|jjtjd��dddg�dS)Nz^[ab]$z First tag.zSecond tag.zNested tag.)rrSr-r6r7)rrrr�test_find_all_by_tag_re�sz)TestFindAllByName.test_find_all_by_tag_recCs,dd�}|jd�}|j|j|�ddg�dS)NcSs|j|jd�kS)Nr)rN�get)rrrr�id_matches_name�szRTestFindAllByName.test_find_all_with_tags_matching_method..id_matches_namez�Match 1. Does not match. Match 2.zMatch 1.zMatch 2.)r$rr-)rr_rSrrr�'test_find_all_with_tags_matching_method�s z9TestFindAllByName.test_find_all_with_tags_matching_methodcCsx|jd�}|jdd�}|jdtjd��}|jdddg�\}}|jd|j�|jd|j�|jd|j�|jd|j�dS)NzH
1
2
3
�divza dza br<r;)r$r%r6r7r-rr)rr$Zr1Zr2Zr3Zr4rrr�%test_find_with_multi_valued_attribute�sz7TestFindAllByName.test_find_with_multi_valued_attribute)rrr r1rRrUrVrXrYrZr[r\r]r`rb� __classcell__rr)rTrrP�s rPc@s�eZdZdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�Zdd�Zdd �Zd!S)"�TestFindAllByAttributecCs&|jd�}|j|jdd�ddg�dS)Nz� Matching a. Non-matching Matching b.a. �first)rzMatching a.zMatching b.)r$rr-)rrSrrr�test_find_all_by_attribute_name�sz6TestFindAllByAttribute.test_find_all_by_attribute_namecCstdjd�}djd�}|j|�}|j|jg|j|d��|j|jg|j|jd�d��|j|jg|j|dgd��dS)Nuםולש�utf8u)�titlezsomething else)�encoder$rr/r-�decode)rZpeace�datar$rrr�%test_find_all_by_utf8_attribute_value�s zName match. Class match. Non-match. A tag called 'name1'. Zname1)rNzA tag called 'name1'.rN)rMzName match.�classZclass2zClass match.)r$rr-)rrSrrr�test_find_all_by_attribute_dictsz6TestFindAllByAttribute.test_find_all_by_attribute_dictcCs�|jd�}|j|jddd�dg�|j|jddd�dg�|j|jdd d�dg�|j|jdd�dg�|j|jdd �ddg�|j|jdd�dg�|j|jdd �dg�dS)Nz� Class 1. Class 2. Class 1. Class 3 and 4. r/r;)�class_zClass 1.rWr<zClass 3 and 4.r?)rM)r$rr-)rrSrrr�test_find_all_by_classsz-TestFindAllByAttribute.test_find_all_by_classcCst|jd�}|jdtjd�d�}|j|dg�|jdtjd�d�}|j|dg�|jdtjd�d�}|j|dg�dS)Nz#Found itZgar�o)rozFound itr/zo b)r$r-r6r7r)rrS�frrr�0test_find_by_class_when_multiple_classes_present-s zGTestFindAllByAttribute.test_find_by_class_when_multiple_classes_presentcCsd|jd�}|j|jdtjd��dg�dd�}|j|jd|�g�dd�}|j|jd|�dg�dS) NzFound itr/ZbazFound itcSst|�dkS)Nr9)r,)�valuerrr�big_attribute_value@sznTestFindAllByAttribute.test_find_all_with_non_dictionary_for_attrs_finds_by_class..big_attribute_valuecSst|�dkS)Nr9)r,)rtrrr�small_attribute_valueEszpTestFindAllByAttribute.test_find_all_with_non_dictionary_for_attrs_finds_by_class..small_attribute_value)r$rr-r6r7)rr$rurvrrr�:test_find_all_with_non_dictionary_for_attrs_finds_by_class;s zQTestFindAllByAttribute.test_find_all_with_non_dictionary_for_attrs_finds_by_classcCs�|jd�}|jd�\}}|j||g|jdd��|j|g|jdd��|j|g|jddd��|j|g|jdd��|jg|jdd��dS)Nz*r/rBr3zfoo bar)rozbar foo)r$r-r)rr$r/Za2rrr�:test_find_all_with_string_for_attrs_finds_multiple_classesKs zQTestFindAllByAttribute.test_find_all_with_string_for_attrs_finds_multiple_classescCs0|jd�}tddid�}|j|j|�dg�dS)Nzi Match. Non-match.rre)rMzMatch.)r$rrr-)rrS�strainerrrr�'test_find_all_by_attribute_soupstrainerWsz>TestFindAllByAttribute.test_find_all_by_attribute_soupstrainercCs&|jd�}|j|jddd�dg�dS)Nz�ID present. No ID present. ID is empty.r/)rzNo ID present.)r$rr-)rrSrrr�$test_find_all_with_missing_attribute_sz;TestFindAllByAttribute.test_find_all_with_missing_attributecCs&|jd�}|j|jdd�ddg�dS)Nz�ID present. No ID present. ID is empty.T)rzID present.zID is empty.)r$rr-)rrSrrr�$test_find_all_with_defined_attributegsz;TestFindAllByAttribute.test_find_all_with_defined_attributecCs>|jd�}ddg}|j|jdd�|�|j|jdd�|�dS)Nz[Unquoted attribute. Quoted attribute.zUnquoted attribute.zQuoted attribute.r=)rr;)r$rr-)rrSZexpectedrrr�$test_find_all_with_numeric_attributeps z;TestFindAllByAttribute.test_find_all_with_numeric_attributecCs,|jd�}|j|jdddgd�ddg�dS)Nz�1 2 3 No ID.r;r<r?)r)r$rr-)rrSrrr�(test_find_all_with_list_attribute_valuesysz?TestFindAllByAttribute.test_find_all_with_list_attribute_valuescCs,|jd�}|j|jtjd�d�ddg�dS)Nz�One a. Two as. Mixed as and bs. One b. No ID.z^a+$)rzOne a.zTwo as.)r$rr-r6r7)rrSrrr�5test_find_all_with_regular_expression_attribute_value�szLTestFindAllByAttribute.test_find_all_with_regular_expression_attribute_valuecCsX|jd�}|j}|j|g|jddd��|jg|jddd��|jg|jddd��dS)Nzfoobarfoor/rB)r)r3)r$r/rr-)rr$r/rrr�'test_find_by_name_and_containing_string�s z>TestFindAllByAttribute.test_find_by_name_and_containing_stringcCs*|jd�}|j|jd�|jddd��dS)Nz"foo foor/rB)r))r$rr-)rr$rrr�=test_find_by_name_and_containing_string_when_string_is_buried�s zTTestFindAllByAttribute.test_find_by_name_and_containing_string_when_string_is_buriedcCsB|jd�}|j}|j|g|jddd��|jg|jddd��dS)Nz"foofoor+rB)rr)r=r3)r$r/rr-)rr$r/rrr�,test_find_by_attribute_and_containing_string�s zCTestFindAllByAttribute.test_find_by_attribute_and_containing_stringN)rrr rfrlrnrprsrwrxrzr{r|r}r~rr�r�r�rrrrrd�s rdc@seZdZdZdd�ZdS)� TestIndexzTest Tag.indexcCsN|jd�}|j}x(t|j�D]\}}|j||j|��qW|jt|jd�dS)Nah
Identical Not identical Identical Identical with child Also not identical Identical with child
r=)r$ra� enumerate�contentsr�index�assertRaises� ValueError)rrSra�i�elementrrr� test_index�szTestIndex.test_indexN)rrr r1r�rrrrr��sr�cs`eZdZdZ�fdd�Zdd�Zdd�Zdd �Zd d�Zdd �Z dd�Z dd�Zdd�Z�Z S)�TestParentOperationsz;Test navigation and searching through an element's parents.cs(tt|�j�|jd�|_|jj|_dS)Na1

Start here

)rQr�rRr$rSr"�start)r)rTrrrR�szTestParentOperations.setUpcCsF|j|jjdd�|j|jjjdd�|j|jjjjdd�dS)Nr�bottom�middle�top)rr��parent)rrrr�test_parent�sz TestParentOperations.test_parentcCs |jjd}|j|j|j�dS)Nr)rSr�rr�)rZtop_tagrrr�%test_parent_of_top_tag_is_soup_object�sz:TestParentOperations.test_parent_of_top_tag_is_soup_objectcCs|jd|jj�dS)N)rrSr�)rrrr�test_soup_object_has_no_parent�sz3TestParentOperations.test_soup_object_has_no_parentcCs8|j|jjd�dddg�|j|jjddd�dg�dS)N�ulr�r�r�)r)rr�Zfind_parents)rrrr�test_find_parents�sz&TestParentOperations.test_find_parentscCs8|j|jjd�dd�|j|jjddd�dd�dS)Nr�rr�r�)r)rr��find_parent)rrrr�test_find_parent�sz%TestParentOperations.test_find_parentcCs"|jjdd�}|j|jjd�dS)Nz Start here)r)r")rSr%rr�rN)rr)rrr�test_parent_of_text_element�sz0TestParentOperations.test_parent_of_text_elementcCs(|jjdd�}|j|jd�dd�dS)Nz Start here)r)r�rr�)rSr%rr�)rr)rrr�test_text_element_find_parent�sz2TestParentOperations.test_text_element_find_parentcCs(dd�|jjD�}|j|dddg�dS)NcSs&g|]}|dk rd|jkr|d�qS)Nr)rM)rr�rrrr�sz>TestParentOperations.test_parent_generator..r�r�r�)r��parentsr)rr�rrr�test_parent_generator�sz*TestParentOperations.test_parent_generator)rrr r1rRr�r�r�r�r�r�r�r�rcrr)rTrr��sr�cseZdZ�fdd�Z�ZS)� ProximityTestcstt|�j�|jd�|_dS)NzgOneTwoThree)rQrrRr$rS)r)rTrrrR�szProximityTest.setUp)rrr rRrcrr)rTrr��sr�csTeZdZ�fdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z �ZS)�TestNextOperationscstt|�j�|jj|_dS)N)rQr�rRrSr"r�)r)rTrrrR�szTestNextOperations.setUpcCs*|j|jjd�|j|jjjdd�dS)N�Onerr#)rr��next_element)rrrr� test_next�szTestNextOperations.test_nextcCs |jjdd�}|j|jd�dS)N�Three)r))rSr%rr�)rZlastrrr�test_next_of_last_item_is_none�sz1TestNextOperations.test_next_of_last_item_is_nonecCs|j|jjd�dS)N)rrSr�)rrrr�test_next_of_root_is_nonesz,TestNextOperations.test_next_of_root_is_nonecCsB|j|jjd�ddg�|jjdd�|j|jjdd�dg�dS)Nr"�Twor�r9)r)rr�� find_all_next)rrrr�test_find_all_nextsz%TestNextOperations.test_find_all_nextcCs2|j|jjd�dd�|j|jjdd�d�dS)Nr"rr#r�)r))rr�� find_next)rrrr�test_find_next sz!TestNextOperations.test_find_nextcCs<|jjdd�}|j|jd�jd�|j|jd�ddg�dS)Nr�)r)r"r�r�)rSr%rr�rrr�)rr)rrr�test_find_next_for_text_elementsz2TestNextOperations.test_find_next_for_text_elementcCsF|jjdd�}dd�|jD�}|\}}|j|dd�|j|d�dS)Nr�)r)cSsg|]}|�qSrr)r�noderrrrsz:TestNextOperations.test_next_generator..rr<r�)rSr%Z next_elementsr)rr�Z successorsrr�rrr�test_next_generators z&TestNextOperations.test_next_generator)rrr rRr�r�r�r�r�r�r�rcrr)rTrr��sr�csTeZdZ�fdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z �ZS)�TestPreviousOperationscs"tt|�j�|jjdd�|_dS)Nr�)r))rQr�rRrSr%�end)r)rTrrrRszTestPreviousOperations.setUpcCs*|j|jjdd�|j|jjjd�dS)Nrr<r�)rr��previous_element)rrrr� test_previous!sz$TestPreviousOperations.test_previouscCs|jjd�}|j|jd�dS)N�html)rSr%rr�)rrerrr�#test_previous_of_first_item_is_none%sz:TestPreviousOperations.test_previous_of_first_item_is_nonecCsdS)Nr)rrrr�test_previous_of_root_is_none)sz4TestPreviousOperations.test_previous_of_root_is_nonecCs6|j|jjd�dddg�|j|jjdd�dg�dS)Nr"r�r�r�r=)r)rr��find_all_previous)rrrr�test_find_all_previous/sz-TestPreviousOperations.test_find_all_previouscCs2|j|jjd�dd�|j|jjdd�d�dS)Nr"rr<r�)r))rr�� find_previous)rrrr�test_find_previous7sz)TestPreviousOperations.test_find_previouscCs>|jjdd�}|j|jd�jd�|j|jd�dddg�dS)Nr�)r)r"r�r�)rSr%rr�rrr�)rr)rrr�#test_find_previous_for_text_element;sz:TestPreviousOperations.test_find_previous_for_text_elementcCsh|jjdd�}dd�|jD�}|\}}}}|j|dd�|j|jd�|j|jd�|j|jd �dS) Nr�)r)cSsg|]}|�qSrr)rr�rrrrCszBTestPreviousOperations.test_previous_generator..rr;�body�headr�)rSr%Zprevious_elementsrrN)rr�Zpredecessorsr"r�r�r�rrr�test_previous_generatorAsz.TestPreviousOperations.test_previous_generator)rrr rRr�r�r�r�r�r�r�rcrr)rTrr�sr�cseZdZ�fdd�Z�ZS)�SiblingTestcs4tt|�j�d}tjd�jd|�}|j|�|_dS)Na� z\n\s*�)rQr�rRr6r7�subr$rS)r�markup)rTrrrRPszSiblingTest.setUp)rrr rRrcrr)rTrr�Nsr�csLeZdZ�fdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z �Z S)�TestNextSiblingcs"tt|�j�|jjdd�|_dS)Nr;)r)rQr�rRrSr%r�)r)rTrrrRfszTestNextSibling.setUpcCs|j|jjd�dS)N)rrS�next_sibling)rrrr�!test_next_sibling_of_root_is_nonejsz1TestNextSibling.test_next_sibling_of_root_is_nonecCsB|j|jjdd�|j|jjjdd�|j|jjdd�dS)Nrr#r<z1.1)rr�r�r�)rrrr�test_next_siblingmsz!TestNextSibling.test_next_siblingcCsN|j|jjjd�|jjdd�}|j|jd�|jjdd�}|j|jd�dS)Nz1.1)rr?)rrSr�r�r%)r�nested_spanZ last_spanrrr�test_next_sibling_may_not_existts z/TestNextSibling.test_next_sibling_may_not_existcCs|j|jjd�dd�dS)N�spanrr#)rr��find_next_sibling)rrrr�test_find_next_sibling}sz&TestNextSibling.test_find_next_siblingcCs6|j|jjd�dddg�|j|jjdd�dg�dS)Nr�r#r<r?)r)rr��find_next_siblings)rrrr�test_next_siblings�sz"TestNextSibling.test_next_siblingscCsv|jd�}|jdd�}|j|jjd�|j|jjd�|j|jd�dg�|j|jdd�d�|j|jdd�d�dS)NzFoobarbazr4)r)r"�bazr3�nonesuch)r$r%rr�rNrr�r�)rr$r�rrr�"test_next_sibling_for_text_element�s z2TestNextSibling.test_next_sibling_for_text_element)rrr rRr�r�r�r�r�r�rcrr)rTrr�ds r�csLeZdZ�fdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z �Z S)�TestPreviousSiblingcs"tt|�j�|jjdd�|_dS)Nr?)r)rQr�rRrSr%r�)r)rTrrrR�szTestPreviousSibling.setUpcCs|j|jjd�dS)N)rrS�previous_sibling)rrrr�%test_previous_sibling_of_root_is_none�sz9TestPreviousSibling.test_previous_sibling_of_root_is_nonecCsB|j|jjdd�|j|jjjdd�|j|jjdd�dS)Nrr<r#z3.1)rr�r�r�)rrrr�test_previous_sibling�sz)TestPreviousSibling.test_previous_siblingcCsN|j|jjjd�|jjdd�}|j|jd�|jjdd�}|j|jd�dS)Nz1.1)rr;)rrSr�r�r%)rr�Z first_spanrrr�#test_previous_sibling_may_not_exist�s z7TestPreviousSibling.test_previous_sibling_may_not_existcCs|j|jjd�dd�dS)Nr�rr<)rr��find_previous_sibling)rrrr�test_find_previous_sibling�sz.TestPreviousSibling.test_find_previous_siblingcCs6|j|jjd�dddg�|j|jjdd�dg�dS)Nr�r<r#r;)r)rr��find_previous_siblings)rrrr�test_previous_siblings�sz*TestPreviousSibling.test_previous_siblingscCsv|jd�}|jdd�}|j|jjd�|j|jjd�|j|jd�dg�|j|jdd�d�|j|jdd�d�dS)NzFoobarbazr�)r)r"r4r3r�)r$r%rr�rNrr�r�)rr$r�rrr�&test_previous_sibling_for_text_element�s z:TestPreviousSibling.test_previous_sibling_for_text_element)rrr rRr�r�r�r�r�r�rcrr)rTrr��s r�c@s0eZdZdZdd�Zdd�Zdd�Zdd �Zd S)�TestTagCreationz$Test the ability to create new tags.cCsd|jd�}|jddddid�}|jt|t��|jd|j�|jtddd�|j�|jd|j �dS)Nr�rBr�rNza name)r3rM)r3rN) r$�new_tagrH� isinstancer rrN�dictrMr�)rr$r�rrr�test_new_tag�s zTestTagCreation.test_new_tagcCs�trBtdd�}|jd�}|jd�}|jd|j��|jd|j��tdd�}|jd�}|jd�}|jd|j��|jd|j��dS) Nr�zlxml-xml�br�ps
s
zhtml.parsers
)�XML_BUILDER_PRESENTrr�rri)rZxml_soupZxml_brZxml_pZ html_soupZhtml_brZhtml_prrr�1test_tag_inherits_self_closing_rules_from_builder�s zATestTagCreation.test_tag_inherits_self_closing_rules_from_buildercCs4|jd�}|jd�}|jd|�|jt|t��dS)Nr�rB)r$� new_stringrrHr�r)rr$�srrr�'test_new_string_creates_navigablestring�s z7TestTagCreation.test_new_string_creates_navigablestringcCs6|jd�}|jdt�}|jd|�|jt|t��dS)Nr�rB)r$r�rrrHr�)rr$r�rrr�3test_new_string_can_create_navigablestring_subclass�s zCTestTagCreation.test_new_string_can_create_navigablestring_subclassN)rrr r1r�r�r�r�rrrrr��s r�c@s<eZdZdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�Zdd�Zdd �Zd!d"�Zd#d$�Zd%d&�Zd'd(�Zd)d*�Zd+d,�Zd-d.�Zd/d0�Zd1d2�Zd3d4�Zd5d6�Zd7d8�Zd9d:�Zd;d<�Z d=d>�Z!d?d@�Z"dAdB�Z#dCdD�Z$dEdF�Z%dGdH�Z&dIdJ�Z'dKdL�Z(dMS)N�TestTreeModificationcCsl|jd�}d|jd<|j|j�|jd��|jd=|j|j�|jd��d|jd<|j|j�|jd��dS) Nzr+rzzrBZid2z)r$r/rrj�document_for)rr$rrr�test_attribute_modification�s z0TestTreeModification.test_attribute_modificationcCsltjd��}|jd|d�}t||d�}t||d�}d|d<|jjd|�|jjd |�|j|jj�d �dS)Nr�z )�builderr/�olzhttp://foo.com/Zhrefrr=s4
)r�lookupr$r r��insertrri)rr�r$r/r�rrr�test_new_tag_creation�sz*TestTreeModification.test_new_tag_creationcCs\d}|j|�}|jdd�}|j}|jdd�j|j�|j|j|�|j|j�|jd��dS)NzT
Don't leave me here.

Don't leave!
r#)rzD
Don't leave me .

Don't leave!here
)r$r%r"rDrr�rjr�)r�docr$Zsecond_paraZboldrrr�!test_append_to_contents_moves_tag�s z6TestTreeModification.test_append_to_contents_moves_tagcCs0d}|j|�}|j}|j|j�}|j||�dS)Nz)r$r/�replace_withrWr)rr)r$r/�new_arrr�1test_replace_with_returns_thing_that_was_replaceds zFTestTreeModification.test_replace_with_returns_thing_that_was_replacedcCs,d}|j|�}|j}|j�}|j||�dS)Nz)r$r/�unwrapr)rr)r$r/r�rrr�+test_unwrap_returns_thing_that_was_replaceds z@TestTreeModification.test_unwrap_returns_thing_that_was_replacedcCsJ|jd�}|j}|j�|jd|j�|jt|j�|jt|j|j �dS)NzFooBar) r$r/�extractrr�r�r�r�r�rW)rr$r/rrr�Itest_replace_with_and_unwrap_give_useful_exception_when_tag_has_no_parents z^TestTreeModification.test_replace_with_and_unwrap_give_useful_exception_when_tag_has_no_parentcCs:d}|j|�}|j}|jj|�|j|j�|j|��dS)Nz-Foo )r$rWr�rrjr�)rr)r$rWrrr�test_replace_tag_with_itself's z1TestTreeModification.test_replace_tag_with_itselfcCs&d}|j|�}|jt|jj|j�dS)Nz)r$r�r�r"r�r/)rr)r$rrr�1test_replace_tag_with_its_parent_raises_exception.s zFTestTreeModification.test_replace_tag_with_its_parent_raises_exceptioncCs(d}|j|�}|jt|jjd|j�dS)Nzr)r$r�r�r/r�)rr)r$rrr�,test_insert_tag_into_itself_raises_exception3s zATestTreeModification.test_insert_tag_into_itself_raises_exceptionc Cs�|jd�}d}|j|�}|jd|�x|jD]}t|t�s,t�q,Wt|j�\}}}}|jd|j �|jd|j �|jd|j �|jd|j �dS) z�Inserting one BeautifulSoup object into another actually inserts all of its children -- you'll never combine BeautifulSoup objects. z-
And now, a word:
And we're back.
z
p2
p3
r=zAnd now, a word:�p2�p3zAnd we're back.N) r$r�Zdescendantsr�r�AssertionError�listZchildrenrr) rr$r)Z to_insertr��p1r�r�Zp4rrr�1test_insert_beautifulsoup_object_inserts_children8s zFTestTreeModification.test_insert_beautifulsoup_object_inserts_childrencCsX|jd�}|j}|jd}|jdd�|j\}}|jd�|jd�|jd|jj�dS)Nz
onethree
rr=Ztwor�Zthree)r$r/r�r�ZreplaceWithrr"r)rr$r/r"�left�rightrrr�3test_replace_with_maintains_next_element_throughoutLs zHTestTreeModification.test_replace_with_maintains_next_element_throughoutcCsl|jd�}|jdd�jd�|jdd�}|j}|j|j|�|j|j|�|j|jj|�|j|jd�dS)NzArgh!zArgh!)r)zHooray!)r$r%r�r"rr�r�r�)rr$�new_textr"rrr�test_replace_final_node[s z,TestTreeModification.test_replace_final_nodecCs�|jd�}|jjdd�|j|j�|jd��|jdd�}|j|jd�|j|jj|�|j|j d�|j|j j |�|j|j d�|j|j|j�dS)NzArgh!r=zHooray!z!Argh!Hooray!)r)zArgh!)r$r"r�rrjr�r%r�r�r�r�rW)rr$rrrr�test_consecutive_text_nodeses z0TestTreeModification.test_consecutive_text_nodescCsT|jd�}|jjdd�|jjdd�|jddg|jj�|j|jjdjd�dS)Nzrr3rB)r$r/r�rr�r�)rr$rrr�test_insert_stringzs z'TestTreeModification.test_insert_stringcCs�|j}|jd|d�}t||d�}|jdd�|jjd|�|j|j�|jd��|j}|j|j |�|j|j |�|jdd �}|j|j|�|j|j |�|j}|j|j |�|j|j |�|jdd �}|j|j|�|j|j|�|j|j |�dS) Nz%Findlady!)r�Zmagictagr�ther=z=Findthelady!ZFind)r))Zdefault_builderr$r r�r/rrjr�r"r�r�r%r�r�rWr�)rr�r$Z magic_tagZb_tagr%Zc_tagrrrr�test_insert_tag�s, z$TestTreeModification.test_insert_tagcCs0d}|j|�}|jj|j�|j||j��dS)Nz)r$r/rDr"rrj)rrkr$rrr�*test_append_child_thats_already_at_the_end�s z?TestTreeModification.test_append_child_thats_already_at_the_endcCs2d}|j|�}|jjd|j�|jd|j��dS)Nzrz)r$r/r��drrj)rrkr$rrr�$test_move_tag_to_beginning_of_parent�s z9TestTreeModification.test_move_tag_to_beginning_of_parentcCs.|jd�}|jjdd�|jt|j�d�dS)Nz
r=ZContentsz
Contents
)r$r�r�rr()rr$rrr�&test_insert_works_on_empty_element_tag�s z;TestTreeModification.test_insert_works_on_empty_element_tagcCs`|jd�}|jjd�|jjd�|j|j�|jd��|jj|j�|j|j�|jd��dS)Nzfoobar�BAZ�QUUXzQUUXfooBAZbarzQUUXbarfooBAZ)r$r"� insert_beforer/rrjr�)rr$rrr�test_insert_before�s z'TestTreeModification.test_insert_beforecCs`|jd�}|jjd�|jjd�|j|j�|jd��|jj|j�|j|j�|jd��dS)Nzfoobarrr zfooQUUXbarBAZzQUUXbarfooBAZ)r$r"�insert_afterr/rrjr�)rr$rrr�test_insert_after�s z&TestTreeModification.test_insert_aftercCsR|jd�}|jd�}|jd�}|jt|j|�|jt|j|�|jt|j|�dS)Nr�r/)r$r�r�r�r�r�NotImplementedError)rr$rrrrr�:test_insert_after_raises_exception_if_after_has_no_meaning�s zOTestTreeModification.test_insert_after_raises_exception_if_after_has_no_meaningcCsR|jd�}|jd�}|jd�}|jt|j|�|jt|j|�|jt|j|�dS)Nr�r/)r$r�r�r�r�rr)rr$rrrrr�Ftest_insert_before_raises_notimplementederror_if_before_has_no_meaning�s z[TestTreeModification.test_insert_before_raises_notimplementederror_if_before_has_no_meaningcCsv|jd�}|jd�\}}|j|�|j|j�|jd��|j|jd�|j|j|j�|j|jd�|j|j d�dS)Nz;
There's no business like show business
r"z0
There's business like no business
�noz business) r$r-r�rrjr�r�r�r�r�)rr$rZshowrrr�test_replace_with�s z&TestTreeModification.test_replace_withcCs0d}|j|�}|jj|j�|jd|j��dS)Nzz)r$r"r�rWrrj)rrkr$rrr�test_replace_first_child�s z-TestTreeModification.test_replace_first_childcCs0d}|j|�}|jj|j�|jd|j��dS)Nzz)r$rWr�r"rrj)rrkr$rrr�test_replace_last_child�s z,TestTreeModification.test_replace_last_childcCs|jd�}|j}|j}|j|�|j|j�|jd��|j|jd�|j|jdd�j d�|j|j d�|j|jd�|j|jd�|j|j|j �|j|j d�|j|j j |j�|j|jd�|jdd�}|j}|j|j |�|j|j|�|j|j |�|j|j|�dS)NzQWereservetherighttorefuseservicez-Werefusetoservicer)r)ZWeZto)r$r"rrr�rrjr�r�r%r�r�r�r�r/�e�g)rr$Z remove_tagZmove_tagZto_textZg_tagrrr�test_nested_tag_replace_with�s. z1TestTreeModification.test_nested_tag_replace_withcCs6|jd�}|jj�|j|jd�|j|jjd�dS)NzI
Unneeded formatting is unneeded
zUnneeded formatting is unneeded)r$�emr�rr�r))rrSrrr�test_unwraps z TestTreeModification.test_unwrapcCsF|jd�}|jj|jd��}|j|j�d�|j|j�|jd��dS)NzI wish I was bold.r"zI wish I was bold.)r$r�wrapr�rrjr�)rr$rtrrr� test_wrap"s zTestTreeModification.test_wrapcCs4|jd�}|jjj|j�|j|j�|jd��dS)NzI wish I was bold.zI wish I was bold.)r$r"r�rrrjr�)rr$rrr�%test_wrap_extracts_tag_from_elsewhere)s z:TestTreeModification.test_wrap_extracts_tag_from_elsewherecCsH|jd�}|jjj|j�|jdt|jj��|j|j�|jd��dS)Nz+I like being bold.I wish I was bold.r+z+I like being bold.I wish I was bold.) r$r"r�rrr,r�rjr�)rr$rrr�&test_wrap_puts_new_contents_at_the_end/s z;TestTreeModification.test_wrap_puts_new_contents_at_the_endcCs�|jd�}|jt|jj�d�|jdd�j�}|j|j�d�|j|j�d�|jt|jj�d�|j|jd�|j|j d�|j|j j d�|jdd �}|jd d �}|j|j |�|j|j|�|j|j |�|j|j|�dS)NzRSome content.
Nav crap
More content.r9Znav)rz6Some content. More content.z
Nav crap
r+zSome content. )r)z More content.) r$rr,r�r�r%r�rjr�r�r�r�r�)rr$Z extractedZ content_1Z content_2rrr�test_extract7s"z!TestTreeModification.test_extractcCsz|jd�}|jj}|jj}|jd�}|jd�}|jj|�|jj|�|j�|j�|j||jj�|j||jj�dS)NzfoobarrBr3)r$r/rr"r�rDr�r)rr$Zfoo_1Zbar_1Zfoo_2Zbar_2rrr�4test_extract_distinguishes_between_identical_stringsPs zITestTreeModification.test_extract_distinguishes_between_identical_stringscs8|jd��fdd��jd�D�|jdt�j��dS)Nzv csg|]}�jj��qSr)�scriptr�)rr�)r$rrrmszKTestTreeModification.test_extract_multiples_of_same_tag..r$z )r$r-rr(r�)rr)r$r�"test_extract_multiples_of_same_tagas z7TestTreeModification.test_extract_multiples_of_same_tagcCs.|jd�}|jd�j�|jd|jd��dS)Nz hi r�)r$r%r�r)rr$rrr�Btest_extract_works_when_element_is_surrounded_by_identical_stringsqszWTestTreeModification.test_extract_works_when_element_is_surrounded_by_identical_stringscCsf|jd�}|j}|jj�|jt|jj�d�|jt|d��|j }|jdd�|jdt|j��dS)zTag.clear()z4
String Italicized and another
rr�T)Z decomposeN) r$r/r��clearrr,r�rHrIr)rr$r/rrrr� test_clearzs zTestTreeModification.test_clearcCsB|jd�}d|j_|j|jjdg�d|j_|j|jjdg�dS)zTag.string = 'string'z rBr3N)r$r/rrr�r")rr$rrr�test_string_set�s z$TestTreeModification.test_string_setcCs,|jd�}|jj|j_|j|jj�d�dS)Nzfoobarsbarbar)r$rWrr"rr/ri)rr$rrr�/test_string_set_does_not_affect_original_string�s zDTestTreeModification.test_string_set_does_not_affect_original_stringcCs2|jd�}td�}||j_|jt|jjt��dS)NzrB)r$rr/rrHr�)rr$�cdatarrr�)test_set_string_preserves_class_of_string�s z>TestTreeModification.test_set_string_preserves_class_of_stringN))rrr r�r�r�r�r�r�r�r�r�r�rrrrrrr rrrrrrrrrrrr r!r"r#r%r&r(r)r*r,rrrrr��sL $ r�c@sxeZdZdZdd�Zdd�Zdd�Zdd �Zd d�Zdd �Z dd�Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�ZdS)�TestElementObjectsz)Test various features of element objects.cCsV|jd�}|jt|j�d�|jt|�d�|jt|j�d�|jt|jj�d�dS)z3The length of an element is its number of children.z123r=r9N)r$rr,r�r�)rr$rrr�test_len�s zTestElementObjects.test_lencCsL|jd�}|j|j|jd��|j|jj|jd�jd��|j|jd�dS)z2Accessing a Python member .foo invokes find('foo')zr"r�N)r$rr"r%r�r/)rr$rrr�test_member_access_invokes_find�s z2TestElementObjects.test_member_access_invokes_findcCsP|jd�}tjdd��}|j}WdQRX|j|j|�|jdt|dj��dS)NzT)�recordzp.bTag is deprecated, use .find("b") instead. If you really were looking for a tag called bTag, use .find("bTag")r)r$�warnings�catch_warningsZbTagrr"r(�message)rr$�wrrrr�test_deprecated_member_access�s z0TestElementObjects.test_deprecated_member_accesscCs2|jd�}|j|jjd��|j|jjd��dS)z�has_attr() checks for the presence of an attribute. Please note note: has_attr() is different from __in__. has_attr() checks the tag's attributes and __in__ checks the tag's chidlren. z�attrZattr2N)r$rHrB�has_attr�assertFalse)rr$rrr� test_has_attr�s z TestElementObjects.test_has_attrcCsd}|j|d�dS)Nz%z%)ZassertSoupEquals)rr�rrr�.test_attributes_come_out_in_alphabetical_order�szATestElementObjects.test_attributes_come_out_in_alphabetical_ordercCs|jd�}|j|jjd�dS)Nz foorB)r$rr"r)rr$rrr�test_string�s zTestElementObjects.test_stringcCs|jd�}|j|jjd�dS)Nz)r$rr"r)rr$rrr�test_empty_tag_has_no_string�s z/TestElementObjects.test_empty_tag_has_no_stringcCs`|jd�}|j|jjd�|jd�}|j|jjd�|jd�}|jjdd�|j|jjd�dS)Nzfoozfoobar

foor=r3)r$rr"rr/r�)rr$rrr�-test_tag_with_multiple_children_has_no_string�s z@TestElementObjects.test_tag_with_multiple_children_has_no_stringcCs,|jd�}|j|jjd�|j|jd�dS)Nz

foo

feozN)r$r8r"r)rr$rrr�test_lack_of_string�s z&TestElementObjects.test_lack_of_stringcCs`|jd�}|j|jjd�|j|jjdd�d�|j|jjd�d�|j|jjddd�d�d S) zBTag.text and Tag.get_text(sep=u"") -> all child text, concatenatedzar t zar t T)�stripZart�,z a,r, , t za,r,tN)r$rr/r)�get_text)rr$rrr� test_all_text�s z TestElementObjects.test_all_textcCsJ|jd�}|j|j�d�|j|jttfd�d�|j|jdd�d�dS)NzfoobarZfoobar)�typesZfooIGNOREbar)r$rrBrr)rr$rrr�test_get_text_ignores_comments�s z1TestElementObjects.test_get_text_ignores_commentscCs$|jd�}|jddgt|j��dS)NzfoobarrBr3)r$rr�Zstrings)rr$rrr�!test_all_strings_ignores_commentss z4TestElementObjects.test_all_strings_ignores_commentsN)rrr r1r.r/r5r9r:r;r<r=r>r?rCrErFrrrrr-�s r-c@sPeZdZdZdd�Zdd�Zdd�Zdd �Zd d�Zdd �Z dd�Z dd�ZdS)�TestCDAtaListAttributesz0Testing cdata-list attributes like 'class'. cCs"|jd�}|jdg|jd�dS)NzrBrm)r$rr/)rr$rrr�test_single_value_becomes_list s z6TestCDAtaListAttributes.test_single_value_becomes_listcCs$|jd�}|jddg|jd�dS)NzrBr3rm)r$rr/)rr$rrr�!test_multiple_values_becomes_lists z9TestCDAtaListAttributes.test_multiple_values_becomes_listcCs&|jd�}|jdddg|jd�dS)NzrBr3r�rm)r$rr/)rr$rrr�2test_multiple_values_separated_by_weird_whitespaces zJTestCDAtaListAttributes.test_multiple_values_separated_by_weird_whitespacecCs |jd�}|jd|jj��dS)Nzs)r$rr/ri)rr$rrr�,test_attributes_joined_into_string_on_outputs zDTestCDAtaListAttributes.test_attributes_joined_into_string_on_outputcCs$|jd�}|jdg|jjd��dS)Nzzabc defr)r$rr/Zget_attribute_list)rr$rrr�test_get_attribute_lists z/TestCDAtaListAttributes.test_get_attribute_listcCs$|jd�}|jddg|jd�dS)Nz(z ISO-8859-1zUTF-8zaccept-charset)r$rZform)rr$rrr�test_accept_charset!s z+TestCDAtaListAttributes.test_accept_charsetcCs$d}|j|�}|jd|jd�dS)Nz)zISO-8859-1 UTF-8zaccept-charset)r$rr/)rrkr$rrr�-test_cdata_attribute_applying_only_to_one_tag%s zETestCDAtaListAttributes.test_cdata_attribute_applying_only_to_one_tagcs6|jd�j�|jd�j��fdd�}|jt|�dS)Nr�cs d�_dS)NrB)rNr)rrr�t0szJTestCDAtaListAttributes.test_string_has_immutable_name_property..t)r$rrrNr��AttributeError)rrOr)rr�'test_string_has_immutable_name_property-sz?TestCDAtaListAttributes.test_string_has_immutable_name_propertyN)rrr r1rHrIrJrKrLrMrNrQrrrrrG srGcs`eZdZdZ�fdd�Zdd�Zdd�Zdd �Zd d�Zdd �Z dd�Z dd�Zdd�Z�Z S)�TestPersistencez*Testing features like pickle and deepcopy.cs&tt|�j�d|_|j|j�|_dS)Nay Beautiful Soup: We called him Tortoise because he taught us. foo bar )rQrRrRZpager$rS)r)rTrrrR7szTestPersistence.setUpcCs@tj|jd�}tj|�}|j|jt�|j|j�|jj��dS)Nr+)�pickle�dumpsrS�loadsrrTrrj)r�dumped�loadedrrr�!test_pickle_and_unpickle_identityKs z1TestPersistence.test_pickle_and_unpickle_identitycCs&tj|j�}|j|j�|jj��dS)N)�copy�deepcopyrSrrj)rZcopiedrrr�test_deepcopy_identitySsz&TestPersistence.test_deepcopy_identitycCs:tdd�}|j}|j�}|jdt|��|j||j�dS)Ns

zhtml.parseru

)rZoriginal_encoding�__copy__rr()rr$�encodingrYrrr�test_copy_preserves_encodingXs z,TestPersistence.test_copy_preserves_encodingcCs>d}|j|�}tj|tj�}tj|�}|j|j�|j��dS)Nu ☃)r$rSrTZHIGHEST_PROTOCOLrUrrj)rr�r$rVrWrrr�test_unicode_pickle_s z#TestPersistence.test_unicode_picklecCszd}|j|�}|jdd�}tj|�}|j||�|jd|j�|jd|j�|jd|j�|jd|j�|jd|j�dS)NzFooBarr4)r) r$r%rYrr�r��assertNotEqualr�r�)rr�r$�s1�s2rrr�1test_copy_navigablestring_is_not_attached_to_treegs zATestPersistence.test_copy_navigablestring_is_not_attached_to_treecCs>d}|j|�}|j}tj|�}|j||�|jt|t��dS)Nz)r$rrYrrHr�r)rr�r$rarbrrr�0test_copy_navigablestring_subclass_has_same_typess z@TestPersistence.test_copy_navigablestring_subclass_has_same_typecCs(d}|j|�}tj|�}|j||�dS)Nz)

FooBar

end)r$rYr)rr�r$Z soup_copyrrr�test_copy_entire_soup{s z%TestPersistence.test_copy_entire_soupcCs�d}|j|�}|j}tj|�}|jt|�t|��|j||�|j||k�|jd|j�|jd|j�|jd|jdd�j �|j d|jdd�j �dS)Nz)

FooBar

endZBar)r)r$rarYrr(r8r�r�r%r�r`)rr�r$raZdiv_copyrrr�test_copy_tag_copies_contents�s z-TestPersistence.test_copy_tag_copies_contents)rrr r1rRrXr[r^r_rcrdrerfrcrr)rTrrR4srRc@s�eZdZdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�Zdd�Zdd �Zd!S)"�TestSubstitutionscCs0d}|j|�}|jdd�}|j||jd��dS)Nu#<<Sacré bleu!>>�minimal)� formatter)r$rjrr�)rr�r$�decodedrrr�!test_default_formatter_is_minimal�s z3TestSubstitutions.test_default_formatter_is_minimalcCs0d}|j|�}|jdd�}|j||jd��dS)Nu'
<<Sacré bleu!>>r�)riz.
<<Sacré bleu!>>)r$rjrr�)rr�r$rjrrr�test_formatter_html�s z%TestSubstitutions.test_formatter_htmlcCs0d}|j|�}|jdd�}|j||jd��dS)Nu'
<<Sacré bleu!>>Zhtml5)riz-
<<Sacré bleu!>>)r$rjrr�)rr�r$rjrrr�test_formatter_html5�s z&TestSubstitutions.test_formatter_html5cCs0d}|j|�}|jdd�}|j||jd��dS)Nu#<<Sacré bleu!>>rh)ri)r$rjrr�)rr�r$rjrrr�test_formatter_minimal�s z(TestSubstitutions.test_formatter_minimalcCs0d}|j|�}|jdd�}|j||jd��dS)Nu#<<Sacré bleu!>>)riu<>)r$rjrr�)rr�r$rjrrr�test_formatter_null�s z%TestSubstitutions.test_formatter_nullcCs4d}|j|�}|jdd�d�}|j||jd��dS)Nz!<foo>bar
cSs|j�S)N)�upper)�xrrr��sz9TestSubstitutions.test_formatter_custom..)rizBAR
)r$rjrr�)rr�r$rjrrr�test_formatter_custom�s z'TestSubstitutions.test_formatter_customcCs�d}|j|�}|j}d}|j||j��|j||jdd��d}|j||jdd��|j||jdd��d}|j||jdd �d��dS) Nu%eu)erh)riz/er�u%EcSs|j�S)N)rp)rqrrrrr�szMTestSubstitutions.test_formatter_is_run_on_attribute_values..)r$r/rrj)rr�r$r/Zexpect_minimalZexpect_htmlZexpect_upperrrr�)test_formatter_is_run_on_attribute_values�s z;TestSubstitutions.test_formatter_is_run_on_attribute_valuescCs$d}t|d�j�}|jd|k�dS)NzO zhtml.parsers< < hey > >)rrirH)rr��encodedrrr�2test_formatter_skips_script_tag_for_html_documents�szDTestSubstitutions.test_formatter_skips_script_tag_for_html_documentscCs$d}t|d�j�}|jd|k�dS)NzF zhtml.parsers< < hey > >)rrirH)rr�rurrr�1test_formatter_skips_style_tag_for_html_documents�szCTestSubstitutions.test_formatter_skips_style_tag_for_html_documentscCs |jd�}|jd|jj��dS)Nz*

foo

bar

baz z/

foo

bar

baz

)r$rra�prettify)rr$rrr�,test_prettify_leaves_preformatted_text_alone�s z>TestSubstitutions.test_prettify_leaves_preformatted_text_alonecCs,tdd�}|jdd�d�}|jd|k�dS)Nzfoozhtml.parsercSs|j�S)N)rp)rqrrrrr�szLTestSubstitutions.test_prettify_accepts_formatter_function..)riZFOO)rrxrH)rr$Zprettyrrr�(test_prettify_accepts_formatter_function�s z:TestSubstitutions.test_prettify_accepts_formatter_functioncCs"|jd�}|jtt|j��dS)Nz)r$rr(�typerx)rr$rrr�(test_prettify_outputs_unicode_by_default�s z:TestSubstitutions.test_prettify_outputs_unicode_by_defaultcCs$|jd�}|jtt|jd��dS)Nzzutf-8)r$r�bytesr{rx)rr$rrr�test_prettify_can_encode_datas z/TestSubstitutions.test_prettify_can_encode_datacCs0d}|j|�}|jjd�}|j||jd��dS)NuSacré bleu!zutf-8)r$r"rir)rr�r$rurrr�,test_html_entity_substitution_off_by_defaults z>TestSubstitutions.test_html_entity_substitution_off_by_defaultcCs�d}|j|�}|j|jdd�|jd�}|jd|k�|jd�}|jd|k�|jd�}|jd |k�|jd �jd �}|jd|k�dS)NzEZcontentztext/html; charset=x-sjiszutf-8s charset=utf-8�euc_jpscharset=euc_jpz shift-jisscharset=shift-jiszutf-16zcharset=utf-16)r$r�metarirHrj)rZmeta_tagr$�utf_8r�� shift_jisZutf_16_urrr�test_encoding_substitutions z,TestSubstitutions.test_encoding_substitutioncCs2d}td�}|j||d�}|j|jdjd�dS)Nz`

foo

Zpre)Z parse_onlyr)rr$rr�rN)rr�ryr$rrr�;test_encoding_substitution_doesnt_happen_if_tag_is_strained$szMTestSubstitutions.test_encoding_substitution_doesnt_happen_if_tag_is_strainedN)rrr rkrlrmrnrorsrtrvrwryrzr|r~rr�r�rrrrrg�s rgc@sPeZdZdZdd�Zdd�Zdd�Zdd �Zd d�Zdd �Z dd�Z dd�ZdS)�TestEncodingz0Test the ability to encode objects into strings.cCs.d}|j|�}|j|jjjd�djd��dS)Nu ☃zutf-8u☃)r$rr"rri)rr�r$rrr�"test_unicode_string_can_be_encoded2s z/TestEncoding.test_unicode_string_can_be_encodedcCs,d}|j|�}|j|jjd�|jd��dS)Nu ☃zutf-8)r$rr"ri)rr�r$rrr�1test_tag_containing_unicode_string_can_be_encoded8s z>TestEncoding.test_tag_containing_unicode_string_can_be_encodedcCs&d}|j|�}|j|jjd�d�dS)Nu ☃�asciis☃)r$rr"ri)rr�r$rrr�s zITestEncoding.test_encoding_substitutes_unrecognized_characters_by_defaultcCs&d}|j|�}|jt|jddd�dS)Nu ☃r��strict)�errors)r$r��UnicodeEncodeErrorri)rr�r$rrr� test_encoding_can_be_made_strictCs z-TestEncoding.test_encoding_can_be_made_strictcCs$d}|j|�}|jd|jj��dS)Nu ☃u☃)r$rr"Zdecode_contents)rr�r$rrr�test_decode_contentsIs z!TestEncoding.test_decode_contentscCs.d}|j|�}|jdjd�|jjdd��dS)Nu ☃u☃rg)r])r$rrir"Zencode_contents)rr�r$rrr�test_encode_contentsNs z!TestEncoding.test_encode_contentscCs*d}|j|�}|jdjd�|jj��dS)Nu ☃u☃rg)r$rrir"ZrenderContents)rr�r$rrr�test_deprecated_renderContentsUs z+TestEncoding.test_deprecated_renderContentscCs8d}|j|�}tr$|j|t|��n|jdt|��dS)Nu ☃s \u2603)r$rr�repr)rr�r$rrr� test_repr[s zTestEncoding.test_reprN)rrr r1r�r�r�r�r�r�r�r�rrrrr�/sr�c@s,eZdZdd�Zdd�Zdd�Zdd�Zd S) �TestNavigableStringSubclassescCsX|jd�}td�}|jd|�|jt|�d�|j|jdd�d�|j|jdd�dS)Nr�rBr=z)r)r)r$rr�rr(r%r�)rr$r+rrr� test_cdataes z(TestNavigableStringSubclasses.test_cdatacsVd�_�fdd�}�jd�}td�}|jd|��jd|j|d��jd�j�d S) zkText inside a CData object is passed into the formatter. But the return value is ignored. rcs�jd7_dS)Nr=zBITTER FAILURE)�count)�args)rrr� incrementvszNTestNavigableStringSubclasses.test_cdata_is_never_formatted..incrementr�z<><><>r=s<><>]]>)riN)r�r$rr�rri)rr�r$r+r)rr�test_cdata_is_never_formattedos z;TestNavigableStringSubclasses.test_cdata_is_never_formattedcCs2td�}|jd�}|jd|�|j|j�d�dS)NrBr�r=s )r r$r�rri)rZdoctyper$rrr�test_doctype_ends_in_newline�s z:TestNavigableStringSubclasses.test_doctype_ends_in_newlinecCstd�}|jd|j��dS)NrBz)r rZoutput_ready)rr rrr�test_declaration�sz.TestNavigableStringSubclasses.test_declarationN)rrr r�r�r�r�rrrrr�cs r�c@s�eZdZdZdd�Zdd�ZeZdd�Zdd �Zd d�Z dd �Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�Zdd�Zdd�Zdd�Zd d!�Zd"d#�Zd$d%�Zd&d'�Zd(d)�Zd*d+�Zd,d-�Zd.d/�Zd0d1�Zd2d3�Zd4d5�Zd6d7�Zd8d9�Z d:d;�Z!dd?�Z#d@dA�Z$dBdC�Z%dDdE�Z&dFdG�Z'dHdI�Z(dJdK�Z)dLdM�Z*dNdO�Z+dPdQ�Z,dRdS�Z-dTdU�Z.dVdW�Z/dXdY�Z0dZd[�Z1d\d]�Z2d^d_�Z3d`da�Z4dbdc�Z5ddde�Z6dfdg�Z7dhdi�Z8djdk�Z9dldm�Z:dndo�Z;dpdq�Z The title

Hello there.

An H1

Some text

Some more text

An H2

Another

Bob

Another H2

me span1a1 span1a2 test span2a1

English

English UK

English US

French

cCst|jd�|_dS)Nzhtml.parser)r�HTMLr$)rrrrrR�szTestSoupSelector.setUpcKsRdd�|jj|f|�D�}|j�|j�|j||d|dj|�dj|�f�dS)NcSsg|]}|d�qS)rr)r�elrrrr�sz2TestSoupSelector.assertSelects..z$Selector %s, expected [%s], got [%s]z, )r$�select�sortr�join)r�selector�expected_ids�kwargsZel_idsrrrr�szTestSoupSelector.assertSelectscGs"x|D]\}}|j||�qWdS)N)�assertSelect)rZtestsr�r�rrr�assertSelectMultiple�sz%TestSoupSelector.assertSelectMultiplecCsF|jjd�}|jt|�d�|j|djd�|j|djdg�dS)Nrhr=rz The title)r$r�rr,rNr�)r�elsrrr�test_one_tag_one�sz!TestSoupSelector.test_one_tag_onecCsX|jjd�}|jt|�d�x|D]}|j|jd�q"W|jjd�}|jd|d�dS)Nra��mainr)r$r�rr,rN� select_one)rr�rar�rrr�test_one_tag_many�s z"TestSoupSelector.test_one_tag_manycCs|jjd�}|jd|�dS)NZnonexistenttag)r$r�r)r�matchrrr�(test_select_one_returns_none_if_no_match�sz9TestSoupSelector.test_select_one_returns_none_if_no_matchcCs |jjd�}|jdddg�dS)Nzdiv div�inner�data1)r$r�r)rr�rrr�test_tag_in_tag_one�sz$TestSoupSelector.test_tag_in_tag_onecCs&x dD]}|j|ddddg�qWdS) N�html div� html body div�body divr�r�r��footer)r�r�r�)r)rr�rrr�test_tag_in_tag_many�s z%TestSoupSelector.test_tag_in_tag_manycCsB|jddgdd�|jdddgdd�|jdd ddd gdd�dS)Nzhtml divr�r=)r:z html body divr�r+zbody divr�r�r>)r)rrrr� test_limit�szTestSoupSelector.test_limitcCs|jt|jjd��d�dS)N�delr)rr,r$r�)rrrr�test_tag_no_match�sz"TestSoupSelector.test_tag_no_matchcCs|jt|jjd�dS)Nztag%t)r�r�r$r�)rrrr�test_invalid_tag�sz!TestSoupSelector.test_invalid_tagcCs|jdddg�dS)Nzcustom-dashed-tag�dash1�dash2)r)rrrr�test_select_dashed_tag_ids�sz+TestSoupSelector.test_select_dashed_tag_idscCs6|jjd�}|j|djd�|j|ddd�dS)Nzcustom-dashed-tag[id="dash2"]rzcustom-dashed-tagrr�)r$r�rrN)rZdashedrrr�test_select_dashed_by_id�sz)TestSoupSelector.test_select_dashed_by_idcCs|j|jjd�djd�dS)Nzbody > custom-dashed-tagrzHello there.)rr$r�r))rrrr�test_dashed_tag_textsz%TestSoupSelector.test_dashed_tag_textcCs |j|jjd�|jjd��dS)Nzcustom-dashed-tag)rr$r�r-)rrrr�#test_select_dashed_matches_find_allsz4TestSoupSelector.test_select_dashed_matches_find_allcCs|jddgfdddgf�dS)NZh1�header1Zh2�header2�header3)r�)rrrr�test_header_tags sz!TestSoupSelector.test_header_tagscCsVxPd D]H}|jj|�}|jt|�d�|j|djd�|j|dddg�qWdS) N�.onep�p.onep�html p.onepr=rr�rm�onep)r�r�r�)r$r�rr,rN)rr�r�rrr�test_class_ones zTestSoupSelector.test_class_onecCs |jjd�}|jt|�d�dS)Nzdiv.onepr)r$r�rr,)rr�rrr�test_class_mismatched_tagsz*TestSoupSelector.test_class_mismatched_tagcCs xdD]}|j|dg�qWdS)N� div#inner�#inner� div div#innerr�)r�r�r�)r)rr�rrr�test_one_ids zTestSoupSelector.test_one_idcCs |jjd�}|jt|�d�dS)Nz #doesnotexistr)r$r�rr,)rr�rrr�test_bad_idszTestSoupSelector.test_bad_idcCsf|jjd�}|jt|�d�x|D]}|j|jd�q"W|j|dddg�|j|djd��dS)Nzdiv#inner pr9r�r=rmr�r)r$r�rr,rNr8r7)rr�r�rrr�test_items_in_id#s z!TestSoupSelector.test_items_in_idcCs*x$dD]}|jt|jj|��d�qWdS)N�div#main del�div#main div.oops�div div#mainr)r�r�r�)rr,r$r�)rr�rrr�test_a_bunch_of_emptys+s z'TestSoupSelector.test_a_bunch_of_emptyscCs xd D]}|j|d g�qWdS)N�.class1�p.class1�.class2�p.class2�.class3�p.class3� html p.class2�div#inner .class2�pmulti)r�r�r�r�r�r�r�r�)r)rr�rrr�test_multi_class_support/sz)TestSoupSelector.test_multi_class_supportcCs xdD]}|j|dg�qWdS)N�.class1.class3�.class3.class2�.class1.class2.class3r�)r�r�r�)r)rr�rrr�test_multi_class_selection4sz+TestSoupSelector.test_multi_class_selectioncCs"|jdddg�|jddg�dS)Nz.s1 > a�s1a1�s1a2z.s1 > a span�s1a2s1)r)rrrr�test_child_selector9sz$TestSoupSelector.test_child_selectorcCs|jddg�dS)Nz.s1 > a#s1a2 spanr�)r)rrrr�test_child_selector_id=sz'TestSoupSelector.test_child_selector_idcCst|jddgfddgfddgfddgfddgfddgfd dgfd gfddgfddgfd dgfdgfdgfdgf�dS)Nzp[class="onep"]r�z p[id="p1"]z[class="onep"]z [id="p1"]zlink[rel="stylesheet"]�l1zlink[type="text/css"]zlink[href="blah.css"]zlink[href="no-blah.css"]z[rel="stylesheet"]z[type="text/css"]z[href="blah.css"]z[href="no-blah.css"]zp[href="no-blah.css"])r�)rrrr�test_attribute_equals@sz&TestSoupSelector.test_attribute_equalscCs\|jddgfddgfddgfddgfddgfddgfdd gfd d gfdd gfdd gf� dS) Nzp[class~="class1"]r�zp[class~="class2"]zp[class~="class3"]z[class~="class1"]z[class~="class2"]z[class~="class3"]za[rel~="friend"]�bobz a[rel~="met"]z[rel~="friend"]z[rel~="met"])r�)rrrr�test_attribute_tildeRsz%TestSoupSelector.test_attribute_tildecCsv|jddgfddgfdgfdgfdgfddgfdd d gfdd d gfdd dgfdd dgfddgfdd gfddgf� dS)Nz[rel^="style"]r�zlink[rel^="style"]znotlink[rel^="notstyle"]z[rel^="notstyle"]zlink[rel^="notstyle"]zlink[href^="bla"]za[href^="http://"]r��mez[href^="http://"]z [id^="p"]r�r�z [id^="m"]r�zdiv[id^="m"]z a[id^="m"]zdiv[data-tag^="dashed"]r�)r�)rrrr�test_attribute_startswith`s z*TestSoupSelector.test_attribute_startswithc CsH|jddgfddgfddgfdddddd d ddgfd dgfdgf�dS)Nz[href$=".css"]r�zlink[href$=".css"]z link[id$="1"]z [id$="1"]r�r�r�r��s2a1r�r�zdiv[id$="1"]z[id$="noending"])r�)rrrr�test_attribute_endswithqsz(TestSoupSelector.test_attribute_endswithcCs�|jddgfddgfdgfdgfdgfddgfdd d gfddd gfddgfdd gfddgfddgfddgfdddd ddddddg fddgfdgfdd d dgfdd d gfd dgfd!dd"gfd#d"gfd$dgf�dS)%Nz[rel*="style"]r�zlink[rel*="style"]znotlink[rel*="notstyle"]z[rel*="notstyle"]zlink[rel*="notstyle"]zlink[href*="bla"]z[href*="http://"]r�r�z [id*="p"]r�r�zdiv[id*="m"]r�z a[id*="m"]z[href*=".css"]zlink[href*=".css"]z link[id*="1"]z [id*="1"]r�r�r�r�r�r�r�zdiv[id*="1"]z[id*="noending"]z[href*="."]za[href*="."]zlink[href*="."]zdiv[id*="n"]r�z div[id*="nn"]zdiv[data-tag*="edval"])r�)rrrr�test_attribute_contains{s. z(TestSoupSelector.test_attribute_containscCs2|jddddgfddddgfddgfdgf�dS) Nz p[lang|="en"]zlang-enz lang-en-gbz lang-en-usz[lang|="en"]z p[lang|="fr"]zlang-frz p[lang|="gb"])r�)rrrr�test_attribute_exact_or_hypen�s z.TestSoupSelector.test_attribute_exact_or_hypenc CsV|jddddgfddgfdddgfddd d dgfdd dgfdgfdgfddgf�dS)Nz[rel]r�r�r�z link[rel]za[rel]z[lang]zlang-enz lang-en-gbz lang-en-uszlang-frzp[class]r�r�z[blah]zp[blah]z div[data-tag]r�)r�)rrrr�test_attribute_exists�s z&TestSoupSelector.test_attribute_existscCs,d}t|d�}|jd�\}|jd|j�dS)Nz]

nope

yes

zhtml.parserzdiv[style="display: right"]�yes)rr�rr)rr�r$Zchosenrrr�"test_quoted_space_in_selector_name�s z3TestSoupSelector.test_quoted_space_in_selector_namecCs(|jt|jjd�|jt|jjd�dS)Nza:no-such-pseudoclassza:nth-of-type(a))r�rr$r�)rrrr�test_unsupported_pseudoclass�sz-TestSoupSelector.test_unsupported_pseudoclasscCs�|jjd�}|jt|�d�|j|djd�|jjd�}|jt|�d�|j|djd�|jjd�}|jt|�d�|jt|jjd�dS) Nzdiv#inner p:nth-of-type(1)r=rz Some textzdiv#inner p:nth-of-type(3)ZAnotherzdiv#inner p:nth-of-type(4)zdiv p:nth-of-type(0))r$r�rr,rr�r�)rr�rrr�test_nth_of_type�sz!TestSoupSelector.test_nth_of_typecCs2|jjd�}|jt|�d�|j|djd�dS)Nzdiv#inner > p:nth-of-type(1)r=rz Some text)r$r�rr,r)rr�rrr�"test_nth_of_type_direct_descendant�sz3TestSoupSelector.test_nth_of_type_direct_descendantcCs|jddg�dS)Nz#inner > p:nth-of-type(2)r�)r)rrrr�"test_id_child_selector_nth_of_type�sz3TestSoupSelector.test_id_child_selector_nth_of_typecCs.|jjddd�}|jd�}|j|ddg�dS)Nrar�)rr�r�)r$r%r�r)rr��selectedrrr�test_select_on_element�s z'TestSoupSelector.test_select_on_elementcCs|jddg�|jdg�dS)Nz .fancy #innerr�z.normal #inner)r)rrrr�test_overspecified_child_id�sz,TestSoupSelector.test_overspecified_child_idcCsB|jddg�|jddg�|jddg�|jg|jjd��dS)Nz#p1 + h2r�z#p1 + h2 + pr�z#p1 + #header2 + .class1z#p1 + p)rrr$r�)rrrr�test_adjacent_sibling_selector�sz/TestSoupSelector.test_adjacent_sibling_selectorcCsR|jdddg�|jddg�|jddg�|jddg�|jg|jjd��dS) Nz#p1 ~ h2r�r�z#p1 ~ #header2z#p1 ~ h2 + ar�z#p1 ~ h2 + [rel="me"]z#inner ~ h2)rrr$r�)rrrr�test_general_sibling_selector�s z.TestSoupSelector.test_general_sibling_selectorcCs|jt|jjd�dS)Nzh1 >)r�r�r$r�)rrrr�test_dangling_combinator�sz)TestSoupSelector.test_dangling_combinatorcCs|jddddg�dS)Nzp[lang] ~ pz lang-en-gbz lang-en-uszlang-fr)r)rrrr�2test_sibling_combinator_wont_select_same_tag_twice�szCTestSoupSelector.test_sibling_combinator_wont_select_same_tag_twicecCs|jdddg�dS)Nzx, y�xid�yid)r)rrrr�test_multiple_select�sz%TestSoupSelector.test_multiple_selectcCs|jdddg�dS)Nzx,yrr)r)rrrr�"test_multiple_select_with_no_space�sz3TestSoupSelector.test_multiple_select_with_no_spacecCs|jdddg�dS)Nzx, yrr)r)rrrr�$test_multiple_select_with_more_space�sz5TestSoupSelector.test_multiple_select_with_more_spacecCs|jddg�dS)Nzx, xr)r)rrrr�test_multiple_select_duplicatedsz0TestSoupSelector.test_multiple_select_duplicatedcCs|jdddg�dS)Nzx, y ~ p[lang=fr]rzlang-fr)r)rrrr�test_multiple_select_siblingsz-TestSoupSelector.test_multiple_select_siblingcCs|jdddg�dS)Nzx, y > zr�zidb)r)rrrr�.test_multiple_select_tag_and_direct_descendantsz?TestSoupSelector.test_multiple_select_tag_and_direct_descendantcCs|jdddddddg�dS)Nz div > x, y, zrr�zidar�zidab�zidac)r)rrrr�/test_multiple_select_direct_descendant_and_tags sz@TestSoupSelector.test_multiple_select_direct_descendant_and_tagscCs|jdddddddg�dS)Nzdiv x,y, zrrr rr r)r)rrrr�(test_multiple_select_indirect_descendant sz9TestSoupSelector.test_multiple_select_indirect_descendantcCs(|jt|jjd�|jt|jjd�dS)Nz,x, yzx,,y)r�r�r$r�)rrrr�test_invalid_multiple_selectsz-TestSoupSelector.test_invalid_multiple_selectcCs|jdddg�dS)Nzp[lang=en], p[lang=en-gb]zlang-enz lang-en-gb)r)rrrr�test_multiple_select_attrssz+TestSoupSelector.test_multiple_select_attrscCs|jddddg�dS)Nz*x, y > z[id=zida], z[id=zidab], z[id=zidb]rrr )r)rrrr�test_multiple_select_idssz)TestSoupSelector.test_multiple_select_idscCs|jdddg�dS)Nzbody > div > x, y > zrr)r)rrrr�test_multiple_select_nestedsz,TestSoupSelector.test_multiple_select_nestedcCsRd}t|d�}|jd�}|jdt|��x$|jddgd�D]}||ks:t�q:WdS)Nz3

zhtml.parserz.c1, .c2r9Zc1Zc2)ro)rr�rr,r-r�)rr�r$r�r�rrr�test_select_duplicate_elementss z/TestSoupSelector.test_select_duplicate_elementsN)>rrr r�rRrr�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�rrrrrrrr rrrrrrrrrr��sv1 r�)2r1ZpdbrrYrSr6r1Zbs4rZbs4.builderrrZbs4.elementrrrr r rrr Zbs4.testingrrr�r�ZLXML_PRESENTrr!r2rLrPrdr�r�r�r�r�r�r�r�r�r�r-rGrRrgr�r�r�rrrr�sN( ;O83(3--*6n+a4*PK�je[0e,��.tests/__pycache__/test_html5lib.cpython-36.pycnu�[��3 6]+�@s�dZddlZyddlmZdZWn&ek rFZz dZWYddZ[XnXddlmZddl m Z mZmZeed�Gd d �d ee ��Z dS)zDTests to ensure that the html5lib tree builder generates good trees.�N)�HTML5TreeBuilderTF)�SoupStrainer)�HTML5TreeBuilderSmokeTest�SoupTest�skipIfz?html5lib seems not to be present, not testing its tree builder.c@sleZdZdZedd��Zdd�Zdd�Zdd �Zd d�Z dd �Z dd�Zdd�Zdd�Z dd�Zdd�ZdS)�HTML5LibBuilderSmokeTestz"See ``HTML5TreeBuilderSmokeTest``.cCst�S)N)r)�self�r �#/usr/lib/python3.6/test_html5lib.py�default_buildersz(HTML5LibBuilderSmokeTest.default_buildercCsdtd�}d}tjdd��}|j||d�}WdQRX|j|j�|j|��|jdt|dj �k�dS)N�bz

A bold statement.

T)�record)Z parse_onlyz4the html5lib tree builder doesn't support parse_onlyr) r�warnings�catch_warnings�soup�assertEqual�decodeZdocument_forZ assertTrue�str�message)rZstrainer�markup�wrr r r �test_soupstrainersz*HTML5LibBuilderSmokeTest.test_soupstrainercCsd}|j|d�|jd�dS)z8html5lib inserts tags where other parsers don't.z[z�

Here's another table:

foo

Here's another table:

foo

Foo
Bar
Baz

N)ZassertSoupEquals)rrr r r �test_correctly_nested_tables(sz5HTML5LibBuilderSmokeTest.test_correctly_nested_tablescCs$d}|j|�}|jd|jj��dS)Nzy

foo

)rr�p�encode)rrrr r r �(test_xml_declaration_followed_by_doctype<s zAHTML5LibBuilderSmokeTest.test_xml_declaration_followed_by_doctypecCs:d}|j|�}|jd|jj��|jdt|jd��dS)Nz%

foo

bar

foo

bar

�r)rr�bodyr�len�find_all)rrrr r r �test_reparented_markupJs z/HTML5LibBuilderSmokeTest.test_reparented_markupcCs:d}|j|�}|jd|jj��|jdt|jd��dS)Nz&

foo

bar

foo

bar

rr)rrrrrr)rrrr r r �+test_reparented_markup_ends_with_whitespaceQs zDHTML5LibBuilderSmokeTest.test_reparented_markup_ends_with_whitespacecCsLd}|j|�}|jdd�\}}|jd�\}}|j|ks:t�|j|ksHt�dS)z�Verify that we keep the two whitespace nodes in this document distinct when reparenting the adjacent tags. z,

� )�stringZtbodyN)rr�next_element�AssertionError)rrrZspace1Zspace2Ztbody1Ztbody2r r r �aftermath

aftermath

�target)r#Z aftermath��)r�noscriptrr$�findrZprevious_element)rrrr*r'Zfinal_aftermathr r r �*test_reparented_markup_containing_childrenbs zCHTML5LibBuilderSmokeTest.test_reparented_markup_containing_childrencCs$d}|j|�}t|�jd�s t�dS)z(Processing instructions become comments.szN)rr� startswithr%)rrrr r r �test_processing_instructionrs z4HTML5LibBuilderSmokeTest.test_processing_instructioncCs8d}|j|�}|jd�\}}|j||�||k s4t�dS)Ns

�a)rrrr%)rrrZa1Za2r r r �test_cloned_multivalue_nodexs z4HTML5LibBuilderSmokeTest.test_cloned_multivalue_nodecCs$d}|j|�}|jd|jj��dS)NsAz>A
)rrrr)rrrr r r �test_foster_parentings z.HTML5LibBuilderSmokeTest.test_foster_parentingN)�__name__� __module__�__qualname__�__doc__�propertyrrrrr r!r&r,r.r0r1r r r r rs r)r5rZbs4.builderrZHTML5LIB_PRESENT�ImportError�eZbs4.elementrZbs4.testingrrrrr r r r �sPK�je[vG4Wtests/__init__.pynu�[��"The beautifulsoup tests." PK�je[�MB�H�H'__pycache__/dammit.cpython-36.opt-1.pycnu�[��3 6]�t�@s dZdZddlZddlmZddlZddlZddlZdZyddl Z dd�Z WnFek r�yddlZdd�Z Wnek r�dd�Z YnXYnXyddl Z Wnek r�YnXejd j�ej�Zejd j�ej�ZGdd�de�ZGd d�d�ZGdd�d�ZdS)aBBeautiful Soup bonus library: Unicode, Dammit This library converts a bytestream to Unicode through any means necessary. It is heavily based on code from Mark Pilgrim's Universal Feed Parser. It works best on XML and HTML, but it does not rewrite the XML or HTML to reflect a new encoding; that's the tree builder's job. ZMIT�N)�codepoint2namecCstj|�dS)N�encoding)�cchardet�detect)�s�r�/usr/lib/python3.6/dammit.py�chardet_dammitsr cCstj|�dS)Nr)�chardetr)rrrrr !scCsdS)Nr)rrrrr 'sz!^<\?.*encoding=['"](.*?)['"].*\?>z0<\s*meta[^>]+charset\s*=\s*["']?([^>]*?)[ /;'">]c@s�eZdZdZdd�Ze�\ZZZdddddd �Ze j d �Ze j d�Ze dd ��Ze dd��Ze dd��Ze ddd��Ze ddd��Ze dd��ZdS)�EntitySubstitutionzASubstitute XML or HTML entities for the corresponding characters.cCsni}i}g}xBttj��D]2\}}t|�}|dkrD|j|�|||<|||<qWddj|�}||tj|�fS)N�"z[%s]�)�listr�items�chr�append�join�re�compile)�lookupZreverse_lookupZcharacters_for_reZ codepoint�name� characterZ re_definitionrrr�_populate_class_variables9s z,EntitySubstitution._populate_class_variablesZaposZquotZamp�lt�gt)�'�"�&�<�>z&([<>]|&(?!#\d+;|#x[0-9a-fA-F]+;|\w+;))z([<>&])cCs|jj|jd��}d|S)Nrz&%s;)�CHARACTER_TO_HTML_ENTITY�get�group)�cls�matchobj�entityrrr�_substitute_html_entityZsz*EntitySubstitution._substitute_html_entitycCs|j|jd�}d|S)zmUsed with a regular expression to substitute the appropriate XML entity for an XML special character.rz&%s;)�CHARACTER_TO_XML_ENTITYr")r#r$r%rrr�_substitute_xml_entity_sz)EntitySubstitution._substitute_xml_entitycCs6d}d|kr*d|kr&d}|jd|�}nd}|||S)a*Make a value into a quoted XML attribute, possibly escaping it. Most strings will be quoted using double quotes. Bob's Bar -> "Bob's Bar" If a string contains double quotes, it will be quoted using single quotes. Welcome to "my bar" -> 'Welcome to "my bar"' If a string contains both single and double quotes, the double quotes will be escaped, and the string will be quoted using double quotes. Welcome to "Bob's Bar" -> "Welcome to "Bob's bar" rrz")�replace)�self�valueZ quote_withZreplace_withrrr�quoted_attribute_valuefsz)EntitySubstitution.quoted_attribute_valueFcCs"|jj|j|�}|r|j|�}|S)aSubstitute XML entities for special XML characters. :param value: A string to be substituted. The less-than sign will become <, the greater-than sign will become >, and any ampersands will become &. If you want ampersands that appear to be part of an entity definition to be left alone, use substitute_xml_containing_entities() instead. :param make_quoted_attribute: If True, then the string will be quoted, as befits an attribute value. )�AMPERSAND_OR_BRACKET�subr(r,)r#r+�make_quoted_attributerrr�substitute_xml�s z!EntitySubstitution.substitute_xmlcCs"|jj|j|�}|r|j|�}|S)a�Substitute XML entities for special XML characters. :param value: A string to be substituted. The less-than sign will become <, the greater-than sign will become >, and any ampersands that are not part of an entity defition will become &. :param make_quoted_attribute: If True, then the string will be quoted, as befits an attribute value. )�BARE_AMPERSAND_OR_BRACKETr.r(r,)r#r+r/rrr�"substitute_xml_containing_entities�s z5EntitySubstitution.substitute_xml_containing_entitiescCs|jj|j|�S)a�Replace certain Unicode characters with named HTML entities. This differs from data.encode(encoding, 'xmlcharrefreplace') in that the goal is to make the result more readable (to those with ASCII displays) rather than to recover from errors. There's absolutely nothing wrong with a UTF-8 string containg a LATIN SMALL LETTER E WITH ACUTE, but replacing that character with "é" will make it more readable to some people. )�CHARACTER_TO_HTML_ENTITY_REr.r&)r#rrrr�substitute_html�sz"EntitySubstitution.substitute_htmlN)F)F)�__name__� __module__�__qualname__�__doc__rr ZHTML_ENTITY_TO_CHARACTERr3r'rrr1r-�classmethodr&r(r,r0r2r4rrrrr5s$ %rc@sHeZdZdZddd�Zdd�Zedd ��Zed d��Z eddd ��Z dS)�EncodingDetectora^Suggests a number of possible encodings for a bytestring. Order of precedence: 1. Encodings you specifically tell EncodingDetector to try first (the override_encodings argument to the constructor). 2. An encoding declared within the bytestring itself, either in an XML declaration (if the bytestring is to be interpreted as an XML document), or in a tag (if the bytestring is to be interpreted as an HTML document.) 3. An encoding detected through textual analysis by chardet, cchardet, or a similar external library. 4. UTF-8. 5. Windows-1252. NFcCsN|pg|_|pg}tdd�|D��|_d|_||_d|_|j|�\|_|_dS)NcSsg|]}|j��qSr)�lower)�.0�xrrr� �sz-EncodingDetector.__init__..) �override_encodings�set�exclude_encodings�chardet_encoding�is_html�declared_encoding�strip_byte_order_mark�markup�sniffed_encoding)r*rFr?rCrArrr�__init__�s zEncodingDetector.__init__cCs8|dk r4|j�}||jkrdS||kr4|j|�dSdS)NFT)r;rA�add)r*r�triedrrr�_usable�s zEncodingDetector._usableccs�t�}x |jD]}|j||�r|VqW|j|j|�r>|jV|jdkrZ|j|j|j�|_|j|j|�rp|jV|jdkr�t |j�|_|j|j|�r�|jVxdD]}|j||�r�|Vq�WdS)z tag, hopefully near the beginning of the document. iig��?N)�endposr�asciir)) rV�max�int�xml_encoding_re�search�html_meta_re�groups�decoder;)r#rFrCZsearch_entire_documentZ xml_endposZhtml_endposrDZdeclared_encoding_matchrrrrN+s z'EncodingDetector.find_declared_encoding)NFN)FF)r5r6r7r8rHrK�propertyrPr9rErNrrrrr:�s !r:c�@sReZdZdZddd�ZdddgZgdd gfd d�Zdd �Z�ddd�Z�ddd�Z e dd��Zdd�Zdd�Z �dd�d �d!�d"�d#�d$�d%�d&�d'�d(�d)�d*d2�d+d2d2�d,�d-�d.�d/�d0�d1�d2�d3�d4�d5�d6�d7d2�d8�d9dQ� ZdRddSdTdUdVdWdXdYdZd[d\d]d2d^d2d2d_d_d`d`dadbdcdddedfdgdhd2didjddkdldmdndodpd[dqdPdrdsdkddtdbdudvdwdx�d:dzd{dadSd|drd}d~dd�d2d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�dad�d�d�d�d�djd�d�d�d�d�d�d�d�d�dld�d�d�d�d�d�d�d�dud�dududududud�dudzdzdzdzd�d�d�d��Zd�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d�d��d�d�d�d�d�d�d�d�d�d �d �d�d�d �d�zZ�d;�d<�d=gZe�d�dZe�d>�dZe�d?�d�d��ZdS(@� UnicodeDammitz�A class for detecting the encoding of a *ML document and converting it to a Unicode string. If the source encoding is windows-1252, can replace MS smart quotes with their HTML or XML equivalents.z mac-romanz shift-jis)� macintoshzx-sjis�windows-1252z iso-8859-1z iso-8859-2NFcCs�||_g|_d|_||_tjt�|_t||||�|_ t |t�sF|dkr`||_t|�|_ d|_dS|j j|_d}x,|j jD] }|j j}|j|�}|dk rxPqxW|s�x@|j jD]4}|dkr�|j|d�}|dk r�|jjd�d|_Pq�W||_ |s�d|_dS)NFr rYr)zSSome characters could not be decoded, and were replaced with REPLACEMENT CHARACTER.T)�smart_quotes_to�tried_encodingsZcontains_replacement_charactersrC�loggingZ getLoggerr5�logr:�detectorrTrUrFZunicode_markup�original_encodingrP� _convert_fromZwarning)r*rFr?rerCrA�urrrrrHXs> zUnicodeDammit.__init__cCs�|jd�}|jdkr&|jj|�j�}nf|jj|�}t|�tkr�|jdkrfdj�|dj�dj�}q�dj�|dj�dj�}n|j�}|S)z[Changes a MS smart quote character to an XML or HTML entity, or an ASCII character.�rYZxmlz&#x�;rr)r"re�MS_CHARS_TO_ASCIIr!�encode�MS_CHARS�type�tuple)r*�matchZorigr.rrr�_sub_ms_char�s zUnicodeDammit._sub_ms_char�strictcCs�|j|�}|s||f|jkr"dS|jj||f�|j}|jdk rh||jkrhd}tj|�}|j|j |�}y|j |||�}||_||_Wn tk r�}zdSd}~XnX|jS)Ns([�-�])) � find_codecrfrrFre�ENCODINGS_WITH_SMART_QUOTESrrr.ru�_to_unicoderj� Exception)r*Zproposed�errorsrFZsmart_quotes_reZsmart_quotes_compiledrlrOrrrrk�s" zUnicodeDammit._convert_fromcCst|||�S)zGiven a string and its encoding, decodes the string into Unicode. %encoding is a string recognized by encodings.aliases)rU)r*rWrr{rrrry�szUnicodeDammit._to_unicodecCs|js dS|jjS)N)rCrirD)r*rrr�declared_html_encoding�sz$UnicodeDammit.declared_html_encodingcCs`|j|jj||��pN|r*|j|jdd��pN|r@|j|jdd��pN|rL|j�pN|}|r\|j�SdS)N�-r �_)�_codec�CHARSET_ALIASESr!r)r;)r*�charsetr+rrrrw�szUnicodeDammit.find_codeccCs<|s|Sd}ytj|�|}Wnttfk r6YnX|S)N)�codecsr�LookupError� ValueError)r*r��codecrrrr�s zUnicodeDammit._codec�euro�20AC� �sbquo�201A�fnof�192�bdquo�201E�hellip�2026�dagger�2020�Dagger�2021�circ�2C6�permil�2030�Scaron�160�lsaquo�2039�OElig�152�?�#x17D�17D�lsquo�2018�rsquo�2019�ldquo�201C�rdquo�201D�bull�2022�ndash�2013�mdash�2014�tilde�2DC�trade�2122�scaron�161�rsaquo�203A�oelig�153�#x17E�17E�Yumlr ) ��ZEUR�,�fz,,z...�+z++�^�%�SrZOE�Zrr�*r}z--�~z(TM)rrZoe�z�Y�!�cZGBP�$ZYEN�|z..z(th)z<>z1/4z1/2z3/4�AZAE�C�E�I�D�N�O�U�b�B�aZaerO�i�n�/�y)�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r��s€s‚sƒs„s…s†s‡sˆs‰sŠs‹sŒsŽs‘s’s“s”s•s–s—s˜s™sšs›sœsžsŸs s¡s¢s£s¤s¥s¦s§s¨s©sªs«s¬ss®s¯s°s±s²s³s´sµs¶s·s¸s¹sºs»s¼s½s¾s¿sÀsÁsÂsÃsÄsÅsÆsÇsÈsÉsÊsËsÌsÍsÎsÏsÐsÑsÒsÓsÔsÕsÖs×sØsÙsÚsÛsÜsÝsÞsßsàrsâsãsäsåsæsçsèsésêsësìsísîsïsðsñsòsósôsõsös÷søsùsúsûsüsýsþ)z��r�r�rRr�r�rSr�r�rQrrm�utf8cCs$|jdd�j�dkrtd��|j�dkr0td��g}d }d }x�|t|�k�r�||}t|t�sft|�}||jkr�||jkr�xz|j D]$\}} } ||kr�|| kr�|| 7}Pq�Wq>|d kr�||j kr�|j|||��|j|j |�|d7}|}q>|d7}q>W|d k�r|S|j||d��d j|�S)a�Fix characters from one encoding embedded in some other encoding. Currently the only situation supported is Windows-1252 (or its subset ISO-8859-1), embedded in UTF-8. The input must be a bytestring. If you've already converted the document to Unicode, you're too late. The output is a bytestring in which `embedded_encoding` characters have been converted to their `main_encoding` equivalents. r~r}�windows-1252�windows_1252zPWindows-1252 and ISO-8859-1 are the only currently supported embedded encodings.r��utf-8z4UTF-8 is the only currently supported main encoding.rrarmN�)r�r�)r�r�) r)r;�NotImplementedErrorrVrTr[�ord�FIRST_MULTIBYTE_MARKER�LAST_MULTIBYTE_MARKER�MULTIBYTE_MARKERS_AND_SIZES�WINDOWS_1252_TO_UTF8rr)r#Zin_bytesZ main_encodingZembedded_encodingZbyte_chunksZchunk_start�posZbyte�start�end�sizerrr� detwingles< zUnicodeDammit.detwingle)rv)rv)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r�)r�r )rr�)r�r�rR)r�r�rS)r�r�rQ��)r�rd)r5r6r7r8r�rxrHrurkryrar|rwrrqror�r�r�r�r9r�rrrrrbEs`1 rb)r8Z__license__r�Z html.entitiesrrrg�stringZchardet_typerr �ImportErrorr Ziconv_codecrrpr�r\r^�objectrr:rbrrrr�s8PK�je[��ܚ�>�>#__pycache__/__init__.cpython-36.pycnu�[��3 (6]XY�@sdZdZdZdZdZdgZddlZddlZddlZddl Z ddl Z dd lmZm Z dd lmZddlmZmZmZmZmZmZmZmZmZmZmZdd kGdd�de�ZeZeZGdd�de�ZGdd�de �Z!Gdd�de"�Z#e$dk�r ddlZeej%�Z&e'e&j(��dS)aHBeautiful Soup Elixir and Tonic "The Screen-Scraper's Friend" http://www.crummy.com/software/BeautifulSoup/ Beautiful Soup uses a pluggable XML or HTML parser to parse a (possibly invalid) document into a tree representation. Beautiful Soup provides methods and Pythonic idioms that make it easy to navigate, search, and modify the parse tree. Beautiful Soup works with Python 2.7 and up. It works better if lxml and/or html5lib is installed. For more than you ever wanted to know about Beautiful Soup, see the documentation: http://www.crummy.com/software/BeautifulSoup/bs4/doc/ z*Leonard Richardson (leonardr@segfault.org)z4.6.3z*Copyright (c) 2004-2018 Leonard RichardsonZMIT� BeautifulSoup�N�)�builder_registry�ParserRejectedMarkup)� UnicodeDammit)�CData�Comment�DEFAULT_OUTPUT_ENCODING�Declaration�Doctype�NavigableString�PageElement�ProcessingInstruction� ResultSet�SoupStrainer�Tagz`You are trying to run the Python 2 version of Beautiful Soup under Python 3. This will not work.zuYou need to convert the code, either by installing it (`python setup.py install`) or by running 2to3 (`2to3 -w bs4`).cs�eZdZdZdZddgZdZdZd2d d �Zdd�Z d d�Z edd��Zdd�Z dd�Zddifdd�Zefdd�Zdd�Zdd�Zdd�Zdd �Zefd!d"�Zd3d#d$�Zd4d&d'�Zd(d)�Zd5d*d+�Zd,d-�Zd.ed/f�fd0d1� Z�ZS)6ra This class defines the basic interface called by the tree builders. These methods will be called by the parser: reset() feed(markup) The tree builder may call these methods from its feed() implementation: handle_starttag(name, attrs) # See note about return value handle_endtag(name) handle_data(data) # Appends to the current data node endData(containerClass=NavigableString) # Ends the current data node No matter how complicated the underlying parser is, you should be able to build a tree using 'start tag' events, 'end tag' events, 'data' events, and "done with data" events. If you encounter an empty-element tag (aka a self-closing tag, like HTML's
tag), call handle_starttag and then handle_endtag. z [document]ZhtmlZfastz a�No parser was explicitly specified, so I'm using the best available %(markup_type)s parser for this system ("%(parser)s"). This usually isn't a problem, but if you run this code on another system, or in a different virtual environment, it may use a different parser and behave differently. The code that caused this warning is on line %(line_number)s of the file %(filename)s. To get rid of this warning, pass the additional argument 'features="%(parser)s"' to the BeautifulSoup constructor. �Nc"s�d�krtjd�d�kr*�d=tjd�d�krB�d=tjd�d�krZ�d=tjd�d �krr�d =tjd ��fdd�}|p�|d d�}|p�|dd�}|r�t|t�r�tjd�d}t��dkr�t�j��j�} td| ��|dk�r|} t|t�r�|g}|dk�st|�dk�r|j }t j|�}|dk�r@tddj |��|�}| |jk�pZ| |jk�s|j�rld}nd}d} ytjd�} Wntk �r�YnX| �r�| j}| j}n tj}d}|jd�}|�r�|j�}|jd(��r�|dd)�}|�rt|||j|d�}tj|j|dd�||_|j|_|j|_||j_||_t |d ��rN|j!�}n�t|�d!k�rt|t"��rrd"|k�s�t|t��rd#|k�rt|t��r�t#j$j%�r�|j&d$�}n|}d%}yt#j$j'|�}Wn$t(k �r�}zWYdd}~XnX|�rt|t��r|j&d$�}tjd&|�|j)|�xZ|jj*|||d'�D]D\|_+|_,|_-|_.|j/�y|j0�PWnt1k �rrYnX�q2Wd|_+d|j_dS)*a_Constructor. :param markup: A string or a file-like object representing markup to be parsed. :param features: Desirable features of the parser to be used. This may be the name of a specific parser ("lxml", "lxml-xml", "html.parser", or "html5lib") or it may be the type of markup to be used ("html", "html5", "xml"). It's recommended that you name a specific parser, so that Beautiful Soup gives you the same results across platforms and virtual environments. :param builder: A specific TreeBuilder to use instead of looking one up based on `features`. You shouldn't need to use this. :param parse_only: A SoupStrainer. Only parts of the document matching the SoupStrainer will be considered. This is useful when parsing part of a document that would otherwise be too large to fit into memory. :param from_encoding: A string indicating the encoding of the document to be parsed. Pass this in if Beautiful Soup is guessing wrongly about the document's encoding. :param exclude_encodings: A list of strings indicating encodings known to be wrong. Pass this in if you don't know the document's encoding but you know Beautiful Soup's guess is wrong. :param kwargs: For backwards compatibility purposes, the constructor accepts certain keyword arguments used in Beautiful Soup 3. None of these arguments do anything in Beautiful Soup 4 and there's no need to actually pass keyword arguments into the constructor. ZconvertEntitiesz�BS4 does not respect the convertEntities argument to the BeautifulSoup constructor. Entities are always converted to Unicode characters.Z markupMassagez�BS4 does not respect the markupMassage argument to the BeautifulSoup constructor. The tree builder is responsible for any necessary markup massage.Z smartQuotesToz�BS4 does not respect the smartQuotesTo argument to the BeautifulSoup constructor. Smart quotes are always converted to Unicode characters.ZselfClosingTagsz�BS4 does not respect the selfClosingTags argument to the BeautifulSoup constructor. The tree builder is responsible for understanding self-closing tags.ZisHTMLz�BS4 does not respect the isHTML argument to the BeautifulSoup constructor. Suggest you use features='lxml' for HTML and features='lxml-xml' for XML.cs0|�kr,tjd||f��|}�|=|SdS)NzLThe "%s" argument to the BeautifulSoup constructor has been renamed to "%s.")�warnings�warn)Zold_name�new_name�value)�kwargs��/usr/lib/python3.6/__init__.py�deprecated_argument�sz3BeautifulSoup.__init__..deprecated_argumentZparseOnlyThese� parse_onlyZfromEncoding� from_encodingzlYou provided Unicode markup but also provided a value for from_encoding. Your from_encoding will be ignored.Nrz2__init__() got an unexpected keyword argument '%s'zjCouldn't find a tree builder with the features you requested: %s. Do you need to install a parser library?�,ZXMLZHTMLr�__file__�.pyc�.pyo)�filename�line_number�parser�markup_type�)� stacklevel�read��<�<�utf8Fzw"%s" looks like a filename, not markup. You should probably open this file and pass the filehandle into Beautiful Soup.)�exclude_encodings)rr ��)2rr� isinstance�str�len�list�keys�pop� TypeError�DEFAULT_BUILDER_FEATURESr�lookup�FeatureNotFound�join�NAMEZALTERNATE_NAMES�is_xml�sys� _getframe� ValueError� f_globals�f_lineno�__dict__�get�lower�endswith�dict�NO_PARSER_SPECIFIED_WARNING�builderZ known_xml�soupr�hasattrr'�bytes�os�path�supports_unicode_filenames�encode�exists� Exception�_check_markup_is_urlZprepare_markup�markup�original_encodingZdeclared_html_encodingZcontains_replacement_characters�reset�_feedr)�selfrQ�featuresrFrrr,rr�argZoriginal_featuresZ builder_classr$Zcaller�globalsr"r!Zfnl�valuesZpossible_filename�is_file�er)rr�__init__Xs�' zBeautifulSoup.__init__cCs&t|�|jd�|jdd�}|j|_|S)Nzutf-8)rFr)�typerMrFrR)rU�copyrrr�__copy__$szBeautifulSoup.__copy__cCs(t|j�}d|kr$|jjr$d|d<|S)NrF)rDr@rFZ picklable)rU�drrr�__getstate__0s zBeautifulSoup.__getstate__csxt�t�rd}d }nt�t�r(d}d}ndSt�fdd �|D��rt|�krtt�t�rb�jd d�}n�}tjd|�dS)z� Check if markup looks like it's actually a url and raise a warning if so. Markup can be unicode or str (py2) / bytes (py3). � �http:�https:� �http:�https:Nc3s|]}�j|�VqdS)N)� startswith)�.0�prefix)rQrr� Fsz5BeautifulSoup._check_markup_is_url..zutf-8�replacez�"%s" looks like a URL. Beautiful Soup is not an HTTP client. You should probably use an HTTP client like requests to get the document behind the URL, and feed that document to Beautiful Soup.)rcrd)rfrg)r.rIr/�any�decoderr)rQZspaceZcant_start_withZdecoded_markupr)rQrrP7s z"BeautifulSoup._check_markup_is_urlcCs@|jj�|jj|j�|j�x|jj|jkr:|j�q"WdS)N) rFrSZfeedrQ�endData� currentTag�name� ROOT_TAG_NAME�popTag)rUrrrrTSs zBeautifulSoup._feedcCsJtj|||j|j�d|_|jj�g|_d|_g|_g|_ |j |�dS)Nr)rr\rFrrZhiddenrS�current_datarp�tagStack�preserve_whitespace_tag_stack�pushTag)rUrrrrS]s zBeautifulSoup.resetcKs|j|�td|j||||�S)z+Create a new tag associated with this soup.N)�updaterrF)rUrq� namespace�nsprefix�attrsZkwattrsrrr�new_taggs zBeautifulSoup.new_tagcCs||�S)z7Create a new NavigableString associated with this soup.r)rU�s�subclassrrr� new_stringlszBeautifulSoup.new_stringcCstd��dS)Nz4BeautifulSoup objects don't support insert_before().)�NotImplementedError)rU� successorrrr� insert_beforepszBeautifulSoup.insert_beforecCstd��dS)Nz3BeautifulSoup objects don't support insert_after().)r�)rUr�rrr�insert_aftersszBeautifulSoup.insert_aftercCs@|jj�}|jr(||jdkr(|jj�|jr:|jd|_|jS)Nrr-r-)rur3rvrp)rU�tagrrrrsvs zBeautifulSoup.popTagcCsJ|jr|jjj|�|jj|�|jd|_|j|jjkrF|jj|�dS)Nrr-)rp�contents�appendrurqrFZpreserve_whitespace_tagsrv)rUr�rrrrwszBeautifulSoup.pushTagcCs�|jr�dj|j�}|jsPd}x|D]}||jkr"d}Pq"W|rPd|krLd}nd}g|_|jr�t|j�dkr�|jjs�|jj|�r�dS||�}|j |�dS)NrTF� rer) rtr8rv�ASCII_SPACESrr0ru�text�search�object_was_parsed)rUZcontainerClassrtZ strippable�i�orrrro�s& zBeautifulSoup.endDatac CsV|p|j}|p|j}d}}}t|t�rF|j}|j}|j}|sF|j}|j|||||�||_|j j |�|j�rRt|j �d}x4|dkr�|j ||kr�P|d8}q�Wtd||f��|dkr�|}d}n|j |d}}|t|j �dkr�|j}d}n|j |d}}||_|�r||_||_|�r.||_||_|�r@||_||_|�rR||_dS)z Add an object to the parse tree.Nrrz[Error building tree: supposedly %r was inserted into %r after the fact, but I don't see it!) rp�_most_recent_elementr.r�next_element�next_sibling�previous_sibling�previous_elementZsetupr�r�r0r=) rUr��parentZmost_recent_elementr�r�r�r��indexrrrr��sR zBeautifulSoup.object_was_parsedTcCsn||jkrdSd}t|j�}xLt|ddd�D]8}|j|}||jkr^||jkr^|r\|j�}P|j�}q.W|S)z�Pops the tag stack up to and including the most recent instance of the given tag. If inclusivePop is false, pops the tag stack up to but *not* including the most recent instqance of the given tag.Nrrr-)rrr0ru�rangerqrjrs)rUrqrzZinclusivePopZmost_recently_popped� stack_sizer��trrr� _popToTag�s zBeautifulSoup._popToTagc Cs�|j�|jr8t|j�dkr8|jjs4|jj||�r8dSt||j|||||j|j �}|dkr`|S|j rn||j _ ||_ |j|�|S)aPush a start tag on to the stack. If this method returns None, the tag was rejected by the SoupStrainer. You should proceed as if the tag had not occurred in the document. For instance, if this was a self-closing tag, don't call handle_endtag. rN)rorr0rur�Z search_tagrrFrpr�r�rw)rUrqryrzr{r�rrr�handle_starttag�s zBeautifulSoup.handle_starttagcCs|j�|j||�dS)N)ror�)rUrqrzrrr� handle_endtagszBeautifulSoup.handle_endtagcCs|jj|�dS)N)rtr�)rU�datarrr�handle_dataszBeautifulSoup.handle_dataFZminimalcsN|jr$d}|dkrd|}d|}nd}|s2d}nd}|tt|�j|||�S)zlReturns a string or Unicode representation of this document. To get Unicode, pass None for encoding.rNz encoding="%s"z r)r:�superrrn)rUZpretty_printZeventual_encodingZ formatterZ encoding_partrjZindent_level)� __class__rrrns zBeautifulSoup.decode)rNNNNN)NN)NT)N)�__name__� __module__�__qualname__�__doc__rrr5r�rEr\r_ra�staticmethodrPrTrSr|rrr�r�rsrwror�r�r�r�r�r rn� __classcell__rr)r�rr8s8 L 9 cs eZdZdZ�fdd�Z�ZS)�BeautifulStoneSoupz&Deprecated interface to an XML parser.cs(d|d<tjd�tt|�j||�dS)NZxmlrVzxThe BeautifulStoneSoup class is deprecated. Instead of using it, pass features="xml" into the BeautifulSoup constructor.)rrr�r�r\)rU�argsr)r�rrr\5szBeautifulStoneSoup.__init__)r�r�r�r�r\r�rr)r�rr�2sr�c@seZdZdS)�StopParsingN)r�r�r�rrrrr�=sr�c@seZdZdS)r7N)r�r�r�rrrrr7@sr7�__main__))r�� __author__�__version__Z __copyright__Z__license__�__all__rJ�rer;� tracebackrrFrrZdammitr�elementrrr r rrr rrrrrZ_sZ_soupr�rOr�r=r7r��stdinrG�printZprettifyrrrr�s64z PK�je[��ܚ�>�>)__pycache__/__init__.cpython-36.opt-1.pycnu�[��3 (6]XY�@sdZdZdZdZdZdgZddlZddlZddlZddl Z ddl Z dd lmZm Z dd lmZddlmZmZmZmZmZmZmZmZmZmZmZdd kGdd�de�ZeZeZGdd�de�ZGdd�de �Z!Gdd�de"�Z#e$dk�r ddlZeej%�Z&e'e&j(��dS)aHBeautiful Soup Elixir and Tonic "The Screen-Scraper's Friend" http://www.crummy.com/software/BeautifulSoup/ Beautiful Soup uses a pluggable XML or HTML parser to parse a (possibly invalid) document into a tree representation. Beautiful Soup provides methods and Pythonic idioms that make it easy to navigate, search, and modify the parse tree. Beautiful Soup works with Python 2.7 and up. It works better if lxml and/or html5lib is installed. For more than you ever wanted to know about Beautiful Soup, see the documentation: http://www.crummy.com/software/BeautifulSoup/bs4/doc/ z*Leonard Richardson (leonardr@segfault.org)z4.6.3z*Copyright (c) 2004-2018 Leonard RichardsonZMIT� BeautifulSoup�N�)�builder_registry�ParserRejectedMarkup)� UnicodeDammit)�CData�Comment�DEFAULT_OUTPUT_ENCODING�Declaration�Doctype�NavigableString�PageElement�ProcessingInstruction� ResultSet�SoupStrainer�Tagz`You are trying to run the Python 2 version of Beautiful Soup under Python 3. This will not work.zuYou need to convert the code, either by installing it (`python setup.py install`) or by running 2to3 (`2to3 -w bs4`).cs�eZdZdZdZddgZdZdZd2d d �Zdd�Z d d�Z edd��Zdd�Z dd�Zddifdd�Zefdd�Zdd�Zdd�Zdd�Zdd �Zefd!d"�Zd3d#d$�Zd4d&d'�Zd(d)�Zd5d*d+�Zd,d-�Zd.ed/f�fd0d1� Z�ZS)6ra This class defines the basic interface called by the tree builders. These methods will be called by the parser: reset() feed(markup) The tree builder may call these methods from its feed() implementation: handle_starttag(name, attrs) # See note about return value handle_endtag(name) handle_data(data) # Appends to the current data node endData(containerClass=NavigableString) # Ends the current data node No matter how complicated the underlying parser is, you should be able to build a tree using 'start tag' events, 'end tag' events, 'data' events, and "done with data" events. If you encounter an empty-element tag (aka a self-closing tag, like HTML's
tag), call handle_starttag and then handle_endtag. z [document]ZhtmlZfastz a�No parser was explicitly specified, so I'm using the best available %(markup_type)s parser for this system ("%(parser)s"). This usually isn't a problem, but if you run this code on another system, or in a different virtual environment, it may use a different parser and behave differently. The code that caused this warning is on line %(line_number)s of the file %(filename)s. To get rid of this warning, pass the additional argument 'features="%(parser)s"' to the BeautifulSoup constructor. �Nc"s�d�krtjd�d�kr*�d=tjd�d�krB�d=tjd�d�krZ�d=tjd�d �krr�d =tjd ��fdd�}|p�|d d�}|p�|dd�}|r�t|t�r�tjd�d}t��dkr�t�j��j�} td| ��|dk�r|} t|t�r�|g}|dk�st|�dk�r|j }t j|�}|dk�r@tddj |��|�}| |jk�pZ| |jk�s|j�rld}nd}d} ytjd�} Wntk �r�YnX| �r�| j}| j}n tj}d}|jd�}|�r�|j�}|jd(��r�|dd)�}|�rt|||j|d�}tj|j|dd�||_|j|_|j|_||j_||_t |d ��rN|j!�}n�t|�d!k�rt|t"��rrd"|k�s�t|t��rd#|k�rt|t��r�t#j$j%�r�|j&d$�}n|}d%}yt#j$j'|�}Wn$t(k �r�}zWYdd}~XnX|�rt|t��r|j&d$�}tjd&|�|j)|�xZ|jj*|||d'�D]D\|_+|_,|_-|_.|j/�y|j0�PWnt1k �rrYnX�q2Wd|_+d|j_dS)*a_Constructor. :param markup: A string or a file-like object representing markup to be parsed. :param features: Desirable features of the parser to be used. This may be the name of a specific parser ("lxml", "lxml-xml", "html.parser", or "html5lib") or it may be the type of markup to be used ("html", "html5", "xml"). It's recommended that you name a specific parser, so that Beautiful Soup gives you the same results across platforms and virtual environments. :param builder: A specific TreeBuilder to use instead of looking one up based on `features`. You shouldn't need to use this. :param parse_only: A SoupStrainer. Only parts of the document matching the SoupStrainer will be considered. This is useful when parsing part of a document that would otherwise be too large to fit into memory. :param from_encoding: A string indicating the encoding of the document to be parsed. Pass this in if Beautiful Soup is guessing wrongly about the document's encoding. :param exclude_encodings: A list of strings indicating encodings known to be wrong. Pass this in if you don't know the document's encoding but you know Beautiful Soup's guess is wrong. :param kwargs: For backwards compatibility purposes, the constructor accepts certain keyword arguments used in Beautiful Soup 3. None of these arguments do anything in Beautiful Soup 4 and there's no need to actually pass keyword arguments into the constructor. ZconvertEntitiesz�BS4 does not respect the convertEntities argument to the BeautifulSoup constructor. Entities are always converted to Unicode characters.Z markupMassagez�BS4 does not respect the markupMassage argument to the BeautifulSoup constructor. The tree builder is responsible for any necessary markup massage.Z smartQuotesToz�BS4 does not respect the smartQuotesTo argument to the BeautifulSoup constructor. Smart quotes are always converted to Unicode characters.ZselfClosingTagsz�BS4 does not respect the selfClosingTags argument to the BeautifulSoup constructor. The tree builder is responsible for understanding self-closing tags.ZisHTMLz�BS4 does not respect the isHTML argument to the BeautifulSoup constructor. Suggest you use features='lxml' for HTML and features='lxml-xml' for XML.cs0|�kr,tjd||f��|}�|=|SdS)NzLThe "%s" argument to the BeautifulSoup constructor has been renamed to "%s.")�warnings�warn)Zold_name�new_name�value)�kwargs��/usr/lib/python3.6/__init__.py�deprecated_argument�sz3BeautifulSoup.__init__..deprecated_argumentZparseOnlyThese� parse_onlyZfromEncoding� from_encodingzlYou provided Unicode markup but also provided a value for from_encoding. Your from_encoding will be ignored.Nrz2__init__() got an unexpected keyword argument '%s'zjCouldn't find a tree builder with the features you requested: %s. Do you need to install a parser library?�,ZXMLZHTMLr�__file__�.pyc�.pyo)�filename�line_number�parser�markup_type�)� stacklevel�read��<�<�utf8Fzw"%s" looks like a filename, not markup. You should probably open this file and pass the filehandle into Beautiful Soup.)�exclude_encodings)rr ��)2rr� isinstance�str�len�list�keys�pop� TypeError�DEFAULT_BUILDER_FEATURESr�lookup�FeatureNotFound�join�NAMEZALTERNATE_NAMES�is_xml�sys� _getframe� ValueError� f_globals�f_lineno�__dict__�get�lower�endswith�dict�NO_PARSER_SPECIFIED_WARNING�builderZ known_xml�soupr�hasattrr'�bytes�os�path�supports_unicode_filenames�encode�exists� Exception�_check_markup_is_urlZprepare_markup�markup�original_encodingZdeclared_html_encodingZcontains_replacement_characters�reset�_feedr)�selfrQ�featuresrFrrr,rr�argZoriginal_featuresZ builder_classr$Zcaller�globalsr"r!Zfnl�valuesZpossible_filename�is_file�er)rr�__init__Xs�' zBeautifulSoup.__init__cCs&t|�|jd�|jdd�}|j|_|S)Nzutf-8)rFr)�typerMrFrR)rU�copyrrr�__copy__$szBeautifulSoup.__copy__cCs(t|j�}d|kr$|jjr$d|d<|S)NrF)rDr@rFZ picklable)rU�drrr�__getstate__0s zBeautifulSoup.__getstate__csxt�t�rd}d }nt�t�r(d}d}ndSt�fdd �|D��rt|�krtt�t�rb�jd d�}n�}tjd|�dS)z� Check if markup looks like it's actually a url and raise a warning if so. Markup can be unicode or str (py2) / bytes (py3). � �http:�https:� �http:�https:Nc3s|]}�j|�VqdS)N)� startswith)�.0�prefix)rQrr� Fsz5BeautifulSoup._check_markup_is_url..zutf-8�replacez�"%s" looks like a URL. Beautiful Soup is not an HTTP client. You should probably use an HTTP client like requests to get the document behind the URL, and feed that document to Beautiful Soup.)rcrd)rfrg)r.rIr/�any�decoderr)rQZspaceZcant_start_withZdecoded_markupr)rQrrP7s z"BeautifulSoup._check_markup_is_urlcCs@|jj�|jj|j�|j�x|jj|jkr:|j�q"WdS)N) rFrSZfeedrQ�endData� currentTag�name� ROOT_TAG_NAME�popTag)rUrrrrTSs zBeautifulSoup._feedcCsJtj|||j|j�d|_|jj�g|_d|_g|_g|_ |j |�dS)Nr)rr\rFrrZhiddenrS�current_datarp�tagStack�preserve_whitespace_tag_stack�pushTag)rUrrrrS]s zBeautifulSoup.resetcKs|j|�td|j||||�S)z+Create a new tag associated with this soup.N)�updaterrF)rUrq� namespace�nsprefix�attrsZkwattrsrrr�new_taggs zBeautifulSoup.new_tagcCs||�S)z7Create a new NavigableString associated with this soup.r)rU�s�subclassrrr� new_stringlszBeautifulSoup.new_stringcCstd��dS)Nz4BeautifulSoup objects don't support insert_before().)�NotImplementedError)rU� successorrrr� insert_beforepszBeautifulSoup.insert_beforecCstd��dS)Nz3BeautifulSoup objects don't support insert_after().)r�)rUr�rrr�insert_aftersszBeautifulSoup.insert_aftercCs@|jj�}|jr(||jdkr(|jj�|jr:|jd|_|jS)Nrr-r-)rur3rvrp)rU�tagrrrrsvs zBeautifulSoup.popTagcCsJ|jr|jjj|�|jj|�|jd|_|j|jjkrF|jj|�dS)Nrr-)rp�contents�appendrurqrFZpreserve_whitespace_tagsrv)rUr�rrrrwszBeautifulSoup.pushTagcCs�|jr�dj|j�}|jsPd}x|D]}||jkr"d}Pq"W|rPd|krLd}nd}g|_|jr�t|j�dkr�|jjs�|jj|�r�dS||�}|j |�dS)NrTF� rer) rtr8rv�ASCII_SPACESrr0ru�text�search�object_was_parsed)rUZcontainerClassrtZ strippable�i�orrrro�s& zBeautifulSoup.endDatac CsV|p|j}|p|j}d}}}t|t�rF|j}|j}|j}|sF|j}|j|||||�||_|j j |�|j�rRt|j �d}x4|dkr�|j ||kr�P|d8}q�Wtd||f��|dkr�|}d}n|j |d}}|t|j �dkr�|j}d}n|j |d}}||_|�r||_||_|�r.||_||_|�r@||_||_|�rR||_dS)z Add an object to the parse tree.Nrrz[Error building tree: supposedly %r was inserted into %r after the fact, but I don't see it!) rp�_most_recent_elementr.r�next_element�next_sibling�previous_sibling�previous_elementZsetupr�r�r0r=) rUr��parentZmost_recent_elementr�r�r�r��indexrrrr��sR zBeautifulSoup.object_was_parsedTcCsn||jkrdSd}t|j�}xLt|ddd�D]8}|j|}||jkr^||jkr^|r\|j�}P|j�}q.W|S)z�Pops the tag stack up to and including the most recent instance of the given tag. If inclusivePop is false, pops the tag stack up to but *not* including the most recent instqance of the given tag.Nrrr-)rrr0ru�rangerqrjrs)rUrqrzZinclusivePopZmost_recently_popped� stack_sizer��trrr� _popToTag�s zBeautifulSoup._popToTagc Cs�|j�|jr8t|j�dkr8|jjs4|jj||�r8dSt||j|||||j|j �}|dkr`|S|j rn||j _ ||_ |j|�|S)aPush a start tag on to the stack. If this method returns None, the tag was rejected by the SoupStrainer. You should proceed as if the tag had not occurred in the document. For instance, if this was a self-closing tag, don't call handle_endtag. rN)rorr0rur�Z search_tagrrFrpr�r�rw)rUrqryrzr{r�rrr�handle_starttag�s zBeautifulSoup.handle_starttagcCs|j�|j||�dS)N)ror�)rUrqrzrrr� handle_endtagszBeautifulSoup.handle_endtagcCs|jj|�dS)N)rtr�)rU�datarrr�handle_dataszBeautifulSoup.handle_dataFZminimalcsN|jr$d}|dkrd|}d|}nd}|s2d}nd}|tt|�j|||�S)zlReturns a string or Unicode representation of this document. To get Unicode, pass None for encoding.rNz encoding="%s"z r)r:�superrrn)rUZpretty_printZeventual_encodingZ formatterZ encoding_partrjZindent_level)� __class__rrrns zBeautifulSoup.decode)rNNNNN)NN)NT)N)�__name__� __module__�__qualname__�__doc__rrr5r�rEr\r_ra�staticmethodrPrTrSr|rrr�r�rsrwror�r�r�r�r�r rn� __classcell__rr)r�rr8s8 L 9 cs eZdZdZ�fdd�Z�ZS)�BeautifulStoneSoupz&Deprecated interface to an XML parser.cs(d|d<tjd�tt|�j||�dS)NZxmlrVzxThe BeautifulStoneSoup class is deprecated. Instead of using it, pass features="xml" into the BeautifulSoup constructor.)rrr�r�r\)rU�argsr)r�rrr\5szBeautifulStoneSoup.__init__)r�r�r�r�r\r�rr)r�rr�2sr�c@seZdZdS)�StopParsingN)r�r�r�rrrrr�=sr�c@seZdZdS)r7N)r�r�r�rrrrr7@sr7�__main__))r�� __author__�__version__Z __copyright__Z__license__�__all__rJ�rer;� tracebackrrFrrZdammitr�elementrrr r rrr rrrrrZ_sZ_soupr�rOr�r=r7r��stdinrG�printZprettifyrrrr�s64z PK�je[�r�d?�Z"d@dA�Z#dBdC�Z$dDdE�Z%dFd�ZdGdH�Z&dIdJ�Z'dKdL�Z(dMdN�Z)dOdP�Z*dQdR�Z+dSdT�Z,dUdV�Z-dWdX�Z.dYdZ�Z/d[d\�Z0d]d^�Z1d_d`�Z2dadb�Z3dcdd�Z4dedf�Z5dgdh�Z6didj�Z7dkdl�Z8dmdn�Z9dodp�Z:dqS)r�HTMLTreeBuilderSmokeTestaCA basic test of a treebuilder's competence. Any HTML treebuilder, present or future, should be able to pass these tests. With invalid markup, there's room for interpretation, and different parsers can handle it differently. But with the markup in these tests, there's not much room for interpretation. cCs4x.dD]&}|jd�}|j|�}|jd|j�qWdS)zmVerify that all HTML4 and HTML5 empty element (aka void element) tags are handled correctly. �area�base�br�col�embed�hr�img�input�keygen�link�menuitem�meta�param�source�track�wbr�spacer�frame�TN)r#r$r%r&r'r(r)r*r+r,r-r.r/r0r1r2r3r4)r�new_tagr�is_empty_element)r�namerr6r r r�test_empty_element_tagsIs z0HTMLTreeBuilderSmokeTest.test_empty_element_tagscCsF|jd�}tj|d�}tj|�}|j|jt�|j|j�|j��dS)Nz foo�)r�pickle�dumps�loadsr� __class__rr)r�tree�dumped�loadedr r r�!test_pickle_and_unpickle_identityUs z:HTMLTreeBuilderSmokeTest.test_pickle_and_unpickle_identitycCsf|j|�\}}|jd}|j|jt�|j||�|jt|�dt|��|�|j|jjdd�dS)z8Assert that a given doctype string is handled correctly.rN�foo)�_document_with_doctype�contentsrr>r�str�len�p)r�doctype_fragmentZdoctype_strr�doctyper r r�assertDoctypeHandled^s z-HTMLTreeBuilderSmokeTest.assertDoctypeHandledcCs"d|}|d}|j|�}||fS)z5Generate and parse a document with the given doctype.z z

foo

)r)rrIrJrrr r rrDls z/HTMLTreeBuilderSmokeTest._document_with_doctypecCs|jd�|jd�dS)z?Make sure normal, everyday HTML doctypes are handled correctly.�htmlz4html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"N)rK)rr r r�test_normal_doctypesss z-HTMLTreeBuilderSmokeTest.test_normal_doctypescCs(|jd�}|jd}|jd|j��dS)Nz rr5)rrEr�strip)rrrJr r r�test_empty_doctypeys z+HTMLTreeBuilderSmokeTest.test_empty_doctypecCsd}|j|�dS)Nznhtml PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd")rK)rrJr r r�test_public_doctype_with_url~sz5HTMLTreeBuilderSmokeTest.test_public_doctype_with_urlcCs|jd�dS)Nz$foo SYSTEM "http://www.example.com/")rK)rr r r�test_system_doctype�sz,HTMLTreeBuilderSmokeTest.test_system_doctypecCs|jd�dS)Nz#xsl:stylesheet SYSTEM "htmlent.dtd")rK)rr r r�test_namespaced_system_doctype�sz7HTMLTreeBuilderSmokeTest.test_namespaced_system_doctypecCs|jd�dS)Nz#xsl:stylesheet PUBLIC "htmlent.dtd")rK)rr r r�test_namespaced_public_doctype�sz7HTMLTreeBuilderSmokeTest.test_namespaced_public_doctypecCs4d}|j|�}|j|jd�jdd�|jdd��dS)zJA real XHTML document should come out more or less the same as it went in.s� Hello. Goodbye. zutf-8� �N)rr�encode�replace)rrrr r r�test_real_xhtml_document�s z1HTMLTreeBuilderSmokeTest.test_real_xhtml_documentcCs(d}|j|�}|jdt|jd��dS)ztWhen a namespaced XML document is parsed as HTML it should be treated as HTML with weird tag names. s.contentr:zns1:fooN)rrrG�find_all)rrrr r r�test_namespaced_html�s z-HTMLTreeBuilderSmokeTest.test_namespaced_htmlcCsBd}|j|�}|j||j��d}|j|�}|j||jd��dS)Nzs�utf8)rrrrV)rrrr r r�test_processing_instruction�s z4HTMLTreeBuilderSmokeTest.test_processing_instructioncCstj|j�dS)z�Make sure you can copy the tree builder. This is important because the builder is part of a BeautifulSoup object, and we want to be able to copy that. N)�copy�deepcopyr)rr r r� test_deepcopy�sz&HTMLTreeBuilderSmokeTest.test_deepcopycCs.|jd�}|j|jj�|jt|j�d�dS)z�A
tag is never designated as an empty-element tag. Even if the markup shows it as an empty-element tag, it shouldn't be presented that way. z
z
N)rZassertFalserHr7rrF)rrr r r�!test_p_tag_is_never_empty_element�s z:HTMLTreeBuilderSmokeTest.test_p_tag_is_never_empty_elementcCs(|jdd�|jdd�|jdd�dS)z�A tag that's not closed by the end of the document should be closed. This applies to all tags except empty-element tags. z
z
zzz
z
N)r)rr r r�test_unclosed_tags_get_closed�sz6HTMLTreeBuilderSmokeTest.test_unclosed_tags_get_closedcCs.|jd�}|j|jj�|jt|j�d�dS)z�A
tag is designated as an empty-element tag. Some parsers treat

as one
tag, some parsers as two tags, but it should always be an empty-element tag. z

z
N)r� assertTruer%r7rrF)rrr r r�#test_br_is_always_empty_element_tag�s z)r)rr r r�test_nested_formatting_elements�sz8HTMLTreeBuilderSmokeTest.test_nested_formatting_elementscCs(d}|j|�}|jd|jd�d�dS)Nz� Ordinary HEAD element test Hello, world! ztext/javascript�script�type)rr�find)rrLrr r r�test_double_head�s z)HTMLTreeBuilderSmokeTest.test_double_headcCsjd}|j|�|j|�}|jdd�}|j|jt�|jdd�}|j||j�|jdd�}|j||j�dS)Nz
foobaz
Zfoobar)�textrC�baz)rrrgrr>rrr)rrrZcommentrCrjr r r�test_comment�s z%HTMLTreeBuilderSmokeTest.test_commentcCstd}d}|j|�|j|�|j|�}|j|jj�|�|j|�}|j|jj�|�|jd�}|j|jj�d�dS)zWhitespace must be preserved in
and tags, even if that would mean not prettifying the markup. z<pre> </pre>z<textarea> woo woo zN)rrrZpreZprettifyZtextarea)rZ pre_markupZtextarea_markuprr r r�-test_preserved_whitespace_in_pre_and_textarea�s zFHTMLTreeBuilderSmokeTest.test_preserved_whitespace_in_pre_and_textareacCs.d}|j|�d}|j|�d}|j|�dS)z+Inline elements can be nested indefinitely.zInside a B tagz!
A nested tag
z/
A doubly nested tag
N)r)rZb_tagZnested_b_tagZdouble_nested_b_tagr r r�test_nested_inline_elements s z4HTMLTreeBuilderSmokeTest.test_nested_inline_elementscCs6|jd�}|j}|j|jjjd�|j|jjd�dS)zBlock elements can be nested.z*
Foo
ZFooN)r� blockquoterrH�b�string)rrrnr r r� test_nested_block_level_elementss z9HTMLTreeBuilderSmokeTest.test_nested_block_level_elementscCsd}|j|d�|jd�dS)z$One table can go inside another one.z[zh
Here's another table:
foo
Here's another table:
foo
z{
Foo
Bar
Baz
N)r)rrr r r�test_correctly_nested_tablessz5HTMLTreeBuilderSmokeTest.test_correctly_nested_tablescCs(d}|j|�}|jdg|jjd�dS)Nz1
Zcss�class)rrZdiv)rrrr r r�(test_deeply_nested_multivalued_attribute0s zAHTMLTreeBuilderSmokeTest.test_deeply_nested_multivalued_attributecCs(d}|j|�}|jddg|jd�dS)Nz�arors)rrrL)rrrr r r�"test_multivalued_attribute_on_html8s z;HTMLTreeBuilderSmokeTest.test_multivalued_attribute_on_htmlcCs|jdd�dS)Nzz)r)rr r r�3test_angle_brackets_in_attribute_values_are_escaped@szLHTMLTreeBuilderSmokeTest.test_angle_brackets_in_attribute_values_are_escapedcCs|jdd�dS)Nz$
• AT&T is in the s&p 500
z,
\u2022 AT&T is in the s&p 500
)r)rr r r�3test_strings_resembling_character_entity_referencesCszLHTMLTreeBuilderSmokeTest.test_strings_resembling_character_entity_referencescCs"d}|j|�}|jd|jj�dS)Nz%
“Hello” -☃
u“Hello” -☃)rrrHrp)rrrr r r�*test_entities_in_foreign_document_encodingKs zCHTMLTreeBuilderSmokeTest.test_entities_in_foreign_document_encodingcCs8d}|jd|�|jd|�|jd|�|jd|�dS)Nu
z
z
z
z
)r)r�expectr r r�0test_entities_in_attributes_converted_to_unicodeWs zIHTMLTreeBuilderSmokeTest.test_entities_in_attributes_converted_to_unicodecCs8d}|jd|�|jd|�|jd|�|jd|�dS)Nu
piñata
z
piñata
z
piñata
z
piñata
z
piñata
)r)rrzr r r�*test_entities_in_text_converted_to_unicode^s zCHTMLTreeBuilderSmokeTest.test_entities_in_text_converted_to_unicodecCs|jdd�dS)Nz#
I said "good day!"
z
I said "good day!"
)r)rr r r�,test_quot_entity_converted_to_quotation_markeszEHTMLTreeBuilderSmokeTest.test_quot_entity_converted_to_quotation_markcCs,d}|jd|�|jd|�|jd|�dS)Nu�z�z�z �)r)rrzr r r�test_out_of_range_entityisz1HTMLTreeBuilderSmokeTest.test_out_of_range_entitycCs<|jd�}|jd|jjjj�|jd|jj�|j|�dS)zDMostly to prevent a recurrence of a bug in the html5lib treebuilder.z!
foo
rHN)rrZh2rprr8rHr)rrr r r�test_multipart_stringsos z/HTMLTreeBuilderSmokeTest.test_multipart_stringscCs|jdd�|jdd�dS)zqVerify consistent handling of empty-element tags, no matter how they come in through the markup. z

z

N)r)rr r rr9vscCs,d}|j|�}|jd|jj�|j|�dS)z8Prevent recurrence of a bug in the html5lib treebuilder.z? foo N)rZassertNotEqualrL�bodyr)r�contentrr r r�#test_head_tag_between_head_and_body}s z

N)rrZarticle)rr�rr r r�test_multiple_copies_of_a_tag�s z6HTMLTreeBuilderSmokeTest.test_multiple_copies_of_a_tagcCs^d}|j|�}|j||j��|j}|jd|jd�|jd|jd�|jd|jd�dS) z�Parsers don't need to *understand* namespaces, but at the very least they should not choke on namespaces or lose data.s�4zhttp://www.w3.org/1999/xhtmlZxmlnsz"http://www.w3.org/1998/Math/MathMLzxmlns:mathmlzhttp://www.w3.org/2000/svgz xmlns:svgN)rrrVrL)rrrrLr r r�test_basic_namespaces�s z.HTMLTreeBuilderSmokeTest.test_basic_namespacescCs(d}|j|�}|jddg|jd�dS)NsrC�barrs)rrru)rrrr r r�-test_multivalued_attribute_value_becomes_list�s zFHTMLTreeBuilderSmokeTest.test_multivalued_attribute_value_becomes_listcCs"d}|j|�}|jd|jj�dS)NuDSacré bleu!uSacré bleu!)rrr�rp)rrrr r r�test_can_parse_unicode_document�s z8HTMLTreeBuilderSmokeTest.test_can_parse_unicode_documentcCs*td�}|jd|d�}|j|j�d�dS)z2Parsers should be able to work with SoupStrainers.roz&A bold statement)Z parse_onlyzboldN)rrrr)rZstrainerrr r r�test_soupstrainer�sz*HTMLTreeBuilderSmokeTest.test_soupstrainercCs|jdd�dS)Nzz)r)rr r r�7test_single_quote_attribute_values_become_double_quotes�szPHTMLTreeBuilderSmokeTest.test_single_quote_attribute_values_become_double_quotescCsd}|j|�dS)Nz'a)r)rrir r r�7test_attribute_values_with_nested_quotes_are_left_alone�szPHTMLTreeBuilderSmokeTest.test_attribute_values_with_nested_quotes_are_left_alonecCs.d}|j|�}d|jd<|j|jj�d�dS)Nz'azBrawls happen at "Bob's Bar"�attrz:a)rrCrr)rrirr r r�:test_attribute_values_with_double_nested_quotes_get_quoted�s zSHTMLTreeBuilderSmokeTest.test_attribute_values_with_double_nested_quotes_get_quotedcCs|jdd�|jdd�dS)Nz+z/z.fooz2foo)r)rr r r�.test_ampersand_in_attribute_value_gets_escaped�s zGHTMLTreeBuilderSmokeTest.test_ampersand_in_attribute_value_gets_escapedcCs|jd�dS)Nz/)r)rr r r�7test_escaped_ampersand_in_attribute_value_is_left_alone�szPHTMLTreeBuilderSmokeTest.test_escaped_ampersand_in_attribute_value_is_left_alonecCsd}d}|j||�dS)Nz-
<<sacré bleu!>>
u#
<<sacré bleu!>>
)r)rri�expectedr r r�1test_entities_in_strings_converted_during_parsing�szJHTMLTreeBuilderSmokeTest.test_entities_in_strings_converted_during_parsingcCs"d}|j|�}|j|jjd�dS)Ns
�Foo�
u ‘Foo’)rrrHrp)rZquoterr r r�)test_smart_quotes_converted_on_the_way_in�s zBHTMLTreeBuilderSmokeTest.test_smart_quotes_converted_on_the_way_incCs|jd�}|j|jjd�dS)Nz � r:u )rrrurp)rrr r r�0test_non_breaking_spaces_converted_on_the_way_in�s zIHTMLTreeBuilderSmokeTest.test_non_breaking_spaces_converted_on_the_way_incCs0d}djd�}|j|�}|j|jjd�|�dS)Nz-
<<sacré bleu!>>
u#
<<sacré bleu!>>
zutf-8)rVrrrH)rrir�rr r r�&test_entities_converted_on_the_way_out�s z?HTMLTreeBuilderSmokeTest.test_entities_converted_on_the_way_outcCsHd}|jd�}|j|�}|jd�}|jdd�}|jd�}|j||�dS)Nu�
Sacré bleu!
z iso-8859-1zutf-8zISO-Latin-1)rVrrWr)r�unicode_htmlZiso_latin_htmlr�resultr�r r r�test_real_iso_latin_document�s z5HTMLTreeBuilderSmokeTest.test_real_iso_latin_documentcCsLd}|jd�}|j|�}|j|jd�|jd��|j|jd�|jd��dS)Nsk
��Shift-JIS�ŃR�[�f�B��O��ꂽ��{��̃t�@�C��ł��B
z shift-jiszutf-8�euc_jp)rrrrV)r�shift_jis_htmlr�rr r r�test_real_shift_jis_documents z5HTMLTreeBuilderSmokeTest.test_real_shift_jis_documentcCs4d}|j|dd�}|j|jd�|jd�jd��dS)Ns�Hebrew (ISO 8859-8) in Visual Directionality
Hebrew (ISO 8859-8) in Visual Directionality
��z iso8859-8)Z from_encodingzutf-8)rrrVr)rZhebrew_documentrr r r�test_real_hebrew_document$s z2HTMLTreeBuilderSmokeTest.test_real_hebrew_documentcCs`d}d|}|j|�}|jdddi�}|d}|jd|�|jt|t��|jd|jd ��dS) NzEzj %s Shift-JIS markup goes here.r.z http-equivzContent-typer�ztext/html; charset=x-sjisztext/html; charset=utf8r[)rrgrrb� isinstancerrV)r�meta_tagr�r�parsed_metar�r r r�'test_meta_tag_reflects_current_encoding1s z@HTMLTreeBuilderSmokeTest.test_meta_tag_reflects_current_encodingcCs^d}d|}|j|�}|jddd�}|d}|jd|�|jt|t��|jd|jd��dS) Nz'zj %s Shift-JIS markup goes here.r.�encoding)�id�charsetzx-sjisr[)rrgrrbr�rrV)rr�r�rr�r�r r r�3test_html5_style_meta_tag_reflects_current_encodingMs zLHTMLTreeBuilderSmokeTest.test_html5_style_meta_tag_reflects_current_encodingcCs*|jd�}d|jd<|jd|jj��dS)Nztextr�rCztext)rrurr)r�datar r r�5test_tag_with_no_attributes_can_have_attributes_addedes zNHTMLTreeBuilderSmokeTest.test_tag_with_no_attributes_can_have_attributes_addedN);rrr �__doc__r9rBrKrDrMrOrPrQrRrSrXrZr\r_r`rarcrdrhrkrlrmrqrrrtrvrwrxryr{r|r}r~rr�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r r r rr"?sr r"c@s�eZdZdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�Zdd�Zdd �Zd!d"�Zd#d$�Zd%S)&�XMLTreeBuilderSmokeTestcCsF|jd�}tj|d�}tj|�}|j|jt�|j|j�|j��dS)Nz foor:)rr;r<r=rr>rr)rr?r@rAr r rrBls z9XMLTreeBuilderSmokeTest.test_pickle_and_unpickle_identitycCs|jd�}|j|j�d�dS)Nzs. )rrrV)rrr r r�test_docstring_generatedus z0XMLTreeBuilderSmokeTest.test_docstring_generatedcCs$d}|j|�}|j||jd��dS)Ns, r[)rrrV)rrrr r r�test_xml_declarationzs z,XMLTreeBuilderSmokeTest.test_xml_declarationcCs$d}|j|�}|j||jd��dS)Ns< r[)rrrV)rrrr r rr\s z3XMLTreeBuilderSmokeTest.test_processing_instructioncCs$d}|j|�}|j|jd�|�dS)zGA real XHTML document should come out *exactly* the same as it went in.s� Hello. Goodbye. zutf-8N)rrrV)rrrr r rrX�s z0XMLTreeBuilderSmokeTest.test_real_xhtml_documentcCs"d}|j|�}|j||j��dS)Ns )rrrV)r�docrr r r�test_nested_namespaces�s z.XMLTreeBuilderSmokeTest.test_nested_namespacescCs0d}t|d�}d|j_|j�}|jd|k�dS)Nz/ zlxml-xmlzconsole.log("< < hey > > ");s< < hey > >)rrerprVrb)rr�rZencodedr r r�5test_formatter_processes_script_tag_for_xml_documents�s zMXMLTreeBuilderSmokeTest.test_formatter_processes_script_tag_for_xml_documentscCs"d}|j|�}|jd|jj�dS)Nu?Sacré bleu!uSacré bleu!)rr�rootrp)rrrr r rr��s z7XMLTreeBuilderSmokeTest.test_can_parse_unicode_documentcCs$d}|j|�}|jt|j�|�dS)Nz�b2012-07-02T20:33:42Zcd)rrrFZrss)rrrr r r�test_popping_namespaced_tag�s z3XMLTreeBuilderSmokeTest.test_popping_namespaced_tagcCs |jd�}|j|jd�d�dS)Nz�latin1s/ )rrrV)rrr r r�(test_docstring_includes_correct_encoding�s z@XMLTreeBuilderSmokeTest.test_docstring_includes_correct_encodingcCs0dddd}|j|�}|j|jd�|�dS) z �0r:�szutf-8Ni)rrrV)rrrr r r�test_large_xml_document�s z/XMLTreeBuilderSmokeTest.test_large_xml_documentcCs|jdd�|jd�dS)Nz
z
z
foo
)r)rr r r�9test_tags_are_empty_element_if_and_only_if_they_are_empty�szQXMLTreeBuilderSmokeTest.test_tags_are_empty_element_if_and_only_if_they_are_emptycCs8d}|j|�}|j}|jd|d�|jd|d�dS)Nz�This tag is in the a namespaceThis tag is in the b namespacezhttp://example.com/zxmlns:azhttp://example.net/zxmlns:b)rr�r)rrrr�r r r�test_namespaces_are_preserved�s z5XMLTreeBuilderSmokeTest.test_namespaces_are_preservedcCs$d}|j|�}|jt|j�|�dS)NzN
20010504
)rrrFrH)rrrr r r�test_closing_namespaced_tag�s z3XMLTreeBuilderSmokeTest.test_closing_namespaced_tagcCs$d}|j|�}|jt|j�|�dS)Nzs)rrrFrC)rrrr r r�test_namespaced_attributes�s z2XMLTreeBuilderSmokeTest.test_namespaced_attributescCs$d}|j|�}|jt|j�|�dS)Nzbar)rrrFrC)rrrr r r�(test_namespaced_attributes_xml_namespace�s z@XMLTreeBuilderSmokeTest.test_namespaced_attributes_xml_namespacecCs�d}|j|�}|jdt|jd��|jdt|jd��|jdt|jd��|jdt|jddd ��|jdt|jddg��dS) Na foo bar baz ��tagr:zns1:tag�zns2:tag�value)�key)rrrGrY)rr�rr r r�test_find_by_prefixed_name�s z2XMLTreeBuilderSmokeTest.test_find_by_prefixed_namecCs2d}|j|�}|j}tj|�}|j|j|j�dS)Nzf )rZdocumentr]r�prefix)rZxmlrr�Z duplicater r r�!test_copy_tag_preserves_namespace�s z9XMLTreeBuilderSmokeTest.test_copy_tag_preserves_namespaceN)rrr rBr�r�r\rXr�r�r�r�r�r�r�r�r�r�r�r�r�r r r rr�js$ r�c@s8eZdZdZdd�Zdd�Zdd�Zdd �Zd d�ZdS) �HTML5TreeBuilderSmokeTestz2Smoke test for a tree builder that supports HTML5.cCsdS)Nr )rr r rrXsz2HTML5TreeBuilderSmokeTest.test_real_xhtml_documentcCs"d}|j|�}|jd|jj�dS)Nz zhttp://www.w3.org/1999/xhtml)rrru� namespace)rrrr r r�test_html_tags_have_namespaces z7HTML5TreeBuilderSmokeTest.test_html_tags_have_namespacecCs6d}|j|�}d}|j||jj�|j||jj�dS)Nzzhttp://www.w3.org/2000/svg)rrZsvgr�Zcircle)rrrr�r r r�test_svg_tags_have_namespace s z6HTML5TreeBuilderSmokeTest.test_svg_tags_have_namespacecCs6d}|j|�}d}|j||jj�|j||jj�dS)Nz $\sqrt{5}$ z"http://www.w3.org/1998/Math/MathML)rrZmathr�Zmsqrt)rrrr�r r r�test_mathml_tags_have_namespaces z9HTML5TreeBuilderSmokeTest.test_mathml_tags_have_namespacecCsPd}|j|�}|jt|jdt��|j|jdd�|jd|jdjj�dS)Nz3rz$?xml version="1.0" encoding="utf-8"?rL)rrbr�rErrrr8)rrrr r r�$test_xml_declaration_becomes_comments z>HTML5TreeBuilderSmokeTest.test_xml_declaration_becomes_commentN) rrr r�rXr�r�r�r�r r r rr��sr�csdd��fdd�}|S)Nc_sdS)Nr )Ztest�argsrr r r�nothing!szskipIf..nothingcs�r�S|SdS)Nr )Z test_item)� conditionr�r r� decorator$szskipIf..decoratorr )r��reasonr�r )r�r�r�skipIf sr�)r�Z__license__r;r]� functoolsZunittestrZbs4rZbs4.elementrrrrrZbs4.builderr rr �objectr"r�r�r�r r r r�s(%/#PK�je[�{i��"__pycache__/element.cpython-36.pycnu�[��3 &6]$�@s dZyddlmZWn.ek rBZzddlmZWYddZ[XnXddlZddlZddlZddl Z ddl mZdZej ddkZejd�Zdd �ZGd d�de�ZGdd �d e�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGd d!�d!e�ZGd"d#�d#ee�Z Gd$d%�d%e �Z!Gd&d'�d'e!�Z"Gd(d)�d)e!�Z#Gd*d+�d+e#�Z$Gd,d-�d-e!�Z%Gd.d/�d/e!�Z&Gd0d1�d1e!�Z'Gd2d3�d3e�Z(Gd4d5�d5e�Z)Gd6d7�d7e*�Z+dS)8ZMIT�)�CallableN)�EntitySubstitutionzutf-8�z\s+cs&t�fdd��}|j�fdd��}|S)z>Alias one attribute name to another for backward compatibilitycs t|��S)N)�getattr)�self)�attr��/usr/lib/python3.6/element.py�aliassz_alias..aliascs t|��S)N)�setattr)r)rrr r s)�property�setter)rr r)rr �_aliassrc@seZdZddd�ZdS)�NamespacedAttributeNcCsV|dkrtj||�}n*|dkr,tj||�}ntj||d|�}||_||_||_|S)N�:)�str�__new__�prefix�name� namespace)�clsrrr�objrrr r"szNamespacedAttribute.__new__)N)�__name__� __module__�__qualname__rrrrr r src@seZdZdZdS)�%AttributeValueWithCharsetSubstitutionz=A stand-in object for a character encoding specified in HTML.N)rrr�__doc__rrrr r/src@s eZdZdZdd�Zdd�ZdS)�CharsetMetaAttributeValuez�A generic stand-in for the value of a meta tag's 'charset' attribute. When Beautiful Soup parses the markup '', the value of the 'charset' attribute will be one of these objects. cCstj||�}||_|S)N)rr�original_value)rrrrrr r9sz!CharsetMetaAttributeValue.__new__cCs|S)Nr)r�encodingrrr �encode>sz CharsetMetaAttributeValue.encodeN)rrrrrr rrrr r2src@s.eZdZdZejdej�Zdd�Zdd�Z dS)�ContentMetaAttributeValueaA generic stand-in for the value of a meta tag's 'content' attribute. When Beautiful Soup parses the markup: The value of the 'content' attribute will be one of these objects. z((^|;)\s*charset=)([^;]*)cCs6|jj|�}|dkr tjt|�Stj||�}||_|S)N)� CHARSET_RE�searchrrr)rr�matchrrrr rMsz!ContentMetaAttributeValue.__new__cs�fdd�}|jj||j�S)Ncs|jd��S)N�)�group)r$)rrr �rewriteXsz1ContentMetaAttributeValue.encode..rewrite)r"�subr)rrr'r)rr r Wsz ContentMetaAttributeValue.encodeN) rrrr�re�compile�Mr"rr rrrr r!Bs r!c@sVeZdZdZeddg�Zedg�Zeddg�Zedd��Z edd ��Z ed d��ZdS) �HTMLAwareEntitySubstitutiona%Entity substitution rules that are aware of some HTML quirks. Specifically, the contents of Hello, world! ztext/javascript�script�type)rr�find)rrLrr r r�test_double_head�s z)HTMLTreeBuilderSmokeTest.test_double_headcCsjd}|j|�|j|�}|jdd�}|j|jt�|jdd�}|j||j�|jdd�}|j||j�dS)Nz
foobaz
Zfoobar)�textrC�baz)rrrgrr>rrr)rrrZcommentrCrjr r r�test_comment�s z%HTMLTreeBuilderSmokeTest.test_commentcCstd}d}|j|�|j|�|j|�}|j|jj�|�|j|�}|j|jj�|�|jd�}|j|jj�d�dS)zWhitespace must be preserved in
and tags, even if that would mean not prettifying the markup. z<pre> </pre>z<textarea> woo woo zN)rrrZpreZprettifyZtextarea)rZ pre_markupZtextarea_markuprr r r�-test_preserved_whitespace_in_pre_and_textarea�s zFHTMLTreeBuilderSmokeTest.test_preserved_whitespace_in_pre_and_textareacCs.d}|j|�d}|j|�d}|j|�dS)z+Inline elements can be nested indefinitely.zInside a B tagz!
A nested tag
z/
A doubly nested tag
N)r)rZb_tagZnested_b_tagZdouble_nested_b_tagr r r�test_nested_inline_elements s z4HTMLTreeBuilderSmokeTest.test_nested_inline_elementscCs6|jd�}|j}|j|jjjd�|j|jjd�dS)zBlock elements can be nested.z*
Foo
ZFooN)r� blockquoterrH�b�string)rrrnr r r� test_nested_block_level_elementss z9HTMLTreeBuilderSmokeTest.test_nested_block_level_elementscCsd}|j|d�|jd�dS)z$One table can go inside another one.z[zh
Here's another table:
foo
Here's another table:
foo
z{
Foo
Bar
Baz
N)r)rrr r r�test_correctly_nested_tablessz5HTMLTreeBuilderSmokeTest.test_correctly_nested_tablescCs(d}|j|�}|jdg|jjd�dS)Nz1
Zcss�class)rrZdiv)rrrr r r�(test_deeply_nested_multivalued_attribute0s zAHTMLTreeBuilderSmokeTest.test_deeply_nested_multivalued_attributecCs(d}|j|�}|jddg|jd�dS)Nz�arors)rrrL)rrrr r r�"test_multivalued_attribute_on_html8s z;HTMLTreeBuilderSmokeTest.test_multivalued_attribute_on_htmlcCs|jdd�dS)Nzz)r)rr r r�3test_angle_brackets_in_attribute_values_are_escaped@szLHTMLTreeBuilderSmokeTest.test_angle_brackets_in_attribute_values_are_escapedcCs|jdd�dS)Nz$
• AT&T is in the s&p 500
z,
\u2022 AT&T is in the s&p 500
)r)rr r r�3test_strings_resembling_character_entity_referencesCszLHTMLTreeBuilderSmokeTest.test_strings_resembling_character_entity_referencescCs"d}|j|�}|jd|jj�dS)Nz%
“Hello” -☃
u“Hello” -☃)rrrHrp)rrrr r r�*test_entities_in_foreign_document_encodingKs zCHTMLTreeBuilderSmokeTest.test_entities_in_foreign_document_encodingcCs8d}|jd|�|jd|�|jd|�|jd|�dS)Nu
z
z
z
z
)r)r�expectr r r�0test_entities_in_attributes_converted_to_unicodeWs zIHTMLTreeBuilderSmokeTest.test_entities_in_attributes_converted_to_unicodecCs8d}|jd|�|jd|�|jd|�|jd|�dS)Nu
piñata
z
piñata
z
piñata
z
piñata
z
piñata
)r)rrzr r r�*test_entities_in_text_converted_to_unicode^s zCHTMLTreeBuilderSmokeTest.test_entities_in_text_converted_to_unicodecCs|jdd�dS)Nz#
I said "good day!"
z
I said "good day!"
)r)rr r r�,test_quot_entity_converted_to_quotation_markeszEHTMLTreeBuilderSmokeTest.test_quot_entity_converted_to_quotation_markcCs,d}|jd|�|jd|�|jd|�dS)Nu�z�z�z �)r)rrzr r r�test_out_of_range_entityisz1HTMLTreeBuilderSmokeTest.test_out_of_range_entitycCs<|jd�}|jd|jjjj�|jd|jj�|j|�dS)zDMostly to prevent a recurrence of a bug in the html5lib treebuilder.z!
foo
rHN)rrZh2rprr8rHr)rrr r r�test_multipart_stringsos z/HTMLTreeBuilderSmokeTest.test_multipart_stringscCs|jdd�|jdd�dS)zqVerify consistent handling of empty-element tags, no matter how they come in through the markup. z

z

N)r)rr r rr9vscCs,d}|j|�}|jd|jj�|j|�dS)z8Prevent recurrence of a bug in the html5lib treebuilder.z? foo N)rZassertNotEqualrL�bodyr)r�contentrr r r�#test_head_tag_between_head_and_body}s z

N)rrZarticle)rr�rr r r�test_multiple_copies_of_a_tag�s z6HTMLTreeBuilderSmokeTest.test_multiple_copies_of_a_tagcCs^d}|j|�}|j||j��|j}|jd|jd�|jd|jd�|jd|jd�dS) z�Parsers don't need to *understand* namespaces, but at the very least they should not choke on namespaces or lose data.s�4zhttp://www.w3.org/1999/xhtmlZxmlnsz"http://www.w3.org/1998/Math/MathMLzxmlns:mathmlzhttp://www.w3.org/2000/svgz xmlns:svgN)rrrVrL)rrrrLr r r�test_basic_namespaces�s z.HTMLTreeBuilderSmokeTest.test_basic_namespacescCs(d}|j|�}|jddg|jd�dS)NsrC�barrs)rrru)rrrr r r�-test_multivalued_attribute_value_becomes_list�s zFHTMLTreeBuilderSmokeTest.test_multivalued_attribute_value_becomes_listcCs"d}|j|�}|jd|jj�dS)NuDSacré bleu!uSacré bleu!)rrr�rp)rrrr r r�test_can_parse_unicode_document�s z8HTMLTreeBuilderSmokeTest.test_can_parse_unicode_documentcCs*td�}|jd|d�}|j|j�d�dS)z2Parsers should be able to work with SoupStrainers.roz&A bold statement)Z parse_onlyzboldN)rrrr)rZstrainerrr r r�test_soupstrainer�sz*HTMLTreeBuilderSmokeTest.test_soupstrainercCs|jdd�dS)Nzz)r)rr r r�7test_single_quote_attribute_values_become_double_quotes�szPHTMLTreeBuilderSmokeTest.test_single_quote_attribute_values_become_double_quotescCsd}|j|�dS)Nz'a)r)rrir r r�7test_attribute_values_with_nested_quotes_are_left_alone�szPHTMLTreeBuilderSmokeTest.test_attribute_values_with_nested_quotes_are_left_alonecCs.d}|j|�}d|jd<|j|jj�d�dS)Nz'azBrawls happen at "Bob's Bar"�attrz:a)rrCrr)rrirr r r�:test_attribute_values_with_double_nested_quotes_get_quoted�s zSHTMLTreeBuilderSmokeTest.test_attribute_values_with_double_nested_quotes_get_quotedcCs|jdd�|jdd�dS)Nz+z/z.fooz2foo)r)rr r r�.test_ampersand_in_attribute_value_gets_escaped�s zGHTMLTreeBuilderSmokeTest.test_ampersand_in_attribute_value_gets_escapedcCs|jd�dS)Nz/)r)rr r r�7test_escaped_ampersand_in_attribute_value_is_left_alone�szPHTMLTreeBuilderSmokeTest.test_escaped_ampersand_in_attribute_value_is_left_alonecCsd}d}|j||�dS)Nz-
<<sacré bleu!>>
u#
<<sacré bleu!>>
)r)rri�expectedr r r�1test_entities_in_strings_converted_during_parsing�szJHTMLTreeBuilderSmokeTest.test_entities_in_strings_converted_during_parsingcCs"d}|j|�}|j|jjd�dS)Ns
�Foo�
u ‘Foo’)rrrHrp)rZquoterr r r�)test_smart_quotes_converted_on_the_way_in�s zBHTMLTreeBuilderSmokeTest.test_smart_quotes_converted_on_the_way_incCs|jd�}|j|jjd�dS)Nz � r:u )rrrurp)rrr r r�0test_non_breaking_spaces_converted_on_the_way_in�s zIHTMLTreeBuilderSmokeTest.test_non_breaking_spaces_converted_on_the_way_incCs0d}djd�}|j|�}|j|jjd�|�dS)Nz-
<<sacré bleu!>>
u#
<<sacré bleu!>>
zutf-8)rVrrrH)rrir�rr r r�&test_entities_converted_on_the_way_out�s z?HTMLTreeBuilderSmokeTest.test_entities_converted_on_the_way_outcCsHd}|jd�}|j|�}|jd�}|jdd�}|jd�}|j||�dS)Nu�
Sacré bleu!
z iso-8859-1zutf-8zISO-Latin-1)rVrrWr)r�unicode_htmlZiso_latin_htmlr�resultr�r r r�test_real_iso_latin_document�s z5HTMLTreeBuilderSmokeTest.test_real_iso_latin_documentcCsLd}|jd�}|j|�}|j|jd�|jd��|j|jd�|jd��dS)Nsk
��Shift-JIS�ŃR�[�f�B��O��ꂽ��{��̃t�@�C��ł��B
z shift-jiszutf-8�euc_jp)rrrrV)r�shift_jis_htmlr�rr r r�test_real_shift_jis_documents z5HTMLTreeBuilderSmokeTest.test_real_shift_jis_documentcCsBd}|j|dd�}|jdks t�|j|jd�|jd�jd��dS)Ns�Hebrew (ISO 8859-8) in Visual Directionality
Hebrew (ISO 8859-8) in Visual Directionality
�� iso8859-8)Z from_encoding� iso-8859-8zutf-8)r�r�)rZoriginal_encoding�AssertionErrorrrVr)rZhebrew_documentrr r r�test_real_hebrew_document$s z2HTMLTreeBuilderSmokeTest.test_real_hebrew_documentcCs`d}d|}|j|�}|jdddi�}|d}|jd|�|jt|t��|jd|jd ��dS) NzEzj %s Shift-JIS markup goes here.r.z http-equivzContent-typer�ztext/html; charset=x-sjisztext/html; charset=utf8r[)rrgrrb� isinstancerrV)r�meta_tagr�r�parsed_metar�r r r�'test_meta_tag_reflects_current_encoding1s z@HTMLTreeBuilderSmokeTest.test_meta_tag_reflects_current_encodingcCs^d}d|}|j|�}|jddd�}|d}|jd|�|jt|t��|jd|jd��dS) Nz'zj %s Shift-JIS markup goes here.r.�encoding)�id�charsetzx-sjisr[)rrgrrbr�rrV)rr�r�rr�r�r r r�3test_html5_style_meta_tag_reflects_current_encodingMs zLHTMLTreeBuilderSmokeTest.test_html5_style_meta_tag_reflects_current_encodingcCs*|jd�}d|jd<|jd|jj��dS)Nztextr�rCztext)rrurr)r�datar r r�5test_tag_with_no_attributes_can_have_attributes_addedes zNHTMLTreeBuilderSmokeTest.test_tag_with_no_attributes_can_have_attributes_addedN);rrr �__doc__r9rBrKrDrMrOrPrQrRrSrXrZr\r_r`rarcrdrhrkrlrmrqrrrtrvrwrxryr{r|r}r~rr�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r�r r r rr"?sr r"c@s�eZdZdd�Zdd�Zdd�Zdd�Zd d �Zdd�Zd d�Z dd�Z dd�Zdd�Zdd�Z dd�Zdd�Zdd�Zdd�Zdd �Zd!d"�Zd#d$�Zd%S)&�XMLTreeBuilderSmokeTestcCsF|jd�}tj|d�}tj|�}|j|jt�|j|j�|j��dS)Nz foor:)rr;r<r=rr>rr)rr?r@rAr r rrBls z9XMLTreeBuilderSmokeTest.test_pickle_and_unpickle_identitycCs|jd�}|j|j�d�dS)Nzs. )rrrV)rrr r r�test_docstring_generatedus z0XMLTreeBuilderSmokeTest.test_docstring_generatedcCs$d}|j|�}|j||jd��dS)Ns, r[)rrrV)rrrr r r�test_xml_declarationzs z,XMLTreeBuilderSmokeTest.test_xml_declarationcCs$d}|j|�}|j||jd��dS)Ns< r[)rrrV)rrrr r rr\s z3XMLTreeBuilderSmokeTest.test_processing_instructioncCs$d}|j|�}|j|jd�|�dS)zGA real XHTML document should come out *exactly* the same as it went in.s� Hello. Goodbye. zutf-8N)rrrV)rrrr r rrX�s z0XMLTreeBuilderSmokeTest.test_real_xhtml_documentcCs"d}|j|�}|j||j��dS)Ns )rrrV)r�docrr r r�test_nested_namespaces�s z.XMLTreeBuilderSmokeTest.test_nested_namespacescCs0d}t|d�}d|j_|j�}|jd|k�dS)Nz/ zlxml-xmlzconsole.log("< < hey > > ");s< < hey > >)rrerprVrb)rr�rZencodedr r r�5test_formatter_processes_script_tag_for_xml_documents�s zMXMLTreeBuilderSmokeTest.test_formatter_processes_script_tag_for_xml_documentscCs"d}|j|�}|jd|jj�dS)Nu?Sacré bleu!uSacré bleu!)rr�rootrp)rrrr r rr��s z7XMLTreeBuilderSmokeTest.test_can_parse_unicode_documentcCs$d}|j|�}|jt|j�|�dS)Nz�b2012-07-02T20:33:42Zcd)rrrFZrss)rrrr r r�test_popping_namespaced_tag�s z3XMLTreeBuilderSmokeTest.test_popping_namespaced_tagcCs |jd�}|j|jd�d�dS)Nz�latin1s/ )rrrV)rrr r r�(test_docstring_includes_correct_encoding�s z@XMLTreeBuilderSmokeTest.test_docstring_includes_correct_encodingcCs0dddd}|j|�}|j|jd�|�dS) z �0r:�szutf-8Ni)rrrV)rrrr r r�test_large_xml_document�s z/XMLTreeBuilderSmokeTest.test_large_xml_documentcCs|jdd�|jd�dS)Nz
z
z
foo
)r)rr r r�9test_tags_are_empty_element_if_and_only_if_they_are_empty�szQXMLTreeBuilderSmokeTest.test_tags_are_empty_element_if_and_only_if_they_are_emptycCs8d}|j|�}|j}|jd|d�|jd|d�dS)Nz�This tag is in the a namespaceThis tag is in the b namespacezhttp://example.com/zxmlns:azhttp://example.net/zxmlns:b)rr�r)rrrr�r r r�test_namespaces_are_preserved�s z5XMLTreeBuilderSmokeTest.test_namespaces_are_preservedcCs$d}|j|�}|jt|j�|�dS)NzN
20010504
)rrrFrH)rrrr r r�test_closing_namespaced_tag�s z3XMLTreeBuilderSmokeTest.test_closing_namespaced_tagcCs$d}|j|�}|jt|j�|�dS)Nzs)rrrFrC)rrrr r r�test_namespaced_attributes�s z2XMLTreeBuilderSmokeTest.test_namespaced_attributescCs$d}|j|�}|jt|j�|�dS)Nzbar)rrrFrC)rrrr r r�(test_namespaced_attributes_xml_namespace�s z@XMLTreeBuilderSmokeTest.test_namespaced_attributes_xml_namespacecCs�d}|j|�}|jdt|jd��|jdt|jd��|jdt|jd��|jdt|jddd ��|jdt|jddg��dS) Na foo bar baz ��tagr:zns1:tag�zns2:tag�value)�key)rrrGrY)rr�rr r r�test_find_by_prefixed_name�s z2XMLTreeBuilderSmokeTest.test_find_by_prefixed_namecCs2d}|j|�}|j}tj|�}|j|j|j�dS)Nzf )rZdocumentr]r�prefix)rZxmlrr�Z duplicater r r�!test_copy_tag_preserves_namespace�s z9XMLTreeBuilderSmokeTest.test_copy_tag_preserves_namespaceN)rrr rBr�r�r\rXr�r�r�r�r�r�r�r�r�r�r�r�r�r r r rr�js$ r�c@s8eZdZdZdd�Zdd�Zdd�Zdd �Zd d�ZdS) �HTML5TreeBuilderSmokeTestz2Smoke test for a tree builder that supports HTML5.cCsdS)Nr )rr r rrXsz2HTML5TreeBuilderSmokeTest.test_real_xhtml_documentcCs"d}|j|�}|jd|jj�dS)Nz zhttp://www.w3.org/1999/xhtml)rrru� namespace)rrrr r r�test_html_tags_have_namespaces z7HTML5TreeBuilderSmokeTest.test_html_tags_have_namespacecCs6d}|j|�}d}|j||jj�|j||jj�dS)Nzzhttp://www.w3.org/2000/svg)rrZsvgr�Zcircle)rrrr�r r r�test_svg_tags_have_namespace s z6HTML5TreeBuilderSmokeTest.test_svg_tags_have_namespacecCs6d}|j|�}d}|j||jj�|j||jj�dS)Nz $\sqrt{5}$ z"http://www.w3.org/1998/Math/MathML)rrZmathr�Zmsqrt)rrrr�r r r�test_mathml_tags_have_namespaces z9HTML5TreeBuilderSmokeTest.test_mathml_tags_have_namespacecCsPd}|j|�}|jt|jdt��|j|jdd�|jd|jdjj�dS)Nz3rz$?xml version="1.0" encoding="utf-8"?rL)rrbr�rErrrr8)rrrr r r�$test_xml_declaration_becomes_comments z>HTML5TreeBuilderSmokeTest.test_xml_declaration_becomes_commentN) rrr r�rXr�r�r�r�r r r rr��sr�csdd��fdd�}|S)Nc_sdS)Nr )Ztest�argsrr r r�nothing!szskipIf..nothingcs�r�S|SdS)Nr )Z test_item)� conditionr�r r� decorator$szskipIf..decoratorr )r��reasonr�r )r�r�r�skipIf sr�)r�Z__license__r;r]� functoolsZunittestrZbs4rZbs4.elementrrrrrZbs4.builderr rr �objectr"r�r�r�r r r r�s(%/#PK�je[�{i��(__pycache__/element.cpython-36.opt-1.pycnu�[��3 &6]$�@s dZyddlmZWn.ek rBZzddlmZWYddZ[XnXddlZddlZddlZddl Z ddl mZdZej ddkZejd�Zdd �ZGd d�de�ZGdd �d e�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGdd�de�ZGd d!�d!e�ZGd"d#�d#ee�Z Gd$d%�d%e �Z!Gd&d'�d'e!�Z"Gd(d)�d)e!�Z#Gd*d+�d+e#�Z$Gd,d-�d-e!�Z%Gd.d/�d/e!�Z&Gd0d1�d1e!�Z'Gd2d3�d3e�Z(Gd4d5�d5e�Z)Gd6d7�d7e*�Z+dS)8ZMIT�)�CallableN)�EntitySubstitutionzutf-8�z\s+cs&t�fdd��}|j�fdd��}|S)z>Alias one attribute name to another for backward compatibilitycs t|��S)N)�getattr)�self)�attr��/usr/lib/python3.6/element.py�aliassz_alias..aliascs t|��S)N)�setattr)r)rrr r s)�property�setter)rr r)rr �_aliassrc@seZdZddd�ZdS)�NamespacedAttributeNcCsV|dkrtj||�}n*|dkr,tj||�}ntj||d|�}||_||_||_|S)N�:)�str�__new__�prefix�name� namespace)�clsrrr�objrrr r"szNamespacedAttribute.__new__)N)�__name__� __module__�__qualname__rrrrr r src@seZdZdZdS)�%AttributeValueWithCharsetSubstitutionz=A stand-in object for a character encoding specified in HTML.N)rrr�__doc__rrrr r/src@s eZdZdZdd�Zdd�ZdS)�CharsetMetaAttributeValuez�A generic stand-in for the value of a meta tag's 'charset' attribute. When Beautiful Soup parses the markup '', the value of the 'charset' attribute will be one of these objects. cCstj||�}||_|S)N)rr�original_value)rrrrrr r9sz!CharsetMetaAttributeValue.__new__cCs|S)Nr)r�encodingrrr �encode>sz CharsetMetaAttributeValue.encodeN)rrrrrr rrrr r2src@s.eZdZdZejdej�Zdd�Zdd�Z dS)�ContentMetaAttributeValueaA generic stand-in for the value of a meta tag's 'content' attribute. When Beautiful Soup parses the markup: The value of the 'content' attribute will be one of these objects. z((^|;)\s*charset=)([^;]*)cCs6|jj|�}|dkr tjt|�Stj||�}||_|S)N)� CHARSET_RE�searchrrr)rr�matchrrrr rMsz!ContentMetaAttributeValue.__new__cs�fdd�}|jj||j�S)Ncs|jd��S)N�)�group)r$)rrr �rewriteXsz1ContentMetaAttributeValue.encode..rewrite)r"�subr)rrr'r)rr r Wsz ContentMetaAttributeValue.encodeN) rrrr�re�compile�Mr"rr rrrr r!Bs r!c@sVeZdZdZeddg�Zedg�Zeddg�Zedd��Z edd ��Z ed d��ZdS) �HTMLAwareEntitySubstitutiona%Entity substitution rules that are aware of some HTML quirks. Specifically, the contents of

foo

Hebrew (ISO 8859-8) in Visual Directionality

\nfoo

Hebrew (ISO 8859-8) in Visual Directionality

éé

foo\0bar

Räksmörgås

here it is

An H1

An H2

Another H2

Räksmörgås

here it is

An H1

An H2

Another H2

foo

Hebrew (ISO 8859-8) in Visual Directionality