Kindly requesting your help on one problem related to running a Python script with envoking BeautifulSoup.
Basically, I had unzipped the bs4.zip file and put the respective folder into the same folder where my .py files are stored.
Enter -
http://www.dr-chuck.com/page2.htmTraceback (most recent call last):
File "C:\Books\py4e - Training\Exercises\
Exercise12.4.py", line 18, in <module>
soup = BeautifulSoup(html, 'html.parser')
File "C:\Books\py4e - Training\Exercises\bs4\__init__.py", line 215, in __init__
self._feed()
File "C:\Books\py4e - Training\Exercises\bs4\__init__.py", line 239, in _feed
self.builder.feed(self.markup)
File "C:\Books\py4e - Training\Exercises\bs4\builder\_htmlparser.py", line 164, in feed
parser.feed(markup)
File "C:\Users\Наталья\AppData\Local\Programs\Python\Python311\Lib\html\parser.py", line 110, in feed
self.goahead(0)
File "C:\Users\Наталья\AppData\Local\Programs\Python\Python311\Lib\html\parser.py", line 170, in goahead
k = self.parse_starttag(i)
File "C:\Users\Наталья\AppData\Local\Programs\Python\Python311\Lib\html\parser.py", line 337, in parse_starttag
self.handle_starttag(tag, attrs)
File "C:\Books\py4e - Training\Exercises\bs4\builder\_htmlparser.py", line 62, in handle_starttag
self.soup.handle_starttag(name, None, None, attr_dict)
File "C:\Books\py4e - Training\Exercises\bs4\__init__.py", line 404, in handle_starttag
self.currentTag, self._most_recent_element)
File "C:\Books\py4e - Training\Exercises\bs4\element.py", line 1001, in __getattr__
return self.find(tag)
File "C:\Books\py4e - Training\Exercises\bs4\element.py", line 1238, in find
l = self.find_all(name, attrs, recursive, text, 1, **kwargs)
File "C:\Books\py4e - Training\Exercises\bs4\element.py", line 1259, in find_all
return self._find_all(name, attrs, text, limit, generator, **kwargs)
File "C:\Books\py4e - Training\Exercises\bs4\element.py", line 516, in _find_all
strainer = SoupStrainer(name, attrs, text, **kwargs)
File "C:\Books\py4e - Training\Exercises\bs4\element.py", line 1560, in __init__
self.text = self._normalize_search_value(text)
File "C:\Books\py4e - Training\Exercises\bs4\element.py", line 1565, in _normalize_search_value
if (isinstance(value, str) or isinstance(value, collections.Callable) or hasattr(value, 'match')
AttributeError: module 'collections' has no attribute 'Callable'
import urllib.request, urllib.parse, urllib.error
from bs4 import BeautifulSoup
import ssl
# Ignore SSL certificate errors
ctx = ssl.create_default_context()
ctx.check_hostname = False
ctx.verify_mode = ssl.CERT_NONE
url = input('Enter - ')
if len(url)<1:
url = '
http://data.pr4e.org'
html = urllib.request.urlopen(url, context=ctx).read()
soup = BeautifulSoup(html, 'html.parser')
# Retrieve all of the anchor tags
tags = soup('a')
for tag in tags:
print(tag.get('href', None))
I have no idea what might have gone wrong.
Highly appreciate if you could help me on this.