Feb-25-2019, 11:54 PM
# The following will return a list of 2-grams found in the Wikipedia article
# on the Python programming language.
#
# NOTE: do not keep a file named email.py (or any other name that matches a
# standard-library module) next to this script. Python searches the script's
# own directory first, so such a file shadows the stdlib package and makes
# `import requests` fail with "'email' is not a package".

ARTICLE_URL = "https://en.wikipedia.org/wiki/Python_(programming_language)"


def getNgrams(input, n):
    """Return every run of ``n`` consecutive words found in ``input``.

    The text is split on single space characters only, so consecutive
    spaces produce empty-string tokens and newlines are not treated as
    separators.

    Args:
        input: The text to break into n-grams. (The name shadows the
            builtin ``input``; it is kept so keyword callers still work.)
        n: Number of words per n-gram.

    Returns:
        A list of n-grams in order of appearance, each one a list of ``n``
        tokens. The list is empty when the text has fewer than ``n`` tokens.
    """
    # The separator must be a non-empty string: str.split('') raises
    # "ValueError: empty separator".
    words = input.split(' ')
    return [words[i:i + n] for i in range(len(words) - n + 1)]


def main():
    """Download the article, extract its 2-grams and print them with a count."""
    # Third-party imports are local so that getNgrams can be imported and
    # tested without requests / BeautifulSoup installed and without any
    # network access at import time.
    import requests
    from bs4 import BeautifulSoup

    html = requests.get(ARTICLE_URL)
    bsObj = BeautifulSoup(html.content, 'html.parser')
    content = bsObj.find("div", {"id": "mw-content-text"}).get_text()
    ngrams = getNgrams(content, 2)
    print(ngrams)
    print("2-grams count is: "+str(len(ngrams)))


if __name__ == "__main__":
    main()
Error: Traceback (most recent call last):
File "C:\Python36\kodovi\ngram.py", line 3, in <module>
import requests
File "C:\Python36\lib\site-packages\requests\__init__.py", line 43, in <module>
import urllib3
File "C:\Python36\lib\site-packages\urllib3\__init__.py", line 8, in <module>
from .connectionpool import (
File "C:\Python36\lib\site-packages\urllib3\connectionpool.py", line 11, in <module>
from .exceptions import (
File "C:\Python36\lib\site-packages\urllib3\exceptions.py", line 2, in <module>
from .packages.six.moves.http_client import (
File "C:\Python36\lib\site-packages\urllib3\packages\six.py", line 203, in load_module
mod = mod._resolve()
File "C:\Python36\lib\site-packages\urllib3\packages\six.py", line 115, in _resolve
return _import_module(self.mod)
File "C:\Python36\lib\site-packages\urllib3\packages\six.py", line 82, in _import_module
__import__(name)
File "C:\Python36\lib\http\client.py", line 71, in <module>
import email.parser
File "C:\Python36\kodovi\email.py", line 3, in <module>
import smtplib
File "C:\Python36\lib\smtplib.py", line 47, in <module>
import email.utils
ModuleNotFoundError: No module named 'email.utils'; 'email' is not a package
Any idea why these errors appear?