"""Download a web page and print it after conversion by ``html2text``.

The script fetches ``url``, decodes the response body to ``str`` and prints
whatever ``html2text.html2text()`` returns for it.

NOTE(review): the originating diff adds this script as ``py/html2text.py``.
When it is run directly, the script's own directory is placed first on
``sys.path``, so ``import html2text`` will presumably resolve to this file
instead of the installed package.  Consider renaming the file (for example
``fetch_as_text.py``) -- confirm against how the script is launched.
"""
from urllib import request

import html2text

# Seconds to wait on the network before giving up; without a timeout
# ``urlopen`` can block forever on an unresponsive server.
TIMEOUT_SECONDS = 30

# Used only when the server does not declare a charset in Content-Type.
FALLBACK_CHARSET = 'utf8'

url = 'https://duckduckgo.com'

# The context manager closes the HTTP response (and its socket) even if
# reading or decoding raises.
with request.urlopen(url, timeout=TIMEOUT_SECONDS) as response:
    # Honour the charset announced by the server rather than assuming UTF-8.
    charset = response.headers.get_content_charset() or FALLBACK_CHARSET
    text = response.read().decode(charset)

print(html2text.html2text(text))