mrmp/hypertext.py
Marc Beninca c79ec30078 links
2023-01-28 21:19:16 +01:00

22 lines
491 B
Python

import html.parser
import requests
CHARSET = 'u8'
class Parser(html.parser.HTMLParser):
def __init__(self):
self.links = []
super().__init__()
def handle_starttag(self, tag, attributes):
if tag == 'a':
self.links.extend(
[v for k, v in attributes if k == 'href'])
def get_links(location):
hypertext = requests.get(location).content.decode(CHARSET)
parser = Parser()
parser.feed(hypertext)
return parser.links