# Install the dependency first (shell command, run outside Python):
#   pip install readability-lxml
from readability import Document
import requests
# Download the page. requests has no default timeout, so set one explicitly to
# avoid hanging forever on an unresponsive server.
url = "https://example.com/article.html"
response = requests.get(url, timeout=10)
# Fail loudly on 4xx/5xx responses instead of feeding an error page to the
# article extractor.
response.raise_for_status()
html = response.text

# Parse the HTML and pull out the article metadata and main body.
doc = Document(html)
title = doc.title()
# readability-lxml's Document has no byline() method (that name comes from
# Mozilla's Readability.js); author() is the accessor this library provides.
author = doc.author()
# summary() returns the extracted main-article HTML. Document.content() would
# return the entire document body, i.e. no article extraction at all.
content = doc.summary()