feat: lite deep researcher implementation

This commit is contained in:
He Tao
2025-04-07 16:25:55 +08:00
commit 03798ded08
58 changed files with 4242 additions and 0 deletions

View File

@@ -0,0 +1,12 @@
from readabilipy import simple_json_from_html_string
from .article import Article
class ReadabilityExtractor:
    """Build ``Article`` objects from raw HTML via readabilipy."""

    def extract_article(self, html: str) -> Article:
        """Parse *html* and wrap the extracted title and content in an Article.

        Args:
            html: Raw HTML markup of the page to process.

        Returns:
            An ``Article`` populated from the ``"title"`` and ``"content"``
            entries of the readabilipy result. Each value is looked up with
            ``.get``, so a missing entry is forwarded as ``None``.
        """
        # use_readability=True is passed straight through to readabilipy;
        # see its documentation for the runtime requirements of that mode.
        parsed = simple_json_from_html_string(html, use_readability=True)

        title = parsed.get("title")
        html_content = parsed.get("content")
        return Article(title=title, html_content=html_content)