diff options
author | H Lohaus <hlohaus@users.noreply.github.com> | 2024-11-15 18:21:22 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-11-15 18:21:22 +0100 |
commit | d53db732485df4112b0eb2eb126d3fc189c58154 (patch) | |
tree | 1e503725093d116a9be7ef9a14f6695ba3125c38 /g4f/gui/server/internet.py | |
parent | Update internet.py (diff) | |
download | gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.gz gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.bz2 gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.lz gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.xz gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.zst gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.zip |
Diffstat (limited to '')
-rw-r--r-- | g4f/gui/server/internet.py | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/g4f/gui/server/internet.py b/g4f/gui/server/internet.py
index a2d0165b..6426f608 100644
--- a/g4f/gui/server/internet.py
+++ b/g4f/gui/server/internet.py
@@ -67,7 +67,7 @@ def scrape_text(html: str, max_words: int = None) -> str:
         if select:
             select.extract()
     clean_text = ""
-    for paragraph in soup.select("p"):
+    for paragraph in soup.select("p, h1, h2, h3, h4, h5, h6"):
         text = paragraph.get_text()
         for line in text.splitlines():
             words = []
```