summary | refs | log | tree | commit | diff | stats
path: root/g4f
diff options
context:
space:
mode:
author: H Lohaus <hlohaus@users.noreply.github.com> 2024-11-15 18:21:22 +0100
committer: GitHub <noreply@github.com> 2024-11-15 18:21:22 +0100
commit: d53db732485df4112b0eb2eb126d3fc189c58154 (patch)
tree: 1e503725093d116a9be7ef9a14f6695ba3125c38 /g4f
parent: Update internet.py (diff)
download: gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar
gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.gz
gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.bz2
gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.lz
gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.xz
gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.tar.zst
gpt4free-d53db732485df4112b0eb2eb126d3fc189c58154.zip
Diffstat (limited to 'g4f')
-rw-r--r-- g4f/gui/server/internet.py 2
1 file changed, 1 insertion, 1 deletion
diff --git a/g4f/gui/server/internet.py b/g4f/gui/server/internet.py
index a2d0165b..6426f608 100644
--- a/g4f/gui/server/internet.py
+++ b/g4f/gui/server/internet.py
@@ -67,7 +67,7 @@ def scrape_text(html: str, max_words: int = None) -> str:
if select:
select.extract()
clean_text = ""
- for paragraph in soup.select("p"):
+ for paragraph in soup.select("p, h1, h2, h3, h4, h5, h6"):
text = paragraph.get_text()
for line in text.splitlines():
words = []