Arafath10 committed on
Commit
599b9d7
·
verified ·
1 Parent(s): a7db7e5

Update scraper.py

Browse files
Files changed (1) hide show
  1. scraper.py +1 -1
scraper.py CHANGED
@@ -25,7 +25,7 @@ class Scraper:
25
 
26
  # Get page content (paragraphs, headers)
27
  page_content = await page.evaluate("""() => {
28
- let elements = Array.from(document.querySelectorAll('p, h1, h2, h3, h4, h5, h6'));
29
  return elements.map(element => element.innerText).join('\\n');
30
  }""")
31
 
 
25
 
26
  # Get page content (paragraphs, headers)
27
  page_content = await page.evaluate("""() => {
28
+ let elements = Array.from(document.querySelectorAll('body *'));
29
  return elements.map(element => element.innerText).join('\\n');
30
  }""")
31