Spaces:

kijeoung
/

blogcatch250113test

Sleeping

kijeoung committed on Jan 13

Commit

87047c3

verified ·

1 Parent(s): cf95b41

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+from flask import Flask, request, jsonify
+from bs4 import BeautifulSoup
+import requests
+app = Flask(__name__)  # application object; the /scrape route below is registered on it
+def scrape_naver_blog(url):
+    try:
+        # Send a GET request to the URL
+        response = requests.get(url)
+        response.raise_for_status()
+        # Parse the HTML content
+        soup = BeautifulSoup(response.text, 'html.parser')
+        # Extract title using the provided XPath-like logic
+        title_element = soup.select_one('div.se-module.se-module-text span.se-fs- se-ff-')
+        title = title_element.get_text(strip=True) if title_element else "Title not found"
+        # Extract content using the provided XPath-like logic
+        content_element = soup.select_one('div.se-main-container')
+        content = content_element.get_text(strip=True) if content_element else "Content not found"
+        return {"title": title, "content": content}
+    except Exception as e:
+        return {"error": str(e)}
+@app.route('/scrape', methods=['POST'])
+def scrape():
+    data = request.json
+    url = data.get('url')
+    if not url:
+        return jsonify({"error": "URL is required"}), 400
+    result = scrape_naver_blog(url)
+    return jsonify(result)
+if __name__ == '__main__':
+    app.run(debug=True)