Spaces:

JiaxinGe
/

AutoPresent

Running

App Files Files Community

AutoPresent / SlidesLib /search.py

para-lost

fix bug

3fe784f about 2 months ago

raw

history blame contribute delete

5.75 kB

	from selenium import webdriver
	from selenium.webdriver.chrome.service import Service
	from selenium.webdriver.chrome.options import Options
	from chromedriver_py import binary_path
	from selenium.webdriver.common.by import By
	from selenium.webdriver.support.ui import WebDriverWait
	import time
	import requests
	from bing_image_downloader import downloader
	import os
	import shutil
	class GoogleSearch:
	@classmethod
	def _init_driver(cls):
	chrome_options = Options()
	chrome_options.add_argument("--headless")
	chrome_options.add_argument("--disable-gpu")
	chrome_options.add_argument("--no-sandbox")
	chrome_options.add_argument("--disable-dev-shm-usage")
	service = Service(binary_path)
	driver = webdriver.Chrome(service=service, options=chrome_options)
	wait = WebDriverWait(driver, 100)
	return driver, wait

	@classmethod
	def search_result(cls, question: str, screenshot_path: str = "screenshot.png") -> str:
	"""Search a question on Google and return a screenshot of the search result."""
	driver, wait = cls._init_driver()

	if not question:
	raise ValueError("Please provide a question")

	# Perform Google search
	search_url = f"https://www.google.com/search?q={question}"
	driver.get(search_url)

	# Give some time for the page to load
	time.sleep(3)

	# Take a screenshot
	driver.save_screenshot(screenshot_path)

	driver.quit()
	return screenshot_path

	@classmethod
	def search_image_org(cls, query: str, download_path: str = 'top_image.png') -> str:
	"""Search for an image on Google and download the top result."""
	driver, wait = cls._init_driver()

	if not query:
	raise ValueError("Please provide a query")

	# Perform Google image search
	search_url = f"https://www.google.com/search?tbm=isch&q={query}"
	driver.get(search_url)

	# Find all image elements
	image_elements = driver.find_elements(By.CSS_SELECTOR, "img")

	# Filter out Google icon images and get the first valid image URL
	image_url = None
	for img in image_elements:
	src = img.get_attribute("src")
	if src and "googlelogo" not in src:
	image_url = src
	try:
	response = requests.get(image_url)
	with open(download_path, 'wb') as file:
	file.write(response.content)

	driver.quit()
	print(image_url)
	return download_path
	except Exception:
	print("Error downloading image, skipping.")
	continue

	driver.quit()
	raise Exception("No valid image found")

	@classmethod
	def search_image_prev(cls, query, output_dir='./downloads', limit=10):
	# Download images using Bing Image Downloader
	downloader.download(query, limit=limit, output_dir=output_dir, adult_filter_off=True, force_replace=False, timeout=60)
	# List the files in the output directory
	image_dir = os.path.join(output_dir, query)
	if not os.path.exists(image_dir):
	raise FileNotFoundError(f"No images found for query '{query}' in directory '{output_dir}'")

	# Collect all image paths
	image_paths = [os.path.join(image_dir, file) for file in os.listdir(image_dir) if file.endswith(('jpg', 'jpeg', 'png'))]

	# Return the first image
	return image_paths[0]

	@classmethod
	def search_image_prev(cls, query, output_dir='./downloads', limit=10):
	# Download images using Bing Image Downloader
	downloader.download(query, limit=limit, output_dir=output_dir, adult_filter_off=True, force_replace=False, timeout=60)
	# List the files in the output directory
	image_dir = os.path.join(output_dir, query)
	if not os.path.exists(image_dir):
	raise FileNotFoundError(f"No images found for query '{query}' in directory '{output_dir}'")

	# Collect all image paths
	image_paths = [os.path.join(image_dir, file) for file in os.listdir(image_dir) if file.endswith(('jpg', 'jpeg', 'png'))]

	# Return the first image
	return image_paths[0]

	@classmethod
	def search_image(cls, query, save_path):
	"""
	Search for an image based on the query and save the result to the specified path.

	Args:
	query (str): The query to search for.
	save_path (str): The path to save the downloaded image.

	Returns:
	str: The path where the image was saved.
	"""
	# Create a temporary directory for storing downloaded images
	temp_dir = "./temp_download"
	os.makedirs(temp_dir, exist_ok=True)

	# Download only the top image result
	downloader.download(query, limit=1, output_dir=temp_dir, adult_filter_off=True, force_replace=True, timeout=60)

	# Construct the expected directory and image path
	image_dir = os.path.join(temp_dir, query)
	image_files = [file for file in os.listdir(image_dir) if file.endswith(('jpg', 'jpeg', 'png'))]

	# Check if any image files were downloaded
	if not image_files:
	raise FileNotFoundError(f"No images found for query '{query}'.")

	# Copy the top image to the desired save path
	top_image_path = os.path.join(image_dir, image_files[0])
	shutil.move(top_image_path, save_path)

	# Clean up temporary directory
	shutil.rmtree(temp_dir)

	return save_path