Spaces:

Zaherrr
/

OOP_KG_Transform_POC

Sleeping

OOP_KG_Transform_POC / models /gemini_image_to_json.py

Rename gemini_image_to_json.py to models/gemini_image_to_json.py

1d31c90 verified 3 months ago

1.49 kB

	import google.generativeai as genai

	from dotenv import load_dotenv
	import os

	load_dotenv()
	GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")

	genai.configure(api_key=GOOGLE_API_KEY)

	# gemini-1.5-pro only gives 50 requests per day. check https://ai.google.dev/pricing for more details
	# model = genai.GenerativeModel('gemini-1.5-pro',
	model = genai.GenerativeModel(
	"gemini-1.5-flash",
	# Set the `response_mime_type` to output JSON
	# Pass the schema object to the `response_schema` field
	generation_config={
	"response_mime_type": "application/json",
	"temperature": 0.0,
	},
	)
	# "response_schema": Recipe, 'max_output_tokens':4000})

	PROMPT = """
	You are responsible for extracting the entities (nodes) and relationships (edges) from the images of mind maps. The mind maps are for Object Oriented Programming.
	Don't make up facts, just extracts them. Do not create new entity types that aren't mentioned in the image, and at the same time don't miss anything.
	Give the output in JSON format with this schema:
	{
	"nodes": [{"id": "1", "label": string},{"id": "2", "label": string}],"edges": [{"source": SOURCE_ID, "target": TARGET_ID, "type": "->"},{"source": SOURCE_ID, "target": TARGET_ID, "type": "->"}]
	}

	Now extract the entities and relationships from this image:
	"""


	def fetch_gemini_response(mind_map_image):

	print("fetching gemini response")
	response = model.generate_content([PROMPT, mind_map_image], stream=False)

	return response.text