Spaces:

bedead
/

Multimodal_LLM_for_generating_testcases

Runtime error

App Files Files Community

Multimodal_LLM_for_generating_testcases / llm.py

bedead

Upload 3 files

20279d8 verified 2 months ago

raw

history blame contribute delete

2.73 kB

	import torch
	from transformers import AutoModelForCausalLM, AutoTokenizer
	from PIL import Image
	import gradio as gr
	import time

	model = AutoModelForCausalLM.from_pretrained(
	"MILVLG/imp-v1-3b",
	torch_dtype=torch.float16,
	device_map="auto",
	trust_remote_code=True,
	)

	tokenizer = AutoTokenizer.from_pretrained("MILVLG/imp-v1-3b", trust_remote_code=True)


	def response(USER_DATA, TOKEN) -> str:
	print(USER_DATA)
	MESSAGE = USER_DATA["text"]
	NUM_FILES = len(USER_DATA["files"])
	FILES = USER_DATA["files"]

	SYSTEM_PROMPT = f"""
	A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed testcase related to image uploaded. You are tasked with generating detailed, step-by-step test cases for software functionality based on uploaded images. The user will provide one or more images of a software or website interface. For each image, generate a separate set of test cases following the format below:

	'''Description: Provide a brief explanation of the functionality being tested, as inferred from the image.
	Pre-conditions: Identify any setup requirements, dependencies, or conditions that must be met before testing can begin (e.g., user logged in, specific data pre-populated, etc.).
	Testing Steps: Outline a clear, numbered sequence of actions that a user would take to test the functionality in the image.
	Expected Result: Specify the expected outcome if the functionality is working as intended.'''

	Ensure that:
	Testcases should be related to validation of data, component interactions, navigation, etc.
	Each testcase should have it's own Description, Pre-conidtions, Testing Steps, Expected Result.

	USER: <image>\n{MESSAGE}
	ASSISTANT:
	"""

	RES = generate_answer(FILES, SYSTEM_PROMPT)

	response = f"{RES}."
	return response
	for i in range(len(response)):
	time.sleep(0.025)
	yield response[: i + 1]


	def generate_answer(IMAGES: list, SYSTEM_PROMPT) -> str:
	print(len(IMAGES))

	INPUT_IDS = tokenizer(SYSTEM_PROMPT, return_tensors="pt").input_ids

	RESULT = ""
	for EACH_IMG in IMAGES:
	image_path = EACH_IMG["path"]
	image = Image.open(image_path)
	image_tensor = model.image_preprocess(image)

	output_ids = model.generate(
	inputs=INPUT_IDS,
	max_new_tokens=500,
	images=image_tensor,
	use_cache=False,
	)[0]
	CUR_RESULT = tokenizer.decode(
	output_ids[INPUT_IDS.shape[1] :], skip_special_tokens=True
	).strip()

	RESULT = f"{RESULT} /n/n {CUR_RESULT}"

	return RESULT