import streamlit as st
from transformers import AutoTokenizer, AutoModelForCausalLM
import torch
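# Note: a Space running this script is assumed to list streamlit, transformers,
# and torch in its requirements.txt (standard Spaces setup, not shown here).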
# Cache the model loading to avoid reloading it on every interaction
# (without this decorator, Streamlit would reload the model on every rerun)
@st.cache_resource
def load_model():
    model_name = "s0uL141/Cyber_gemma2_2B_it"  # Replace with your Hugging Face repo or local path
    tokenizer = AutoTokenizer.from_pretrained(model_name)
    model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16)
    return tokenizer, model
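# A minimal alternative load, assuming a GPU is available and the `accelerate`
# package is installed (neither is guaranteed by the original app): passing
# device_map="auto" lets transformers place the fp16 weights on the accelerator.
#
#     model = AutoModelForCausalLM.from_pretrained(
#         model_name, torch_dtype=torch.float16, device_map="auto"
#     )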
# Load the model and tokenizer
tokenizer, model = load_model()
# Function to generate text based on the user prompt
def generate_response(prompt, max_new_tokens=50):
    # Tokenize input prompt
    inputs = tokenizer(prompt, return_tensors="pt")
    # Generate response; unpacking `inputs` also passes the attention mask, and
    # max_new_tokens caps only the generated tokens, so long prompts are not
    # cut off by the overall length budget (as max_length would)
    output = model.generate(**inputs, max_new_tokens=max_new_tokens, num_return_sequences=1)
    # Decode the response and return (includes the prompt tokens)
    return tokenizer.decode(output[0], skip_special_tokens=True)
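# Greedy decoding (the default above) can be repetitive; a hedged sketch of a
# sampled call instead, using standard `generate` kwargs (the values here are
# illustrative, not taken from the original app):
#
#     output = model.generate(
#         **inputs, max_new_tokens=max_new_tokens,
#         do_sample=True, temperature=0.7, top_p=0.9,
#     )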
# Streamlit App
def main():
    # Set up the title and description for the app
    st.title("Fine-Tuned Cyber Gemma 2b-it Model")
    st.write("This app generates responses based on your input using a fine-tuned version of the Gemma 2b-it model.")
    # Text input area for the user to provide a prompt
    user_input = st.text_area("Enter your prompt here:", height=200)
    # Button to trigger text generation
    if st.button("Generate Response"):
        # Check if user input is provided
        if user_input.strip() == "":
            st.write("Please enter a valid prompt.")
        else:
            with st.spinner("Generating response..."):
                # Generate response using the model
                response = generate_response(user_input)
            # Display the generated response
            st.write("### Model Response:")
            st.write(response)
# Entry point to run the app
if __name__ == "__main__":
    main()
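# To run locally, assuming the file is saved as app.py (on a Hugging Face
# Space the platform launches the script automatically):
#
#     streamlit run app.py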