Spaces:

codelion
/

LLMFeed

Runtime error

App Files Files Community

LLMFeed / app.py

codelion

Update app.py

4f86d21 verified 3 months ago

raw

history blame

14.3 kB

	import gradio as gr
	from google import genai
	from google.genai import types
	from PIL import Image
	from io import BytesIO
	import base64
	import os
	import json
	import random

	# Build the shared Google Generative AI client. The API key is read from the
	# GEMINI_API_KEY environment variable; start-up is aborted with a clear
	# message when the variable is not defined.
	api_key = os.environ.get('GEMINI_API_KEY')
	if api_key is None:
	    raise ValueError("Please set the GEMINI_API_KEY environment variable.")
	client = genai.Client(api_key=api_key)

	def generate_ideas(tag):
	    """
	    Generate a diverse set of ideas related to the tag using the LLM.

	    The model is asked for a JSON object of the form {"ideas": [...]}.
	    If the reply is missing, is not valid JSON, has a different shape, or
	    contains no usable ideas, a fixed list of five template ideas built
	    from the tag is returned instead, so the result is never empty.

	    Args:
	        tag (str): The tag to base the ideas on.

	    Returns:
	        list: A non-empty list of ideas as strings.
	    """
	    fallback_ideas = [
	        f"A vibrant {tag} scene at sunset",
	        f"A close-up of {tag} with neon lights",
	        f"A futuristic take on {tag} with holograms",
	        f"A cozy {tag} moment with warm lighting",
	        f"An action-packed {tag} scene with dynamic colors"
	    ]

	    prompt = f"""
	    Generate a list of 5 diverse and creative ideas related to {tag} that can be used for a TikTok video.
	    Each idea should be a short sentence describing a specific scene or concept.
	    Return the response as a JSON object with a single key 'ideas' containing a list of 5 ideas.
	    Example: {{"ideas": ["A neon-lit gaming setup with RGB lights flashing", "A futuristic robot assembling a gadget"]}}
	    """
	    response = client.models.generate_content(
	        model='gemini-2.5-flash-preview-04-17',
	        contents=[prompt],
	        config=types.GenerateContentConfig(temperature=1.2)
	    )

	    # The reply may carry no text at all; treat that as an empty string.
	    raw = (response.text or "").strip()
	    # Replies are often wrapped in a Markdown code fence or surrounded by
	    # prose, so only the outermost {...} span is handed to the JSON parser.
	    start, end = raw.find("{"), raw.rfind("}")
	    if start != -1 and end > start:
	        raw = raw[start:end + 1]

	    try:
	        ideas = json.loads(raw)['ideas']
	    except (json.JSONDecodeError, KeyError, TypeError):
	        # TypeError covers valid JSON that is not an object (list, string, ...).
	        return fallback_ideas

	    if not isinstance(ideas, list):
	        return fallback_ideas

	    # Keep only non-blank entries; callers pick one with random.choice,
	    # which fails on an empty list.
	    cleaned = [str(idea).strip() for idea in ideas if str(idea).strip()]
	    return cleaned or fallback_ideas

	def generate_item(tag, ideas):
	    """
	    Generate a single feed item using one of the ideas.

	    One idea is picked at random, the LLM turns it into a caption and an
	    image prompt, and the image model renders the prompt. When the LLM
	    reply cannot be parsed a template caption and prompt are used; when no
	    image data comes back a gray 360x640 placeholder is used.

	    Args:
	        tag (str): The tag to base the content on.
	        ideas (list): List of ideas to choose from.

	    Returns:
	        dict: A dictionary with 'text' (str, the caption), 'image_base64'
	        (str, the PNG-encoded image) and 'ideas' (the list passed in, kept
	        so later items can reuse it).
	    """
	    # Select a random idea for diversity. random.choice raises IndexError on
	    # an empty sequence, so fall back to the tag itself.
	    selected_idea = random.choice(ideas) if ideas else tag

	    # Second LLM call to generate the precise image prompt and caption
	    prompt = f"""
	    Based on the idea "{selected_idea}", create content for a TikTok video about {tag}.
	    Return a JSON object with two keys:
	    - 'caption': A short, viral TikTok-style caption with hashtags.
	    - 'image_prompt': A detailed image prompt for generating a high-quality visual scene.
	    The image prompt should describe the scene vividly, specify a perspective and style, and ensure no text or letters are included.
	    Example: {{"caption": "Neon vibes only! 🌌 #tech", "image_prompt": "A close-up view of a neon-lit gaming setup with RGB lights flashing, in a futuristic style, no text or letters"}}
	    """
	    response = client.models.generate_content(
	        model='gemini-2.5-flash-preview-04-17',
	        contents=[prompt],
	        config=types.GenerateContentConfig(temperature=1.2)
	    )

	    # The reply may carry no text, or wrap the JSON in a code fence or
	    # prose; parse only the outermost {...} span.
	    raw = (response.text or "").strip()
	    start, end = raw.find("{"), raw.rfind("}")
	    if start != -1 and end > start:
	        raw = raw[start:end + 1]

	    try:
	        response_json = json.loads(raw)
	        text = str(response_json['caption'])
	        image_prompt = str(response_json['image_prompt'])
	    except (json.JSONDecodeError, KeyError, TypeError):
	        # Fallback if parsing fails. Whitespace is removed from the tag so
	        # that a multi-word tag still forms a single hashtag.
	        hashtag = "".join(str(tag).split())
	        text = f"Obsessed with {tag}! 🔥 #{hashtag}"
	        image_prompt = f"A vivid scene of {selected_idea}, in a vibrant pop art style, no text or letters"

	    # Generate the image using the precise prompt
	    image_response = client.models.generate_images(
	        model='imagen-3.0-generate-002',
	        prompt=image_prompt,
	        config=types.GenerateImagesConfig(
	            number_of_images=1,
	            aspect_ratio="9:16",
	            person_generation="DONT_ALLOW"
	        )
	    )

	    # An entry can be present without image data, so check the bytes
	    # themselves rather than only the length of the list.
	    image_bytes = None
	    if image_response.generated_images:
	        first_image = image_response.generated_images[0].image
	        image_bytes = getattr(first_image, 'image_bytes', None)

	    if image_bytes:
	        image = Image.open(BytesIO(image_bytes))
	    else:
	        # Fallback to a placeholder image
	        image = Image.new('RGB', (360, 640), color='gray')

	    # Convert the image to base64
	    buffered = BytesIO()
	    image.save(buffered, format="PNG")
	    img_str = base64.b64encode(buffered.getvalue()).decode()

	    return {'text': text, 'image_base64': img_str, 'ideas': ideas}

	def start_feed(tag, current_index, feed_items, is_loading):
	    """
	    Start or update the feed based on the tag.

	    This is a generator. It first yields a loading state showing the empty
	    placeholder, then yields the final state with a freshly generated
	    first item. Both results are yielded because a generator's `return`
	    value is carried on StopIteration and is not seen by a consumer that
	    simply iterates over the generator.

	    Args:
	        tag (str): The tag to generate content for. A missing or blank tag
	            is replaced by "trending".
	        current_index (int): The current item index.
	        feed_items (list): The current list of feed items.
	        is_loading (bool): Whether the feed is currently loading.

	    Yields:
	        tuple: (current_tag, current_index, feed_items, html_content, is_loading)
	    """
	    if not tag or not tag.strip():
	        tag = "trending"

	    # Set loading state to True
	    is_loading = True
	    yield tag, current_index, feed_items, generate_html([], False, 0), is_loading

	    # Generate new ideas for the tag
	    ideas = generate_ideas(tag)
	    # Generate the first item
	    item = generate_item(tag, ideas)
	    feed_items = [item]  # Reset feed with the new item
	    current_index = 0

	    # Set loading state to False
	    is_loading = False
	    yield tag, current_index, feed_items, generate_html(feed_items, False, current_index), is_loading

	def load_next(tag, current_index, feed_items, is_loading):
	    """
	    Load the next item in the feed.

	    This is a generator. It first yields a loading state that keeps the
	    current item on screen, then yields the final state. Both results are
	    yielded because a generator's `return` value is carried on
	    StopIteration and is not seen by a consumer that simply iterates over
	    the generator.

	    Args:
	        tag (str): The tag to generate content for.
	        current_index (int): The current item index.
	        feed_items (list): The current list of feed items. A newly
	            generated item is appended to this list.
	        is_loading (bool): Whether the feed is currently loading.

	    Yields:
	        tuple: (current_tag, current_index, feed_items, html_content, is_loading)
	    """
	    # Set loading state to True
	    is_loading = True
	    yield tag, current_index, feed_items, generate_html(feed_items, False, current_index), is_loading

	    # If there's a next item, show it; otherwise, generate a new one
	    if current_index + 1 < len(feed_items):
	        current_index += 1
	    else:
	        # Reuse the ideas stored on the last item; generate fresh ones when
	        # the feed is empty or the stored list is missing or empty.
	        ideas = feed_items[-1].get('ideas') if feed_items else None
	        if not ideas:
	            ideas = generate_ideas(tag)
	        new_item = generate_item(tag, ideas)
	        feed_items.append(new_item)
	        current_index = len(feed_items) - 1

	    # Set loading state to False
	    is_loading = False
	    yield tag, current_index, feed_items, generate_html(feed_items, False, current_index), is_loading

	def load_previous(tag, current_index, feed_items, is_loading):
	    """
	    Step back to the previous feed item, staying put on the first one.

	    Nothing is generated here: the index moves back by one when it is
	    greater than zero, and the HTML for the resulting index is rendered.

	    Args:
	        tag (str): The tag the feed was generated for (passed through).
	        current_index (int): The current item index.
	        feed_items (list): The current list of feed items (passed through).
	        is_loading (bool): The current loading flag (passed through).

	    Returns:
	        tuple: (current_tag, current_index, feed_items, html_content, is_loading)
	    """
	    target_index = current_index - 1 if current_index > 0 else current_index
	    rendered = generate_html(feed_items, False, target_index)
	    return tag, target_index, feed_items, rendered, is_loading

	def generate_html(feed_items, scroll_to_latest=False, current_index=0):
	    """
	    Generate an HTML string to display the current feed item with click navigation.

	    The caption is HTML-escaped before insertion because it is produced by
	    a language model and must not be interpreted as markup. Click handling
	    is written inline in the `onclick` attribute rather than in a separate
	    script element, since markup inserted into a page as HTML content does
	    not get its script elements executed. The handler clicks the page
	    element with id 'previous-button' (right 25% of the item) or
	    'next-button' (anywhere else); this markup deliberately defines no
	    elements with those ids so it cannot shadow the real buttons.

	    Args:
	        feed_items (list): List of dictionaries containing 'text' and 'image_base64'.
	        scroll_to_latest (bool): Whether to auto-scroll to the latest item (not used here).
	        current_index (int): The index of the item to display.

	    Returns:
	        str: HTML string representing the feed, or a placeholder panel when
	        there is no item at current_index.
	    """
	    # Imported locally so this function does not depend on a module-level import.
	    import html

	    if not feed_items or current_index >= len(feed_items):
	        return """
	        <div style="
	            display: flex;
	            flex-direction: column;
	            align-items: center;
	            justify-content: center;
	            max-width: 360px;
	            margin: 0 auto;
	            background-color: #000;
	            height: 640px;
	            border: 1px solid #333;
	            border-radius: 10px;
	            color: white;
	            font-family: Arial, sans-serif;
	        ">
	            <p>Select a tag to start your feed!</p>
	        </div>
	        """

	    item = feed_items[current_index]
	    safe_text = html.escape(str(item['text']))

	    # Clicking the right 25% of the item goes to the previous item,
	    # clicking anywhere else goes to the next one.
	    html_str = """
	    <div id="feed-container" style="
	        display: flex;
	        flex-direction: column;
	        align-items: center;
	        max-width: 360px;
	        margin: 0 auto;
	        background-color: #000;
	        height: 640px;
	        border: 1px solid #333;
	        border-radius: 10px;
	        position: relative;
	    ">
	        <div class="feed-item" style="
	            width: 100%;
	            height: 100%;
	            position: relative;
	            display: flex;
	            flex-direction: column;
	            justify-content: flex-end;
	            overflow: hidden;
	            cursor: pointer;
	        " onclick="var box = this.getBoundingClientRect(); var target = document.getElementById((event.clientX - box.left) > box.width * 0.75 ? 'previous-button' : 'next-button'); if (target) target.click();">
	            <img id="feed-image" src="data:image/png;base64,{image_base64}" style="
	                width: 100%;
	                height: 100%;
	                object-fit: cover;
	                position: absolute;
	                top: 0;
	                left: 0;
	                z-index: 1;
	            ">
	            <div style="
	                position: relative;
	                z-index: 2;
	                background: linear-gradient(to top, rgba(0,0,0,0.7), transparent);
	                padding: 20px;
	                color: white;
	                font-family: Arial, sans-serif;
	                font-size: 18px;
	                font-weight: bold;
	                text-shadow: 1px 1px 2px rgba(0,0,0,0.5);
	            ">
	                {text}
	            </div>
	        </div>
	    </div>
	    """.format(image_base64=item['image_base64'], text=safe_text)

	    return html_str

	# Define the Gradio interface
	with gr.Blocks(
	    css="""
	    body { background-color: #000; color: #fff; font-family: Arial, sans-serif; }
	    .gradio-container { max-width: 400px; margin: 0 auto; padding: 10px; }
	    input, select { border-radius: 5px; background-color: #222; color: #fff; border: 1px solid #444; }
	    .gr-form { background-color: #111; padding: 15px; border-radius: 10px; }
	    .gr-progress { background-color: #ff2d55; }
	    #next-button, #previous-button { display: none !important; }
	    """,
	    title="TikTok-Style Infinite Feed"
	) as demo:
	    # State variables
	    current_tag = gr.State(value="")
	    current_index = gr.State(value=0)
	    feed_items = gr.State(value=[])
	    is_loading = gr.State(value=False)

	    # Input section
	    with gr.Column(elem_classes="gr-form"):
	        gr.Markdown("### Create Your TikTok Feed")
	        with gr.Row():
	            suggested_tags = gr.Dropdown(
	                choices=["food", "travel", "fashion", "tech"],
	                label="Pick a Tag",
	                value="food"
	            )
	            tag_input = gr.Textbox(
	                label="Or Enter a Custom Tag",
	                value="food",
	                placeholder="e.g., sushi, adventure",
	                submit_btn=False  # Disable default submit button
	            )

	    # Progress bar
	    progress_bar = gr.Slider(
	        minimum=0,
	        maximum=1,
	        value=0,
	        label="Loading Feed...",
	        visible=False
	    )

	    # Output display
	    feed_html = gr.HTML()

	    # Event handlers
	    def set_tag(selected_tag):
	        """Copy the tag picked in the dropdown into the custom tag textbox."""
	        return selected_tag

	    def update_progress(is_loading):
	        """Show or hide the progress bar based on loading state."""
	        return gr.update(visible=is_loading, value=0 if is_loading else 1)

	    # Component lists shared by the event handlers below.
	    start_inputs = [tag_input, current_index, feed_items, is_loading]
	    nav_inputs = [current_tag, current_index, feed_items, is_loading]
	    feed_outputs = [current_tag, current_index, feed_items, feed_html, is_loading]

	    # Handle dropdown selection: copy the tag, start the feed, then sync the
	    # progress bar with the is_loading state left by the previous step.
	    suggested_tags.change(
	        fn=set_tag,
	        inputs=suggested_tags,
	        outputs=tag_input
	    ).then(
	        fn=start_feed,
	        inputs=start_inputs,
	        outputs=feed_outputs
	    ).then(
	        fn=update_progress,
	        inputs=is_loading,
	        outputs=progress_bar
	    )

	    # Handle Enter keypress in the custom tag input
	    tag_input.submit(
	        fn=start_feed,
	        inputs=start_inputs,
	        outputs=feed_outputs
	    ).then(
	        fn=update_progress,
	        inputs=is_loading,
	        outputs=progress_bar
	    )

	    # Navigation buttons. The feed HTML triggers them from JavaScript via
	    # document.getElementById(...).click(), so they must exist in the page.
	    # They are therefore created as regular components and hidden with the
	    # CSS rule above instead of visible=False.
	    # NOTE(review): visible=False appears to leave the component out of the
	    # DOM in recent Gradio releases - confirm against the pinned version.
	    next_button = gr.Button("Next", elem_id="next-button")
	    previous_button = gr.Button("Previous", elem_id="previous-button")

	    # Handle click to go to next item
	    next_button.click(
	        fn=load_next,
	        inputs=nav_inputs,
	        outputs=feed_outputs
	    ).then(
	        fn=update_progress,
	        inputs=is_loading,
	        outputs=progress_bar
	    )

	    # Handle click to go to previous item
	    previous_button.click(
	        fn=load_previous,
	        inputs=nav_inputs,
	        outputs=feed_outputs
	    )

	# Launch the app with a public link
	demo.launch(share=True)