import streamlit as st import base64 from datetime import datetime import plotly.graph_objects as go import cv2 import os import pytz import random import re import requests from moviepy.editor import VideoFileClip from PIL import Image import glob from audio_recorder_streamlit import audio_recorder import json from openai import OpenAI from dotenv import load_dotenv from huggingface_hub import InferenceClient from bs4 import BeautifulSoup import textract from xml.etree import ElementTree as ET from urllib.parse import quote import time from collections import deque # Page config st.set_page_config( page_title="Bike Cinematic Universe 🎬", page_icon="🚲", layout="wide" ) # Custom CSS with expanded styling st.markdown(""" """, unsafe_allow_html=True) # Load environment variables load_dotenv() # Initialize OpenAI client client = OpenAI( api_key=os.getenv('OPENAI_API_KEY'), organization=os.getenv('OPENAI_ORG_ID') ) # Initialize session state if "openai_model" not in st.session_state: st.session_state["openai_model"] = "gpt-4o-2024-05-13" if "messages" not in st.session_state: st.session_state.messages = [] # Hugging Face settings API_URL = os.getenv('API_URL') HF_KEY = os.getenv('HF_KEY') headers = { "Authorization": f"Bearer {HF_KEY}", "Content-Type": "application/json" } # Bike Collections bike_collections = { "Celestial Collection 🌌": { "Eclipse Vaulter": { "prompt": """Cinematic shot of a sleek black mountain bike silhouetted against a total solar eclipse. The corona creates an ethereal halo effect, with lens flares accentuating key points of the frame. Dynamic composition shows the bike mid-leap, with stardust particles trailing behind. Camera angle: Low angle, wide shot Lighting: Dramatic rim lighting from eclipse Color palette: Deep purples, cosmic blues, corona gold""", "emoji": "🌑" }, "Starlight Leaper": { "prompt": """A black bike performing an epic leap under a vast Milky Way galaxy. Shimmering stars blanket the sky while the bike's wheels leave a trail of stardust. Camera angle: Wide-angle upward shot Lighting: Natural starlight with subtle rim lighting Color palette: Deep blues, silver highlights, cosmic purples""", "emoji": "✨" } }, "Nature-Inspired Collection 🌲": { "Shadow Grasshopper": { "prompt": """A black bike jumping between forest paths. Dappled sunlight streams through the canopy, creating dynamic shadows. Camera angle: Through-the-trees tracking shot Lighting: Natural forest lighting with sun rays Color palette: Forest greens, golden sunlight, deep shadows""", "emoji": "🦗" } } } # File handling functions def generate_filename(prompt, file_type): """Generate a safe filename using the prompt and file type.""" central = pytz.timezone('US/Central') safe_date_time = datetime.now(central).strftime("%m%d_%H%M") replaced_prompt = re.sub(r'[<>:"/\\|?*\n]', ' ', prompt) safe_prompt = re.sub(r'\s+', ' ', replaced_prompt).strip()[:240] return f"{safe_date_time}_{safe_prompt}.{file_type}" def create_and_save_file(content, file_type="md", prompt=None, is_image=False, should_save=True): """Create and save file with proper handling of different types.""" if not should_save: return None filename = generate_filename(prompt if prompt else content, file_type) if file_type == "md": title_from_content = extract_markdown_title(content) if title_from_content: filename = generate_filename(title_from_content, file_type) with open(filename, "w", encoding="utf-8") as f: if is_image: f.write(content) else: f.write(prompt + "\n\n" + content) return filename def extract_markdown_title(content): """Extract the first markdown title from content.""" title_match = re.search(r'^\s*#\s*(.+)', content, re.MULTILINE) if title_match: return title_match.group(1).strip() return None # HTML5 Speech Synthesis @st.cache_resource def SpeechSynthesis(result): documentHTML5 = f''' Read It Aloud

🔊 Read It Aloud

''' st.components.v1.html(documentHTML5, width=1280, height=300) # Process functions for different media types def process_text(text_input): """Process text input with GPT-4o.""" if text_input: st.session_state.messages.append({"role": "user", "content": text_input}) with st.chat_message("user"): st.markdown(text_input) with st.chat_message("assistant"): completion = client.chat.completions.create( model=st.session_state["openai_model"], messages=[ {"role": m["role"], "content": m["content"]} for m in st.session_state.messages ], stream=False ) return_text = completion.choices[0].message.content st.write("Assistant: " + return_text) create_and_save_file(return_text, file_type="md", prompt=text_input) st.session_state.messages.append({"role": "assistant", "content": return_text}) def process_image(image_input, user_prompt): """Process image with GPT-4o vision.""" if isinstance(image_input, str): with open(image_input, "rb") as image_file: image_input = image_file.read() base64_image = base64.b64encode(image_input).decode("utf-8") response = client.chat.completions.create( model=st.session_state["openai_model"], messages=[ {"role": "system", "content": "You are a helpful assistant that responds in Markdown."}, {"role": "user", "content": [ {"type": "text", "text": user_prompt}, {"type": "image_url", "image_url": { "url": f"data:image/png;base64,{base64_image}" }} ]} ], temperature=0.0, ) return response.choices[0].message.content def process_audio(audio_input, text_input=''): """Process audio with GPT-4o and Whisper.""" if isinstance(audio_input, str): with open(audio_input, "rb") as file: audio_input = file.read() transcription = client.audio.transcriptions.create( model="whisper-1", file=audio_input, ) st.session_state.messages.append({"role": "user", "content": transcription.text}) with st.chat_message("assistant"): st.markdown(transcription.text) SpeechSynthesis(transcription.text) filename = generate_filename(transcription.text, "wav") create_and_save_file(audio_input.getvalue(), "wav", transcription.text, True) def process_video(video_path, seconds_per_frame=1): """Process video files for frame extraction and audio.""" base64Frames = [] video = cv2.VideoCapture(video_path) total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT)) fps = video.get(cv2.CAP_PROP_FPS) frames_to_skip = int(fps * seconds_per_frame) for frame_idx in range(0, total_frames, frames_to_skip): video.set(cv2.CAP_PROP_POS_FRAMES, frame_idx) success, frame = video.read() if not success: break _, buffer = cv2.imencode(".jpg", frame) base64Frames.append(base64.b64encode(buffer).decode("utf-8")) video.release() # Extract audio base_video_path = os.path.splitext(video_path)[0] audio_path = f"{base_video_path}.mp3" try: video_clip = VideoFileClip(video_path) video_clip.audio.write_audiofile(audio_path) video_clip.close() except: st.warning("No audio track found in video") audio_path = None return base64Frames, audio_path def create_media_gallery(): """Create the media gallery interface.""" st.header("🎬 Media Gallery") tabs = st.tabs(["🖼️ Images", "🎵 Audio", "🎥 Video", "🎨 Scene Generator"]) with tabs[0]: image_files = glob.glob("*.png") + glob.glob("*.jpg") if image_files: cols = st.columns(3) for idx, image_file in enumerate(image_files): with cols[idx % 3]: st.image(image_file) st.caption(os.path.basename(image_file)) # Add prompt input for GPT-4o analysis prompt = st.text_input(f"Analyze image {idx}", "Describe this image in detail and list key elements.") if st.button(f"Analyze {idx}"): analysis = process_image(image_file, prompt) st.markdown(analysis) with tabs[1]: audio_files = glob.glob("*.mp3") + glob.glob("*.wav") for audio_file in audio_files: with st.expander(f"🎵 {os.path.basename(audio_file)}"): st.audio(audio_file) if st.button(f"Transcribe {audio_file}"): process_audio(audio_file) with tabs[2]: video_files = glob.glob("*.mp4") for video_file in video_files: with st.expander(f"🎥 {os.path.basename(video_file)}"): st.video(video_file) if st.button(f"Analyze {video_file}"): frames, audio = process_video(video_file) if audio: st.audio(audio) with tabs[3]: for collection_name, bikes in bike_collections.items(): st.subheader(collection_name) cols = st.columns(len(bikes)) for idx, (bike_name, details) in enumerate(bikes.items()): with cols[idx]: st.markdown(f"""

{details['emoji']} {bike_name}

{details['prompt']}

""", unsafe_allow_html=True) def main(): st.title("🚲 Bike Cinematic Universe") # Main navigation tab_main = st.radio("Choose Action:", ["📸 Upload Media", "🎬 View Gallery", "🎨 Generate Scene", "🤖 Chat"], horizontal=True) if tab_main == "📸 Upload Media": col1, col2 = st.columns(2) with col1: uploaded_image = st.file_uploader("Upload Image", type=['png', 'jpg']) if uploaded_image: st.image(uploaded_image) prompt = st