Spaces:

awacke1
/

RescuerOfStolenBikes

Sleeping

App Files Files Community

awacke1 committed on Nov 16, 2024

Commit

37c6135

verified ·

1 Parent(s): 8f04cdd

Update app.py

Browse files

Files changed (1) hide show

app.py +164 -63

app.py CHANGED Viewed

@@ -15,6 +15,13 @@ from audio_recorder_streamlit import audio_recorder
 import json
 from openai import OpenAI
 from dotenv import load_dotenv
 # Page config
 st.set_page_config(
@@ -65,7 +72,26 @@ st.markdown("""
 # Load environment variables
 load_dotenv()
-client = OpenAI(api_key=os.getenv('OPENAI_API_KEY'))
 # Bike Collections
 bike_collections = {
@@ -86,14 +112,6 @@ bike_collections = {
                      Lighting: Natural starlight with subtle rim lighting
                      Color palette: Deep blues, silver highlights, cosmic purples""",
             "emoji": "✨"
-        },
-        "Moonlit Hopper": {
-            "prompt": """A sleek black bike mid-hop over a moonlit meadow.
-                     Full moon illuminating misty surroundings with fireflies dancing around.
-                     Camera angle: Side profile with slight low angle
-                     Lighting: Soft moonlight with atmospheric fog
-                     Color palette: Silver blues, soft whites, deep shadows""",
-            "emoji": "🌙"
         }
     },
     "Nature-Inspired Collection 🌲": {
@@ -104,36 +122,142 @@ bike_collections = {
                      Lighting: Natural forest lighting with sun rays
                      Color palette: Forest greens, golden sunlight, deep shadows""",
             "emoji": "🦗"
-        },
-        "Onyx Leapfrog": {
-            "prompt": """A bike with obsidian-black finish jumping over a sparkling creek.
-                     Water reflection creates mirror effect with ripples from the leap.
-                     Camera angle: Low angle from water level
-                     Lighting: Golden hour side lighting
-                     Color palette: Deep blacks, water blues, forest greens""",
-            "emoji": "🐸"
         }
     }
 }
 # File handling functions
 def generate_filename(prompt, file_type):
-    """Generate a safe filename from prompt and timestamp"""
     central = pytz.timezone('US/Central')
     safe_date_time = datetime.now(central).strftime("%m%d_%H%M")
     replaced_prompt = re.sub(r'[<>:"/\\|?*\n]', ' ', prompt)
     safe_prompt = re.sub(r'\s+', ' ', replaced_prompt).strip()[:240]
     return f"{safe_date_time}_{safe_prompt}.{file_type}"
-def save_file(content, filename, is_binary=False):
-    """Save content to file with proper mode"""
-    mode = 'wb' if is_binary else 'w'
-    with open(filename, mode) as f:
-        f.write(content)
     return filename
 def process_video(video_path, seconds_per_frame=1):
-    """Extract frames and audio from video"""
     base64Frames = []
     video = cv2.VideoCapture(video_path)
     total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
@@ -164,6 +288,7 @@ def process_video(video_path, seconds_per_frame=1):
     return base64Frames, audio_path
 def create_media_gallery():
     st.header("🎬 Media Gallery")
     tabs = st.tabs(["🖼️ Images", "🎵 Audio", "🎥 Video", "🎨 Scene Generator"])
@@ -176,18 +301,31 @@ def create_media_gallery():
                 with cols[idx % 3]:
                     st.image(image_file)
                     st.caption(os.path.basename(image_file))
     with tabs[1]:
         audio_files = glob.glob("*.mp3") + glob.glob("*.wav")
         for audio_file in audio_files:
             with st.expander(f"🎵 {os.path.basename(audio_file)}"):
                 st.audio(audio_file)
     with tabs[2]:
         video_files = glob.glob("*.mp4")
         for video_file in video_files:
             with st.expander(f"🎥 {os.path.basename(video_file)}"):
                 st.video(video_file)
     with tabs[3]:
         for collection_name, bikes in bike_collections.items():
@@ -208,51 +346,14 @@ def main():
     # Main navigation
     tab_main = st.radio("Choose Action:",
-                        ["📸 Upload Media", "🎬 View Gallery", "🎨 Generate Scene"],
                         horizontal=True)
     if tab_main == "📸 Upload Media":
         col1, col2 = st.columns(2)
         with col1:
-            # Image upload
             uploaded_image = st.file_uploader("Upload Image", type=['png', 'jpg'])
             if uploaded_image:
                 st.image(uploaded_image)
-                prompt = st.text_input("Image Description:")
-                if st.button("Process Image"):
-                    filename = generate_filename(prompt, uploaded_image.type.split('/')[-1])
-                    save_file(uploaded_image.getvalue(), filename, is_binary=True)
-                    st.success(f"Saved as {filename}")
-        with col2:
-            # Audio/Video upload
-            uploaded_media = st.file_uploader("Upload Audio/Video", type=['mp3', 'wav', 'mp4'])
-            if uploaded_media:
-                if uploaded_media.type.startswith('audio'):
-                    st.audio(uploaded_media)
-                else:
-                    st.video(uploaded_media)
-                if st.button("Save Media"):
-                    filename = generate_filename("media", uploaded_media.type.split('/')[-1])
-                    save_file(uploaded_media.getvalue(), filename, is_binary=True)
-                    st.success(f"Saved as {filename}")
-    elif tab_main == "🎬 View Gallery":
-        create_media_gallery()
-    else:  # Generate Scene
-        st.header("🎨 Scene Generator")
-        selected_collection = st.selectbox("Choose Collection", list(bike_collections.keys()))
-        selected_bike = st.selectbox("Choose Bike", list(bike_collections[selected_collection].keys()))
-        bike_details = bike_collections[selected_collection][selected_bike]
-        st.markdown(f"""
-        <div class='scene-card'>
-            <h3>{bike_details['emoji']} {selected_bike}</h3>
-            <p>{bike_details['prompt']}</p>
-        </div>
-        """, unsafe_allow_html=True)
-if __name__ == "__main__":
-    main()

 import json
 from openai import OpenAI
 from dotenv import load_dotenv
+from huggingface_hub import InferenceClient
+from bs4 import BeautifulSoup
+import textract
+from xml.etree import ElementTree as ET
+from urllib.parse import quote
+import time
+from collections import deque
 # Page config
 st.set_page_config(
 # Load environment variables
 load_dotenv()
+# Initialize OpenAI client
+# Both values are read from the environment; os.getenv returns None for a
+# variable that is not set, and that None is passed straight to the client.
+client = OpenAI(
+    api_key=os.getenv('OPENAI_API_KEY'),
+    organization=os.getenv('OPENAI_ORG_ID')
+)
+# Initialize session state
+# Only fill in defaults when the keys are missing so values already stored in
+# st.session_state are not overwritten.
+if "openai_model" not in st.session_state:
+    st.session_state["openai_model"] = "gpt-4o-2024-05-13"
+if "messages" not in st.session_state:
+    # Chat history: a list of {"role": ..., "content": ...} dicts.
+    st.session_state.messages = []
+# Hugging Face settings
+API_URL = os.getenv('API_URL')
+HF_KEY = os.getenv('HF_KEY')
+# NOTE(review): if HF_KEY is unset the header value becomes the literal
+# string "Bearer None" -- confirm callers check for a missing key.
+headers = {
+    "Authorization": f"Bearer {HF_KEY}",
+    "Content-Type": "application/json"
+}
 # Bike Collections
 bike_collections = {
                      Lighting: Natural starlight with subtle rim lighting
                      Color palette: Deep blues, silver highlights, cosmic purples""",
             "emoji": "✨"
         }
     },
     "Nature-Inspired Collection 🌲": {
                      Lighting: Natural forest lighting with sun rays
                      Color palette: Forest greens, golden sunlight, deep shadows""",
             "emoji": "🦗"
         }
     }
 }
 # File handling functions
 def generate_filename(prompt, file_type):
+    """Generate a safe filename using the prompt and file type.
+
+    The result has the form ``<MMDD_HHMM>_<prompt>.<file_type>`` where the
+    timestamp is the current US/Central time. Angle brackets, colon, double
+    quote, forward and back slashes, pipe, question mark, asterisk and
+    newlines in the prompt are replaced by spaces, runs of whitespace are
+    collapsed to one space, and the prompt part is cut to 240 characters.
+
+    The timestamp has minute resolution, so the same prompt within the same
+    minute yields the same name.
+
+    Args:
+        prompt: Text used for the descriptive part of the name.
+        file_type: Extension to append, without the leading dot.
+
+    Returns:
+        The generated filename as a string.
+    """
     central = pytz.timezone('US/Central')
     safe_date_time = datetime.now(central).strftime("%m%d_%H%M")
     replaced_prompt = re.sub(r'[<>:"/\\|?*\n]', ' ', prompt)
     safe_prompt = re.sub(r'\s+', ' ', replaced_prompt).strip()[:240]
     return f"{safe_date_time}_{safe_prompt}.{file_type}"
+def create_and_save_file(content, file_type="md", prompt=None, is_image=False, should_save=True):
+    """Create and save file with proper handling of different types.
+
+    Args:
+        content: Text to write, or raw bytes for binary payloads.
+        file_type: Extension of the file to create, without the dot.
+        prompt: Optional prompt. Used to name the file and, for text
+            content, written above the content.
+        is_image: When true, only ``content`` is written (no prompt header).
+        should_save: When false, nothing is written and None is returned.
+
+    Returns:
+        The name of the file written, or None when ``should_save`` is false.
+    """
+    if not should_save:
+        return None
+    is_binary = isinstance(content, (bytes, bytearray))
+    # Bytes cannot be run through the filename regexes, so a binary payload
+    # without a prompt falls back to a fixed stem instead of its own content.
+    if prompt:
+        name_seed = prompt
+    elif is_binary:
+        name_seed = "file"
+    else:
+        name_seed = content
+    filename = generate_filename(name_seed, file_type)
+    if file_type == "md" and not is_binary:
+        title_from_content = extract_markdown_title(content)
+        if title_from_content:
+            filename = generate_filename(title_from_content, file_type)
+    if is_binary:
+        # Binary data must go through a binary handle; a text-mode handle
+        # rejects bytes with a TypeError.
+        with open(filename, "wb") as f:
+            f.write(content)
+    else:
+        with open(filename, "w", encoding="utf-8") as f:
+            # prompt defaults to None, so only prepend it when it is set;
+            # concatenating None with a string raises a TypeError.
+            if is_image or not prompt:
+                f.write(content)
+            else:
+                f.write(prompt + "\n\n" + content)
     return filename
+def extract_markdown_title(content):
+    """Extract the first markdown title from content.
+
+    A title is the text after one or more leading ``#`` characters on a
+    line. The ``#`` markers and surrounding whitespace are not part of the
+    returned title, whatever the heading level.
+
+    Args:
+        content: Markdown text to scan. May be empty or None.
+
+    Returns:
+        The title text, or None when no non-empty heading is found.
+    """
+    if not content:
+        return None
+    # `#+(?!#)` consumes the whole run of hashes so that "## Title" yields
+    # "Title" rather than "# Title"; a line made only of hashes is skipped.
+    title_match = re.search(r'^[ \t]*#+(?!#)[ \t]*(.+)', content, re.MULTILINE)
+    if title_match:
+        title = title_match.group(1).strip()
+        # A heading made only of whitespace counts as "no title".
+        return title or None
+    return None
+# HTML5 Speech Synthesis
+@st.cache_resource
+def SpeechSynthesis(result):
+    """Render an HTML5 widget that reads ``result`` aloud in the browser.
+
+    The widget is a textarea pre-filled with ``result`` plus a button that
+    passes the textarea's text to the browser's ``speechSynthesis`` API.
+
+    Args:
+        result: Text to place in the textarea. It is HTML-escaped before
+            being embedded in the page.
+
+    NOTE(review): ``st.cache_resource`` keys on ``result``; confirm the
+    widget is still rendered on repeated calls with the same text.
+    """
+    import html
+
+    # The text comes from model output or transcriptions, so it may contain
+    # markup such as "</textarea>" or "<script>". Escaping keeps it inside
+    # the textarea; the browser decodes the entities back to the same text.
+    safe_text = html.escape(str(result))
+    documentHTML5 = f'''
+    <!DOCTYPE html>
+    <html>
+    <head>
+        <title>Read It Aloud</title>
+        <script type="text/javascript">
+            function readAloud() {{
+                const text = document.getElementById("textArea").value;
+                const speech = new SpeechSynthesisUtterance(text);
+                window.speechSynthesis.speak(speech);
+            }}
+        </script>
+    </head>
+    <body>
+        <h1>🔊 Read It Aloud</h1>
+        <textarea id="textArea" rows="10" cols="80">{safe_text}</textarea>
+        <br>
+        <button onclick="readAloud()">🔊 Read Aloud</button>
+    </body>
+    </html>
+    '''
+    st.components.v1.html(documentHTML5, width=1280, height=300)
+# Process functions for different media types
+def process_text(text_input):
+    """Send one chat turn to the configured OpenAI model and record the reply.
+
+    The user text is appended to ``st.session_state.messages`` and echoed in
+    a user chat bubble. The full history is then sent to the model named in
+    ``st.session_state["openai_model"]``. The reply is shown, saved to a
+    markdown file via ``create_and_save_file`` and appended to the history.
+
+    Args:
+        text_input: The user's message. Empty or None input is ignored.
+    """
+    # Guard clause: nothing to send for empty input.
+    if not text_input:
+        return
+    st.session_state.messages.append({"role": "user", "content": text_input})
+    with st.chat_message("user"):
+        st.markdown(text_input)
+    with st.chat_message("assistant"):
+        # Forward only the role/content fields of every stored message.
+        chat_payload = [
+            {"role": entry["role"], "content": entry["content"]}
+            for entry in st.session_state.messages
+        ]
+        completion = client.chat.completions.create(
+            model=st.session_state["openai_model"],
+            messages=chat_payload,
+            stream=False
+        )
+        return_text = completion.choices[0].message.content
+        st.write("Assistant: " + return_text)
+        create_and_save_file(return_text, file_type="md", prompt=text_input)
+        assistant_turn = {"role": "assistant", "content": return_text}
+        st.session_state.messages.append(assistant_turn)
+def process_image(image_input, user_prompt):
+    """Process image with GPT-4o vision.
+
+    Args:
+        image_input: Path to an image file (str) or the raw image bytes.
+        user_prompt: Instruction sent to the model alongside the image.
+
+    Returns:
+        The text content of the model's first choice. The system message
+        asks the model to answer in Markdown.
+    """
+    import mimetypes
+
+    # Raw bytes carry no type information, so they keep the PNG default.
+    mime_type = "image/png"
+    if isinstance(image_input, str):
+        # Paths may point at non-PNG images (the uploader accepts jpg too),
+        # so label the data URL with the type implied by the extension.
+        guessed_type, _ = mimetypes.guess_type(image_input)
+        if guessed_type and guessed_type.startswith("image/"):
+            mime_type = guessed_type
+        with open(image_input, "rb") as image_file:
+            image_input = image_file.read()
+    base64_image = base64.b64encode(image_input).decode("utf-8")
+    response = client.chat.completions.create(
+        model=st.session_state["openai_model"],
+        messages=[
+            {"role": "system", "content": "You are a helpful assistant that responds in Markdown."},
+            {"role": "user", "content": [
+                {"type": "text", "text": user_prompt},
+                {"type": "image_url", "image_url": {
+                    "url": f"data:{mime_type};base64,{base64_image}"
+                }}
+            ]}
+        ],
+        # Temperature 0 requests the least random sampling.
+        temperature=0.0,
+    )
+    return response.choices[0].message.content
+def process_audio(audio_input, text_input=''):
+    """Process audio with GPT-4o and Whisper.
+
+    Transcribes the audio with ``whisper-1``, appends the transcript to the
+    chat history as a user message, shows it with a read-aloud widget and,
+    for audio that did not come from a file on disk, saves the audio under
+    a name derived from the transcript.
+
+    Args:
+        audio_input: Path to an audio file (str), raw audio bytes, or a
+            file-like object exposing ``getvalue()``.
+        text_input: Currently unused; kept for interface compatibility.
+    """
+    source_path = audio_input if isinstance(audio_input, str) else None
+    if source_path is not None:
+        with open(source_path, "rb") as file:
+            audio_bytes = file.read()
+        upload_name = os.path.basename(source_path)
+    else:
+        # Accept both in-memory buffers and plain bytes; calling getvalue()
+        # unconditionally raises AttributeError on bytes.
+        if hasattr(audio_input, "getvalue"):
+            audio_bytes = audio_input.getvalue()
+        else:
+            audio_bytes = audio_input
+        upload_name = getattr(audio_input, "name", None) or "audio.wav"
+    # Send (filename, bytes) so the upload carries a filename and extension
+    # rather than anonymous raw bytes.
+    transcription = client.audio.transcriptions.create(
+        model="whisper-1",
+        file=(upload_name, audio_bytes),
+    )
+    st.session_state.messages.append({"role": "user", "content": transcription.text})
+    with st.chat_message("assistant"):
+        st.markdown(transcription.text)
+        SpeechSynthesis(transcription.text)
+        # Audio read from disk is already stored; only persist new audio.
+        if source_path is None:
+            filename = generate_filename(transcription.text, "wav")
+            # Audio is binary, so it is written with a binary handle here
+            # instead of going through the text-mode file helper.
+            with open(filename, "wb") as f:
+                f.write(audio_bytes)
 def process_video(video_path, seconds_per_frame=1):
+    """Process video files for frame extraction and audio."""
     base64Frames = []
     video = cv2.VideoCapture(video_path)
     total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
     return base64Frames, audio_path
 def create_media_gallery():
+    """Create the media gallery interface."""
     st.header("🎬 Media Gallery")
     tabs = st.tabs(["🖼️ Images", "🎵 Audio", "🎥 Video", "🎨 Scene Generator"])
                 with cols[idx % 3]:
                     st.image(image_file)
                     st.caption(os.path.basename(image_file))
+                    # Add prompt input for GPT-4o analysis
+                    prompt = st.text_input(f"Analyze image {idx}",
+                                         "Describe this image in detail and list key elements.")
+                    if st.button(f"Analyze {idx}"):
+                        analysis = process_image(image_file, prompt)
+                        st.markdown(analysis)
     with tabs[1]:
         audio_files = glob.glob("*.mp3") + glob.glob("*.wav")
         for audio_file in audio_files:
             with st.expander(f"🎵 {os.path.basename(audio_file)}"):
                 st.audio(audio_file)
+                if st.button(f"Transcribe {audio_file}"):
+                    process_audio(audio_file)
     with tabs[2]:
         video_files = glob.glob("*.mp4")
         for video_file in video_files:
             with st.expander(f"🎥 {os.path.basename(video_file)}"):
                 st.video(video_file)
+                if st.button(f"Analyze {video_file}"):
+                    frames, audio = process_video(video_file)
+                    if audio:
+                        st.audio(audio)
     with tabs[3]:
         for collection_name, bikes in bike_collections.items():
     # Main navigation
     tab_main = st.radio("Choose Action:",
+                        ["📸 Upload Media", "🎬 View Gallery", "🎨 Generate Scene", "🤖 Chat"],
                         horizontal=True)
     if tab_main == "📸 Upload Media":
         col1, col2 = st.columns(2)
         with col1:
             uploaded_image = st.file_uploader("Upload Image", type=['png', 'jpg'])
             if uploaded_image:
                 st.image(uploaded_image)
+                prompt = st