Spaces:

czd358121692
/

MusicalToy4Frank_Standalone

Running on Zero

App Files Community

czd358121692 committed on Nov 5

Commit

d5f2ccb

•

1 Parent(s): d0d23d6

add credits and features

Browse files

Files changed (1) hide show

app.py +41 -12

app.py CHANGED Viewed

@@ -18,7 +18,6 @@ from huggingface_hub import scan_cache_dir
 from stable_audio_tools import get_pretrained_model
 from stable_audio_tools.inference.generation import generate_diffusion_cond
-# Cache setup code remains same
 CACHE_ROOT = '/tmp'
 os.environ['HF_HOME'] = CACHE_ROOT
 os.environ['HUGGINGFACE_HUB_CACHE'] = os.path.join(CACHE_ROOT, 'hub')
@@ -117,7 +116,7 @@ def get_caption(image_in):
 # Continuing from previous code...
-def get_musical_prompt(user_prompt, chosen_model):
     if not user_prompt:
         raise gr.Error("No image caption provided")
@@ -134,6 +133,12 @@ Consider these elements in your composition:
 - Soundscapes: environmental depth and spatial audio qualities
 Respond immediately with a single musical prompt. No explanation, just the musical description.
 """
         instruction = f"""
 <|system|>
@@ -154,7 +159,7 @@ Respond immediately with a single musical prompt. No explanation, just the music
         musical_prompt = outputs[0]["generated_text"]
         # Clean system message and tokens
-        cleaned_prompt = musical_prompt.replace("<|system|>", "").replace("</s>", "").replace("<|user|>", "").replace("<|assistant|>", "")
         lines = cleaned_prompt.split('\n')
         relevant_lines = [line.strip() for line in lines
@@ -174,7 +179,8 @@ Respond immediately with a single musical prompt. No explanation, just the music
     except Exception as e:
         print(f"Error in get_musical_prompt: {str(e)}")
-        return "Ambient orchestral composition with piano and strings, creating a contemplative atmosphere"
 def get_stable_audio_open(prompt, seconds_total=47, steps=100, cfg_scale=7):
     try:
@@ -239,10 +245,10 @@ def check_disk_space(min_gb=10):
     disk_usage = psutil.disk_usage('/')
     gb_free = disk_usage.free / (1024 * 1024 * 1024)
     if gb_free < min_gb:
-        print("Disk space GB free" + str(gb_free))
-        raise RuntimeError(f"Low disk space: {gb_free:.1f}GB free, need {min_gb}GB")
     else:
-        print("Disk space GB free" + str(gb_free))
     return True
 def smart_cleanup():
@@ -289,7 +295,7 @@ def infer(image_in, api_status):
     if image_in is None:
         raise gr.Error("Please provide an image of architecture")
-    if api_status == "Orchestra is tuning...":
         raise gr.Error("The model is still tuning, please try again later")
     try:
@@ -297,7 +303,7 @@ def infer(image_in, api_status):
         user_prompt = get_caption(image_in)
         gr.Info("🎼 Weaving into melody...")
-        musical_prompt = get_musical_prompt(user_prompt, "Stable Audio Open")
         gr.Info("🎻 Breathing life into notes...")
         music_o = get_stable_audio_open(musical_prompt)
@@ -366,13 +372,36 @@ with gr.Blocks(css=css) as demo:
                 )
                 retry_btn = gr.Button("🎲", visible=False)
                 result = gr.Audio(
-                    label="Music"
                 )
-        # Credits section remains the same
         gr.HTML("""
         <div style="margin-top: 40px; padding: 20px; border-top: 1px solid #ddd;">
-            <!-- Your existing credits HTML -->
         </div>
         """)

 from stable_audio_tools import get_pretrained_model
 from stable_audio_tools.inference.generation import generate_diffusion_cond
 CACHE_ROOT = '/tmp'
 os.environ['HF_HOME'] = CACHE_ROOT
 os.environ['HUGGINGFACE_HUB_CACHE'] = os.path.join(CACHE_ROOT, 'hub')
 # Continuing from previous code...
+def get_musical_prompt(user_prompt):
     if not user_prompt:
         raise gr.Error("No image caption provided")
 - Soundscapes: environmental depth and spatial audio qualities
 Respond immediately with a single musical prompt. No explanation, just the musical description.
+Examples:
+Input: "A curved titanium facade reflecting sunlight with flowing organic forms"
+Output: "Fluid jazz piano with shimmering orchestral textures, metallic percussion accents, and expansive reverb creating architectural depth"
+Input: "A geometric glass atrium with intersecting angular planes"
+Output: "Crystalline minimalist composition with layered string harmonies and precise rhythmic structures, emphasizing spatial transparency"
 """
         instruction = f"""
 <|system|>
         musical_prompt = outputs[0]["generated_text"]
         # Clean system message and tokens
+        cleaned_prompt = musical_prompt.replace("<|system|>", "").replace("</s>", "").replace("<|user|>", "").replace("<|assistant|>", "").replace("Output:", "")
         lines = cleaned_prompt.split('\n')
         relevant_lines = [line.strip() for line in lines
     except Exception as e:
         print(f"Error in get_musical_prompt: {str(e)}")
+        final_prompt = "Ambient orchestral composition with piano and strings, creating a contemplative atmosphere"
+        return final_prompt
 def get_stable_audio_open(prompt, seconds_total=47, steps=100, cfg_scale=7):
     try:
     disk_usage = psutil.disk_usage('/')
     gb_free = disk_usage.free / (1024 * 1024 * 1024)
     if gb_free < min_gb:
+        print("Disk space GB free: " + str(int(gb_free)))
+        raise RuntimeError(f"Low disk space: {int(gb_free)}GB free, need {min_gb}GB")
     else:
+        print("Disk space GB free: " + str(int(gb_free)))
     return True
 def smart_cleanup():
     if image_in is None:
         raise gr.Error("Please provide an image of architecture")
+    if api_status == "Orchestra is tuning. Please refresh the webpage.":
         raise gr.Error("The model is still tuning, please try again later")
     try:
         user_prompt = get_caption(image_in)
         gr.Info("🎼 Weaving into melody...")
+        musical_prompt = get_musical_prompt(user_prompt)
         gr.Info("🎻 Breathing life into notes...")
         music_o = get_stable_audio_open(musical_prompt)
                 )
                 retry_btn = gr.Button("🎲", visible=False)
                 result = gr.Audio(
+                    label="Music",
+                    autoplay = True
                 )
+        # Credits section
         gr.HTML("""
         <div style="margin-top: 40px; padding: 20px; border-top: 1px solid #ddd;">
+            <h3 style="text-align: center;">Credits & Acknowledgments</h3>
+            <h4>Architecture</h4>
+            <p>Frank O Gehry, Gehry Partners LLP and Gehry Tech team for pushing the boundaries of form and space for humanity.</p>
+            <h4>Technologies</h4>
+            <ul>
+                <li>Music Generation: <a href="https://huggingface.co/spaces/harmonai/stable-audio-public">Stable Audio Open</a> by STABILITY AI LTD</li>
+                <li>Image Understanding: <a href="https://huggingface.co/microsoft/kosmos-2">Kosmos-2</a> by Microsoft</li>
+                <li>Language Model: Zephyr by Hugging Face</li>
+                <li>Affordable Online Hosting Platform & Computational Resources by Hugging Face</li>
+            </ul>
+            <h4>Contributors</h4>
+            <ul>
+                <li>Architects, Engineers & Consultants who bring these visions to life</li>
+                <li>Contractor teams, craftspeople, and workers who materialize these dreams</li>
+                <li>Photographers who capture and share these architectural moments to general public online</li>
+                <li>Musicians and composers whose work inspires our audio training behind the scenes for generations</li>
+            </ul>
+            <p style="text-align: center; margin-top: 20px; font-size: 0.9em;">
+                This project stands on the shoulders of countless individuals who contribute to the intersection of architecture, technology, and broader arts.
+                <br>Special thanks to all the open-source communities and researchers making these technologies accessible.
+            </p>
         </div>
         """)