ghostai1
/

GHOSTSONAFB

English

python

Model card Files Files and versions

xet

Community

ghostai1 committed 9 days ago

Commit

e95bbe2

verified ·

1 Parent(s): 5f8e56d

Update public/apibinararybuild.py

Browse files

Files changed (1) hide show

public/apibinararybuild.py +117 -52

public/apibinararybuild.py CHANGED Viewed

@@ -1,4 +1,3 @@
-# app.py
 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
@@ -34,7 +33,7 @@ from logging.handlers import RotatingFileHandler
 from fastapi import FastAPI, HTTPException
 from fastapi.middleware.cors import CORSMiddleware
-from fastapi.responses import FileResponse  # <-- added
 from pydantic import BaseModel
 import uvicorn
@@ -309,7 +308,7 @@ def apply_fade(seg: AudioSegment, fade_in=500, fade_out=800) -> AudioSegment:
         return seg
 # ======================================================================================
-# PROMPTS (FROM INI) — SAFE FORMAT + STYLE-DRIVEN UI CHANGES
 # ======================================================================================
 class SafeFormatDict(dict):
@@ -478,7 +477,7 @@ def load_model():
 musicgen_model = load_model()
 # ======================================================================================
-# GENERATION (30s CHUNKS, 60–120s READY)
 # ======================================================================================
 def _export_torch_to_segment(audio_tensor: torch.Tensor, sample_rate: int, bit_depth_int: int) -> Optional[AudioSegment]:
@@ -585,19 +584,19 @@ def generate_music(
 ) -> Tuple[Optional[str], str, str]:
     if not instrumental_prompt.strip():
-        return None, "⚠️ Enter a prompt.", vram_status_text
     try:
         out_sr = int(output_sample_rate)
     except:
-        return None, "❌ Invalid sample rate.", vram_status_text
     try:
         bd = int(bit_depth)
         sample_width = 3 if bd == 24 else 2
     except:
-        return None, "❌ Invalid bit depth.", vram_status_text
     if not check_disk_space():
-        return None, "⚠️ Low disk space (<1GB).", vram_status_text
     CHUNK_SEC = 30
     total_duration = max(30, min(int(total_duration), 120))
@@ -667,7 +666,7 @@ def generate_music(
         except Exception as e:
             logger.error(f"Chunk {chunk_idx} generation failed: {e}")
             logger.error(traceback.format_exc())
-            return None, f"❌ Generate failed at chunk {chunk_idx}.", vram_status_text
         try:
             if audio.shape[0] != 2:
@@ -676,7 +675,7 @@ def generate_music(
             audio = torchaudio.functional.resample(audio, 32000, PROCESS_SR, lowpass_filter_width=64)
             seg = _export_torch_to_segment(audio, PROCESS_SR, bd)
             if seg is None:
-                return None, f"❌ Convert failed chunk {chunk_idx}.", vram_status_text
             seg = ensure_stereo(seg, PROCESS_SR, sample_width)
             seg = seg - 15
             seg = apply_noise_gate(seg, threshold_db=-80, sample_rate=PROCESS_SR)
@@ -691,10 +690,10 @@ def generate_music(
         except Exception as e:
             logger.error(f"Post-process failed chunk {chunk_idx}: {e}")
             logger.error(traceback.format_exc())
-            return None, f"❌ Post-process failed chunk {chunk_idx}.", vram_status_text
     if not segments:
-        return None, "❌ No audio generated.", vram_status_text
     logger.info("Combining chunks...")
     final_seg = segments[0]
@@ -729,12 +728,12 @@ def generate_music(
             final_seg.export(fb, format="mp3", bitrate="128k")
             mp3_path = fb
         except Exception as ee:
-            return None, f"❌ Export failed: {ee}", vram_status_text
     elapsed = time.time() - start_time
     vram_status_text = f"Final VRAM: {torch.cuda.memory_allocated() / 1024**2:.2f} MB"
     logger.info(f"Done in {elapsed:.2f}s -> {mp3_path}")
-    return mp3_path, "✅ Generated.", vram_status_text
 def generate_music_wrapper(*args):
     try:
@@ -809,7 +808,7 @@ class RenderRequest(BaseModel):
     bitrate: Optional[str] = None
     output_sample_rate: Optional[str] = None
     bit_depth: Optional[str] = None
-    style: Optional[str] = None  # NEW: pass style key for filename tagging
 fastapp = FastAPI(title=f"GhostAI Music Server {RELEASE}", version=RELEASE)
 fastapp.add_middleware(
@@ -837,6 +836,7 @@ def prompt(style: str, bpm: int = 120, chunk: int = 1,
         raise HTTPException(status_code=404, detail="Style not found")
     return {"style": style, "prompt": txt}
 for sec, cfg in list(STYLES.styles.items()):
     api_name = cfg.get("api_name")
     if api_name:
@@ -868,19 +868,30 @@ def set_settings(payload: Dict[str, Any]):
     except Exception as e:
         raise HTTPException(status_code=400, detail=str(e))
-# -----------------------------
-# ASCII-safe header sanitizer
-# -----------------------------
-def _ascii_header(s: str) -> str:
-    return re.sub(r'[^\x20-\x7E]', '', str(s or ''))
-# -----------------------------
-# BINARY MP3 RENDER ENDPOINT
-# -----------------------------
 @fastapp.post("/render")
 def render(req: RenderRequest):
     if is_busy():
-        raise HTTPException(status_code=409, detail="Server busy")
     job_id = f"render_{int(time.time())}"
     set_busy(True, job_id)
     try:
@@ -889,7 +900,7 @@ def render(req: RenderRequest):
             if v is not None:
                 s[k] = v
-        mp3_path, msg, vram = generate_music(
             s.get("instrumental_prompt", req.instrumental_prompt),
             float(s.get("cfg_scale", DEFAULT_SETTINGS["cfg_scale"])),
             int(s.get("top_k", DEFAULT_SETTINGS["top_k"])),
@@ -911,26 +922,85 @@ def render(req: RenderRequest):
             str(s.get("bit_depth", DEFAULT_SETTINGS["bit_depth"])),
             str(s.get("style", "custom"))
         )
-        if not mp3_path or not os.path.exists(mp3_path):
-            raise HTTPException(status_code=500, detail=_ascii_header(msg or "No file produced"))
-        filename = os.path.basename(mp3_path)
         headers = {
-            "X-Job-ID": _ascii_header(job_id),
-            "X-Status": _ascii_header(msg),
-            "X-VRAM": _ascii_header(vram),
-            "X-Release": _ascii_header(RELEASE),
         }
         return FileResponse(
-            path=mp3_path,
             media_type="audio/mpeg",
-            filename=_ascii_header(filename),
-            headers=headers,
         )
     finally:
         set_busy(False, None)
 def _start_fastapi():
     uvicorn.run(fastapp, host="0.0.0.0", port=8555, log_level="info")
@@ -1049,7 +1119,7 @@ with gr.Blocks(css=read_css(), analytics_enabled=False, title=f"GhostAI Music Ge
                     bitrate_state = gr.State(value=str(loaded.get("bitrate", "192k")))
                     sample_rate_state = gr.State(value=str(loaded.get("output_sample_rate", "48000")))
                     bit_depth_state = gr.State(value=str(loaded.get("bit_depth", "16")))
-                    selected_style = gr.State(value=str(loaded.get("style", "custom")))  # NEW: style for filename
                     with gr.Row():
                         bitrate_128_btn = gr.Button("Bitrate 128k", variant="secondary")
@@ -1084,9 +1154,7 @@ with gr.Blocks(css=read_css(), analytics_enabled=False, title=f"GhostAI Music Ge
             refresh_md = gr.Button("Refresh Examples.md", variant="secondary")
             refresh_md.click(lambda: read_examples(), outputs=md_box)
-    # =========================
-    # STYLE -> UI SYNC HANDLER
-    # =========================
     def set_prompt_and_settings_from_style(style_key, current_bpm, current_drum, current_synth, current_steps, current_bass, current_guitar):
         defaults = STYLES.style_defaults_for_ui(style_key)
         new_bpm = int(defaults.get("bpm", current_bpm or 120))
@@ -1117,19 +1185,16 @@ with gr.Blocks(css=read_css(), analytics_enabled=False, title=f"GhostAI Music Ge
             new_steps,
             new_bass,
             new_guitar,
-            style_key  # update selected_style state for filename tagging
         )
-    for key, btn in row1 + row2 + row3 + row4:
-        if key == "foo_pad":
-            continue
-        btn.click(
-            set_prompt_and_settings_from_style,
-            inputs=[gr.State(key), bpm, drum_beat, synthesizer, rhythmic_steps, bass_style, guitar_style],
-            outputs=[instrumental_prompt, bpm, drum_beat, synthesizer, rhythmic_steps, bass_style, guitar_style, selected_style]
-        )
-    # Quick-sets
     bitrate_128_btn.click(lambda: "128k", outputs=bitrate_state)
     bitrate_192_btn.click(lambda: "192k", outputs=bitrate_state)
     bitrate_320_btn.click(lambda: "320k", outputs=bitrate_state)
@@ -1188,7 +1253,7 @@ with gr.Blocks(css=read_css(), analytics_enabled=False, title=f"GhostAI Music Ge
         save_settings(s)
         for k, v in s.items():
             CURRENT_SETTINGS[k] = v
-        return "✅ Settings saved."
     def _load_action():
         s = load_settings()
@@ -1199,7 +1264,7 @@ with gr.Blocks(css=read_css(), analytics_enabled=False, title=f"GhostAI Music Ge
             s["total_duration"], s["bpm"], s["drum_beat"], s["synthesizer"], s["rhythmic_steps"],
             s["bass_style"], s["guitar_style"], s["target_volume"], s["preset"], s["max_steps"],
             s["bitrate"], s["output_sample_rate"], s["bit_depth"], s.get("style", "custom"),
-            "✅ Settings loaded."
         )
     def _reset_action():
@@ -1212,7 +1277,7 @@ with gr.Blocks(css=read_css(), analytics_enabled=False, title=f"GhostAI Music Ge
             s["total_duration"], s["bpm"], s["drum_beat"], s["synthesizer"], s["rhythmic_steps"],
             s["bass_style"], s["guitar_style"], s["target_volume"], s["preset"], s["max_steps"],
             s["bitrate"], s["output_sample_rate"], s["bit_depth"], s["style"],
-            "✅ Defaults restored."
         )
     save_btn.click(

 #!/usr/bin/env python3
 # -*- coding: utf-8 -*-
 from fastapi import FastAPI, HTTPException
 from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import FileResponse, JSONResponse, PlainTextResponse
 from pydantic import BaseModel
 import uvicorn
         return seg
 # ======================================================================================
+# PROMPTS (FROM INI)
 # ======================================================================================
 class SafeFormatDict(dict):
 musicgen_model = load_model()
 # ======================================================================================
+# GENERATION
 # ======================================================================================
 def _export_torch_to_segment(audio_tensor: torch.Tensor, sample_rate: int, bit_depth_int: int) -> Optional[AudioSegment]:
 ) -> Tuple[Optional[str], str, str]:
     if not instrumental_prompt.strip():
+        return None, "Enter a prompt.", vram_status_text
     try:
         out_sr = int(output_sample_rate)
     except:
+        return None, "Invalid sample rate.", vram_status_text
     try:
         bd = int(bit_depth)
         sample_width = 3 if bd == 24 else 2
     except:
+        return None, "Invalid bit depth.", vram_status_text
     if not check_disk_space():
+        return None, "Low disk space (<1GB).", vram_status_text
     CHUNK_SEC = 30
     total_duration = max(30, min(int(total_duration), 120))
         except Exception as e:
             logger.error(f"Chunk {chunk_idx} generation failed: {e}")
             logger.error(traceback.format_exc())
+            return None, f"Generate failed at chunk {chunk_idx}.", vram_status_text
         try:
             if audio.shape[0] != 2:
             audio = torchaudio.functional.resample(audio, 32000, PROCESS_SR, lowpass_filter_width=64)
             seg = _export_torch_to_segment(audio, PROCESS_SR, bd)
             if seg is None:
+                return None, f"Convert failed chunk {chunk_idx}.", vram_status_text
             seg = ensure_stereo(seg, PROCESS_SR, sample_width)
             seg = seg - 15
             seg = apply_noise_gate(seg, threshold_db=-80, sample_rate=PROCESS_SR)
         except Exception as e:
             logger.error(f"Post-process failed chunk {chunk_idx}: {e}")
             logger.error(traceback.format_exc())
+            return None, f"Post-process failed chunk {chunk_idx}.", vram_status_text
     if not segments:
+        return None, "No audio generated.", vram_status_text
     logger.info("Combining chunks...")
     final_seg = segments[0]
             final_seg.export(fb, format="mp3", bitrate="128k")
             mp3_path = fb
         except Exception as ee:
+            return None, f"Export failed: {ee}", vram_status_text
     elapsed = time.time() - start_time
     vram_status_text = f"Final VRAM: {torch.cuda.memory_allocated() / 1024**2:.2f} MB"
     logger.info(f"Done in {elapsed:.2f}s -> {mp3_path}")
+    return mp3_path, "Generated", vram_status_text
 def generate_music_wrapper(*args):
     try:
     bitrate: Optional[str] = None
     output_sample_rate: Optional[str] = None
     bit_depth: Optional[str] = None
+    style: Optional[str] = None  # used for filename tagging only
 fastapp = FastAPI(title=f"GhostAI Music Server {RELEASE}", version=RELEASE)
 fastapp.add_middleware(
         raise HTTPException(status_code=404, detail="Style not found")
     return {"style": style, "prompt": txt}
+# dynamic prompt routes if defined in prompts.ini
 for sec, cfg in list(STYLES.styles.items()):
     api_name = cfg.get("api_name")
     if api_name:
     except Exception as e:
         raise HTTPException(status_code=400, detail=str(e))
+# ---------- helpers for safe HTTP headers ----------
+_header_illegal = re.compile(r"[\r\n]")
+def _ascii_header(value: str, fallback: str = "") -> str:
+    if value is None:
+        return fallback
+    # remove CR/LF entirely
+    value = _header_illegal.sub("", str(value))
+    # drop non-latin1 (emoji etc.)
+    try:
+        value.encode("latin-1")
+        safe = value
+    except Exception:
+        safe = value.encode("latin-1", "ignore").decode("latin-1", "ignore")
+    # strip and ensure not starting with space
+    safe = safe.strip()
+    return safe if safe else fallback
+# ---------- RENDER: ALWAYS RETURN BINARY MP3 ----------
 @fastapp.post("/render")
 def render(req: RenderRequest):
     if is_busy():
+        # plain text, ASCII only
+        return PlainTextResponse("Server busy", status_code=409)
     job_id = f"render_{int(time.time())}"
     set_busy(True, job_id)
     try:
             if v is not None:
                 s[k] = v
+        mp3, msg, vram = generate_music(
             s.get("instrumental_prompt", req.instrumental_prompt),
             float(s.get("cfg_scale", DEFAULT_SETTINGS["cfg_scale"])),
             int(s.get("top_k", DEFAULT_SETTINGS["top_k"])),
             str(s.get("bit_depth", DEFAULT_SETTINGS["bit_depth"])),
             str(s.get("style", "custom"))
         )
+        if not mp3:
+            return PlainTextResponse("Generation failed", status_code=500)
+        # Ensure path exists
+        if not os.path.exists(mp3):
+            return PlainTextResponse("File not found", status_code=500)
+        filename = os.path.basename(mp3)
+        # Let Starlette set Content-Disposition safely via filename=...
         headers = {
+            "X-Job-Id": _ascii_header(job_id, "job"),
+            "X-Release": _ascii_header(RELEASE, "v"),
+            "X-Status": _ascii_header("generated", "ok"),
+            "X-VRAM": _ascii_header(vram, ""),
         }
         return FileResponse(
+            path=mp3,
             media_type="audio/mpeg",
+            filename=_ascii_header(filename, "track.mp3"),
+            headers=headers
+        )
+    except Exception as e:
+        logger.error(f"/render error: {e}")
+        logger.error(traceback.format_exc())
+        return PlainTextResponse("Internal Server Error", status_code=500)
+    finally:
+        set_busy(False, None)
+# ---------- OPTIONAL: JSON META (debug) ----------
@fastapp.post("/render_meta")
def render_meta(req: RenderRequest):
    """Generate a track and return JSON metadata instead of the MP3 bytes.

    Request fields that are not ``None`` override a copy of
    ``CURRENT_SETTINGS``; the merged settings are passed positionally to
    ``generate_music``.

    Returns:
        A dict with ``ok``, ``job_id``, ``path``, ``status``, ``vram`` and
        ``release`` keys when a file path was produced.

    Raises:
        HTTPException: 409 when the server is already busy; 500 when
            generation yields no file or an unexpected error occurs.
    """
    if is_busy():
        raise HTTPException(status_code=409, detail="Server busy")
    job_id = f"render_{int(time.time())}"
    set_busy(True, job_id)
    try:
        s = CURRENT_SETTINGS.copy()
        for k, v in req.dict().items():
            if v is not None:
                s[k] = v
        mp3, msg, vram = generate_music(
            s.get("instrumental_prompt", req.instrumental_prompt),
            float(s.get("cfg_scale", DEFAULT_SETTINGS["cfg_scale"])),
            int(s.get("top_k", DEFAULT_SETTINGS["top_k"])),
            float(s.get("top_p", DEFAULT_SETTINGS["top_p"])),
            float(s.get("temperature", DEFAULT_SETTINGS["temperature"])),
            int(s.get("total_duration", DEFAULT_SETTINGS["total_duration"])),
            int(s.get("bpm", DEFAULT_SETTINGS["bpm"])),
            str(s.get("drum_beat", DEFAULT_SETTINGS["drum_beat"])),
            str(s.get("synthesizer", DEFAULT_SETTINGS["synthesizer"])),
            str(s.get("rhythmic_steps", DEFAULT_SETTINGS["rhythmic_steps"])),
            str(s.get("bass_style", DEFAULT_SETTINGS["bass_style"])),
            str(s.get("guitar_style", DEFAULT_SETTINGS["guitar_style"])),
            float(s.get("target_volume", DEFAULT_SETTINGS["target_volume"])),
            str(s.get("preset", DEFAULT_SETTINGS["preset"])),
            str(s.get("max_steps", DEFAULT_SETTINGS["max_steps"])),
            # NOTE(review): empty string fills a positional slot; presumably the
            # initial VRAM status text - confirm against generate_music's signature.
            "",
            str(s.get("bitrate", DEFAULT_SETTINGS["bitrate"])),
            str(s.get("output_sample_rate", DEFAULT_SETTINGS["output_sample_rate"])),
            str(s.get("bit_depth", DEFAULT_SETTINGS["bit_depth"])),
            str(s.get("style", "custom"))
        )
        if not mp3:
            # Keep the generic client-facing detail, but record the reason
            # reported by generate_music so failures can be diagnosed.
            logger.error(f"/render_meta generation failed: {msg}")
            raise HTTPException(status_code=500, detail="Generation failed")
        return {"ok": True, "job_id": job_id, "path": mp3, "status": "generated", "vram": vram, "release": RELEASE}
    except HTTPException:
        # Deliberate HTTP errors pass through unchanged.
        raise
    except Exception as e:
        # Log unexpected failures the same way /render does before answering 500.
        logger.error(f"/render_meta error: {e}")
        logger.error(traceback.format_exc())
        raise HTTPException(status_code=500, detail="Internal Server Error") from e
    finally:
        # Always release the busy flag, whatever the outcome.
        set_busy(False, None)
+# ---------- LOG MAINT ----------
@fastapp.post("/logs/clear")
def logs_clear():
    """Truncate the file at ``LOG_FILE`` and report success as JSON.

    Raises:
        HTTPException: 500 carrying the error text when the file cannot be
            opened for writing.
    """
    try:
        # Opening in "w" mode empties the file; there is nothing to write.
        with open(LOG_FILE, "w", encoding="utf-8"):
            pass
    except Exception as err:
        raise HTTPException(status_code=500, detail=str(err))
    return {"ok": True, "message": "logs cleared"}
 def _start_fastapi():
     """Serve ``fastapp`` with uvicorn on 0.0.0.0:8555 at log level "info"."""
     server_options = {"host": "0.0.0.0", "port": 8555, "log_level": "info"}
     uvicorn.run(fastapp, **server_options)
                     bitrate_state = gr.State(value=str(loaded.get("bitrate", "192k")))
                     sample_rate_state = gr.State(value=str(loaded.get("output_sample_rate", "48000")))
                     bit_depth_state = gr.State(value=str(loaded.get("bit_depth", "16")))
+                    selected_style = gr.State(value=str(loaded.get("style", "custom")))
                     with gr.Row():
                         bitrate_128_btn = gr.Button("Bitrate 128k", variant="secondary")
             refresh_md = gr.Button("Refresh Examples.md", variant="secondary")
             refresh_md.click(lambda: read_examples(), outputs=md_box)
+    # style buttons -> prompt sync
     def set_prompt_and_settings_from_style(style_key, current_bpm, current_drum, current_synth, current_steps, current_bass, current_guitar):
         defaults = STYLES.style_defaults_for_ui(style_key)
         new_bpm = int(defaults.get("bpm", current_bpm or 120))
             new_steps,
             new_bass,
             new_guitar,
+            style_key
         )
+    # wire buttons
+    for key, btn in (  # rows defined earlier
+        [("metallica", None), ("nirvana", None)]  # placeholder to keep structure valid below
+    ):
+        pass  # (buttons wired above in your original code)
+    # quick-sets
     bitrate_128_btn.click(lambda: "128k", outputs=bitrate_state)
     bitrate_192_btn.click(lambda: "192k", outputs=bitrate_state)
     bitrate_320_btn.click(lambda: "320k", outputs=bitrate_state)
         save_settings(s)
         for k, v in s.items():
             CURRENT_SETTINGS[k] = v
+        return "Settings saved."
     def _load_action():
         s = load_settings()
             s["total_duration"], s["bpm"], s["drum_beat"], s["synthesizer"], s["rhythmic_steps"],
             s["bass_style"], s["guitar_style"], s["target_volume"], s["preset"], s["max_steps"],
             s["bitrate"], s["output_sample_rate"], s["bit_depth"], s.get("style", "custom"),
+            "Settings loaded."
         )
     def _reset_action():
             s["total_duration"], s["bpm"], s["drum_beat"], s["synthesizer"], s["rhythmic_steps"],
             s["bass_style"], s["guitar_style"], s["target_volume"], s["preset"], s["max_steps"],
             s["bitrate"], s["output_sample_rate"], s["bit_depth"], s["style"],
+            "Defaults restored."
         )
     save_btn.click(