juzer09 committed on
Commit 4b12a2e · verified · 1 Parent(s): 68cbc97

Update app.py

Files changed (1)
  1. app.py +385 -272
app.py CHANGED
@@ -1,272 +1,385 @@
- #!/usr/bin/env python3
- """
- Madverse Music - Hugging Face Spaces Version
- Streamlit app for HF Spaces deployment
- """
-
- import streamlit as st
- import torch
- import librosa
- import tempfile
- import os
- import time
- import numpy as np
-
- # Import the sonics library for model loading
- try:
-     from sonics import HFAudioClassifier
- except ImportError:
-     st.error("Sonics library not found. Please install it first.")
-     st.stop()
-
- # Global model variable
- model = None
-
- # Page configuration
- st.set_page_config(
-     page_title="Madverse Music: AI Music Detector",
-     page_icon="🎵",
-     layout="wide",
-     initial_sidebar_state="expanded"
- )
-
- # Custom CSS
- st.markdown("""
- <style>
-     .main-header {
-         background: linear-gradient(90deg, #667eea 0%, #764ba2 100%);
-         padding: 1rem;
-         border-radius: 10px;
-         color: white;
-         text-align: center;
-         margin-bottom: 2rem;
-     }
-     .result-box {
-         padding: 1rem;
-         border-radius: 10px;
-         margin: 1rem 0;
-         border-left: 5px solid;
-     }
-     .real-music {
-         background-color: #d4edda;
-         border-left-color: #28a745;
-     }
-     .fake-music {
-         background-color: #f8d7da;
-         border-left-color: #dc3545;
-     }
- </style>
- """, unsafe_allow_html=True)
-
- @st.cache_resource
- def load_model():
-     """Load the model with caching for HF Spaces"""
-     try:
-         with st.spinner("Loading AI model... This may take a moment..."):
-             # Use the same loading method as the working API
-             model = HFAudioClassifier.from_pretrained("awsaf49/sonics-spectttra-alpha-120s")
-             model.eval()
-             return model
-     except Exception as e:
-         st.error(f"Failed to load model: {str(e)}")
-         return None
-
- def process_audio(audio_file, model):
-     """Process audio file and return classification"""
-     try:
-         # Save uploaded file temporarily
-         with tempfile.NamedTemporaryFile(delete=False, suffix='.wav') as tmp_file:
-             tmp_file.write(audio_file.read())
-             tmp_path = tmp_file.name
-
-         # Load audio (model uses 16kHz sample rate)
-         audio, sr = librosa.load(tmp_path, sr=16000)
-
-         # Convert to tensor and add batch dimension
-         audio_tensor = torch.FloatTensor(audio).unsqueeze(0)
-
-         # Get prediction using the same pattern as working API
-         with torch.no_grad():
-             output = model(audio_tensor)
-
-         # Convert logit to probability using sigmoid
-         probability = torch.sigmoid(output).item()
-
-         # Classify: prob < 0.5 = Real, prob >= 0.5 = Fake
-         if probability < 0.5:
-             classification = "Real"
-             confidence = (1 - probability) * 2  # Convert to 0-1 scale
-         else:
-             classification = "Fake"
-             confidence = (probability - 0.5) * 2  # Convert to 0-1 scale
-
-         # Calculate duration
-         duration = len(audio) / sr
-
-         # Clean up
-         os.unlink(tmp_path)
-
-         return {
-             'classification': classification,
-             'confidence': min(confidence, 1.0),  # Cap at 1.0
-             'probability': probability,
-             'raw_score': output.item(),
-             'duration': duration,
-             'success': True
-         }
-
-     except Exception as e:
-         # Clean up on error
-         if 'tmp_path' in locals():
-             try:
-                 os.unlink(tmp_path)
-             except:
-                 pass
-         return {
-             'success': False,
-             'error': str(e)
-         }
-
- def main():
-     # Header
-     st.markdown("""
-     <div class="main-header">
-         <h1>Madverse Music: AI Music Detector</h1>
-         <p>Detect AI-generated music vs human-created music using advanced AI technology</p>
-     </div>
-     """, unsafe_allow_html=True)
-
-     # Sidebar
-     with st.sidebar:
-         st.markdown("### About")
-         st.markdown("""
-         This AI model can detect whether music is:
-         - **Real**: Human-created music
-         - **Fake**: AI-generated music (Suno, Udio, etc.)
-
-         **Model**: SpecTTTra-α (120s)
-         **Accuracy**: 97% F1 score
-         **Max Duration**: 120 seconds
-         """)
-
-         st.markdown("### Supported Formats")
-         st.markdown("- WAV (.wav)")
-         st.markdown("- MP3 (.mp3)")
-         st.markdown("- FLAC (.flac)")
-         st.markdown("- M4A (.m4a)")
-         st.markdown("- OGG (.ogg)")
-
-         st.markdown("### Links")
-         st.markdown("- [Madverse Website](https://madverse.co)")
-         st.markdown("- [GitHub Repository](#)")
-
-     # Load model
-     model = load_model()
-
-     if model is None:
-         st.error("Model failed to load. Please refresh the page.")
-         return
-
-     st.success("AI model loaded successfully!")
-
-     # File upload
-     st.markdown("### Upload Audio File")
-     uploaded_file = st.file_uploader(
-         "Choose an audio file",
-         type=['wav', 'mp3', 'flac', 'm4a', 'ogg'],
-         help="Upload an audio file to analyze (max 120 seconds)"
-     )
-
-     if uploaded_file is not None:
-         # Display file info
-         st.markdown("### File Information")
-         col1, col2, col3 = st.columns(3)
-
-         with col1:
-             st.metric("Filename", uploaded_file.name)
-         with col2:
-             st.metric("File Size", f"{uploaded_file.size / 1024:.1f} KB")
-         with col3:
-             st.metric("Format", uploaded_file.type)
-
-         # Audio player
-         st.markdown("### Preview")
-         st.audio(uploaded_file)
-
-         # Analysis button
-         if st.button("Analyze Audio", type="primary", use_container_width=True):
-             try:
-                 with st.spinner("Analyzing audio... This may take a few seconds..."):
-                     # Reset file pointer
-                     uploaded_file.seek(0)
-
-                     # Process audio
-                     start_time = time.time()
-                     result = process_audio(uploaded_file, model)
-                     processing_time = time.time() - start_time
-
-                     if not result['success']:
-                         st.error(f"Error processing audio: {result['error']}")
-                         return
-
-                     # Display results
-                     st.markdown("### Analysis Results")
-
-                     classification = result['classification']
-                     confidence = result['confidence']
-
-                     # Result box
-                     if classification == "Real":
-                         st.markdown(f"""
-                         <div class="result-box real-music">
-                             <h3>Result: Human-Created Music</h3>
-                             <p><strong>Classification:</strong> {classification}</p>
-                             <p><strong>Confidence:</strong> {confidence:.1%}</p>
-                             <p><strong>Message:</strong> This appears to be human-created music!</p>
-                         </div>
-                         """, unsafe_allow_html=True)
-                     else:
-                         st.markdown(f"""
-                         <div class="result-box fake-music">
-                             <h3>Result: AI-Generated Music</h3>
-                             <p><strong>Classification:</strong> {classification}</p>
-                             <p><strong>Confidence:</strong> {confidence:.1%}</p>
-                             <p><strong>Message:</strong> This appears to be AI-generated music!</p>
-                         </div>
-                         """, unsafe_allow_html=True)
-
-                     # Detailed metrics
-                     with st.expander("Detailed Metrics"):
-                         col1, col2, col3 = st.columns(3)
-
-                         with col1:
-                             st.metric("Confidence", f"{confidence:.1%}")
-                         with col2:
-                             st.metric("Probability", f"{result['probability']:.3f}")
-                         with col3:
-                             st.metric("Processing Time", f"{processing_time:.2f}s")
-
-                         if result['duration'] > 0:
-                             st.metric("Duration", f"{result['duration']:.1f}s")
-
-                         st.markdown("**Interpretation:**")
-                         st.markdown("""
-                         - **Probability < 0.5**: Classified as Real (human-created)
-                         - **Probability ≥ 0.5**: Classified as Fake (AI-generated)
-                         - **Confidence**: How certain the model is about its prediction
-                         """)
-
-             except Exception as e:
-                 st.error(f"Error processing audio: {str(e)}")
-
-     # Footer
-     st.markdown("---")
-     st.markdown("""
-     <div style="text-align: center; color: #666;">
-         <p>Powered by <strong>Madverse Music</strong> | Built with Streamlit & PyTorch</p>
-         <p>This tool is for research and educational purposes. Results may vary depending on audio quality.</p>
-     </div>
-     """, unsafe_allow_html=True)
-
- if __name__ == "__main__":
-     main()
+ #!/usr/bin/env python3
+ """
+ Madverse Music API
+ AI Music Detection Service
+ """
+
+ from fastapi import FastAPI, HTTPException, BackgroundTasks, Header, Depends
+ from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials
+ from pydantic import BaseModel, HttpUrl
+ import torch
+ import librosa
+ import tempfile
+ import os
+ import requests
+ from pathlib import Path
+ import time
+ from typing import Optional, Annotated, List
+ import uvicorn
+ import asyncio
+
+ # Initialize FastAPI app
+ app = FastAPI(
+     title="Madverse Music API",
+     description="AI-powered music detection API to identify AI-generated vs human-created music",
+     version="1.0.0",
+     docs_url="/",
+     redoc_url="/docs"
+ )
+
+ # API Key Configuration
+ API_KEY = os.getenv("MADVERSE_API_KEY", "madverse-music-api-key-2024")  # Default key for demo
+
+ # Global model variable
+ model = None
+
+ async def verify_api_key(x_api_key: Annotated[str | None, Header()] = None):
+     """Verify API key from header"""
+     if x_api_key is None:
+         raise HTTPException(
+             status_code=401,
+             detail="Missing API key. Please provide a valid X-API-Key header."
+         )
+     if x_api_key != API_KEY:
+         raise HTTPException(
+             status_code=401,
+             detail="Invalid API key. Please provide a valid X-API-Key header."
+         )
+     return x_api_key
+
+ class MusicAnalysisRequest(BaseModel):
+     urls: List[HttpUrl]
+
+ def check_api_key_first(request: MusicAnalysisRequest, x_api_key: Annotated[str | None, Header()] = None):
+     """Check API key before processing request"""
+     if x_api_key is None:
+         raise HTTPException(
+             status_code=401,
+             detail="Missing API key. Please provide a valid X-API-Key header."
+         )
+     if x_api_key != API_KEY:
+         raise HTTPException(
+             status_code=401,
+             detail="Invalid API key. Please provide a valid X-API-Key header."
+         )
+     return request
+
+ class FileAnalysisResult(BaseModel):
+     url: str
+     success: bool
+     classification: Optional[str] = None  # "Real" or "Fake"
+     confidence: Optional[float] = None  # 0.0 to 1.0
+     probability: Optional[float] = None  # Raw sigmoid probability
+     raw_score: Optional[float] = None  # Raw model output
+     duration: Optional[float] = None  # Audio duration in seconds
+     message: str
+     processing_time: Optional[float] = None
+     error: Optional[str] = None
+
+ class MusicAnalysisResponse(BaseModel):
+     success: bool
+     total_files: int
+     successful_analyses: int
+     failed_analyses: int
+     results: List[FileAnalysisResult]
+     total_processing_time: float
+     message: str
+
+ class ErrorResponse(BaseModel):
+     success: bool
+     error: str
+     message: str
+
+ @app.on_event("startup")
+ async def load_model():
+     """Load the AI model on startup"""
+     global model
+     try:
+         from sonics import HFAudioClassifier
+         print("🔄 Loading Madverse Music AI model...")
+         model = HFAudioClassifier.from_pretrained("awsaf49/sonics-spectttra-alpha-120s")
+         model.eval()
+         print("✅ Model loaded successfully!")
+     except Exception as e:
+         print(f"❌ Failed to load model: {e}")
+         raise
+
+ def cleanup_file(file_path: str):
+     """Background task to cleanup temporary files"""
+     try:
+         if os.path.exists(file_path):
+             os.unlink(file_path)
+     except:
+         pass
+
+ def download_audio(url: str, max_size_mb: int = 100) -> str:
+     """Download audio file from URL with size validation"""
+     try:
+         # Check if URL is accessible
+         response = requests.head(str(url), timeout=10)
+
+         # Check content size
+         content_length = response.headers.get('Content-Length')
+         if content_length and int(content_length) > max_size_mb * 1024 * 1024:
+             raise HTTPException(
+                 status_code=413,
+                 detail=f"File too large. Maximum size: {max_size_mb}MB"
+             )
+
+         # Download file
+         response = requests.get(str(url), timeout=30, stream=True)
+         response.raise_for_status()
+
+         # Create temporary file
+         with tempfile.NamedTemporaryFile(delete=False, suffix='.tmp') as tmp_file:
+             downloaded_size = 0
+             for chunk in response.iter_content(chunk_size=8192):
+                 downloaded_size += len(chunk)
+                 if downloaded_size > max_size_mb * 1024 * 1024:
+                     os.unlink(tmp_file.name)
+                     raise HTTPException(
+                         status_code=413,
+                         detail=f"File too large. Maximum size: {max_size_mb}MB"
+                     )
+                 tmp_file.write(chunk)
+
+         return tmp_file.name
+
+     except requests.exceptions.RequestException as e:
+         raise HTTPException(
+             status_code=400,
+             detail=f"Failed to download audio: {str(e)}"
+         )
+     except Exception as e:
+         raise HTTPException(
+             status_code=500,
+             detail=f"Error downloading file: {str(e)}"
+         )
+
+ def classify_audio(file_path: str) -> dict:
+     """Classify audio file using the AI model"""
+     try:
+         # Load audio (model uses 16kHz sample rate)
+         audio, sr = librosa.load(file_path, sr=16000)
+
+         # Convert to tensor and add batch dimension
+         audio_tensor = torch.FloatTensor(audio).unsqueeze(0)
+
+         # Get prediction
+         with torch.no_grad():
+             output = model(audio_tensor)
+
+         # Convert logit to probability using sigmoid
+         prob = torch.sigmoid(output).item()
+
+         # Classify: prob < 0.5 = Real, prob >= 0.5 = Fake
+         if prob < 0.5:
+             classification = "Real"
+             confidence = (1 - prob) * 2  # Convert to 0-1 scale
+         else:
+             classification = "Fake"
+             confidence = (prob - 0.5) * 2  # Convert to 0-1 scale
+
+         return {
+             "classification": classification,
+             "confidence": min(confidence, 1.0),  # Cap at 1.0
+             "probability": prob,
+             "raw_score": output.item(),
+             "duration": len(audio) / sr
+         }
+
+     except Exception as e:
+         raise HTTPException(
+             status_code=500,
+             detail=f"Error analyzing audio: {str(e)}"
+         )
+
+ async def process_single_url(url: str) -> FileAnalysisResult:
+     """Process a single URL and return result"""
+     start_time = time.time()
+
+     try:
+         # Download audio file
+         temp_file = download_audio(url)
+
+         # Classify audio
+         result = classify_audio(temp_file)
+
+         # Calculate processing time
+         processing_time = time.time() - start_time
+
+         # Cleanup file in background
+         try:
+             os.unlink(temp_file)
+         except:
+             pass
+
+         # Prepare response
+         emoji = "🎤" if result["classification"] == "Real" else "🤖"
+         message = f'{emoji} Detected as {result["classification"].lower()} music'
+
+         return FileAnalysisResult(
+             url=str(url),
+             success=True,
+             classification=result["classification"],
+             confidence=result["confidence"],
+             probability=result["probability"],
+             raw_score=result["raw_score"],
+             duration=result["duration"],
+             message=message,
+             processing_time=processing_time
+         )
+
+     except Exception as e:
+         processing_time = time.time() - start_time
+         error_msg = str(e)
+
+         return FileAnalysisResult(
+             url=str(url),
+             success=False,
+             message=f"❌ Failed to process: {error_msg}",
+             processing_time=processing_time,
+             error=error_msg
+         )
+
+ @app.post("/analyze", response_model=MusicAnalysisResponse)
+ async def analyze_music(
+     request: MusicAnalysisRequest = Depends(check_api_key_first)
+ ):
+     """
+     Analyze music from URL(s) to detect if it's AI-generated or human-created
+
+     - **urls**: Array of direct URLs to audio files (MP3, WAV, FLAC, M4A, OGG)
+     - Returns classification results for each file
+     - Processes files concurrently for better performance when multiple URLs provided
+     """
+     start_time = time.time()
+
+     if not model:
+         raise HTTPException(
+             status_code=503,
+             detail="Model not loaded. Please try again later."
+         )
+
+     if len(request.urls) > 50:  # Limit processing
+         raise HTTPException(
+             status_code=400,
+             detail="Too many URLs. Maximum 50 files per request."
+         )
+
+     if len(request.urls) == 0:
+         raise HTTPException(
+             status_code=400,
+             detail="At least one URL is required."
+         )
+
+     try:
+         # Process all URLs concurrently with limited concurrency
+         semaphore = asyncio.Semaphore(5)  # Limit to 5 concurrent downloads
+
+         async def process_with_semaphore(url):
+             async with semaphore:
+                 return await process_single_url(str(url))
+
+         # Create tasks for all URLs
+         tasks = [process_with_semaphore(url) for url in request.urls]
+
+         # Wait for all tasks to complete
+         results = await asyncio.gather(*tasks, return_exceptions=True)
+
+         # Process results and handle any exceptions
+         processed_results = []
+         successful_count = 0
+         failed_count = 0
+
+         for i, result in enumerate(results):
+             if isinstance(result, Exception):
+                 # Handle exception case
+                 processed_results.append(FileAnalysisResult(
+                     url=str(request.urls[i]),
+                     success=False,
+                     message=f"❌ Processing failed: {str(result)}",
+                     error=str(result)
+                 ))
+                 failed_count += 1
+             else:
+                 processed_results.append(result)
+                 if result.success:
+                     successful_count += 1
+                 else:
+                     failed_count += 1
+
+         # Calculate total processing time
+         total_processing_time = time.time() - start_time
+
+         # Prepare summary message
+         total_files = len(request.urls)
+         if total_files == 1:
+             # Single file message
+             if successful_count == 1:
+                 message = processed_results[0].message
+             else:
+                 message = processed_results[0].message
+         else:
+             # Multiple files message
+             if successful_count == total_files:
+                 message = f"✅ Successfully analyzed all {total_files} files"
+             elif successful_count > 0:
+                 message = f"⚠️ Analyzed {successful_count}/{total_files} files successfully"
+             else:
+                 message = f"❌ Failed to analyze any files"
+
+         return MusicAnalysisResponse(
+             success=successful_count > 0,
+             total_files=total_files,
+             successful_analyses=successful_count,
+             failed_analyses=failed_count,
+             results=processed_results,
+             total_processing_time=total_processing_time,
+             message=message
+         )
+
+     except Exception as e:
+         raise HTTPException(
+             status_code=500,
+             detail=f"Internal server error during processing: {str(e)}"
+         )
+
+ @app.get("/health")
+ async def health_check():
+     """Health check endpoint"""
+     return {
+         "status": "healthy",
+         "model_loaded": model is not None,
+         "service": "Madverse Music API"
+     }
+
+ @app.get("/info")
+ async def get_info():
+     """Get API information"""
+     return {
+         "name": "Madverse Music API",
+         "version": "1.0.0",
+         "description": "AI-powered music detection to identify AI-generated vs human-created music",
+         "model": "SpecTTTra-α (120s)",
+         "accuracy": {
+             "f1_score": 0.97,
+             "sensitivity": 0.96,
+             "specificity": 0.99
+         },
+         "supported_formats": ["MP3", "WAV", "FLAC", "M4A", "OGG"],
+         "max_file_size": "100MB",
+         "max_duration": "120 seconds",
+         "authentication": {
+             "required": True,
+             "type": "API Key",
+             "header": "X-API-Key",
+             "example": "X-API-Key: your-api-key-here"
+         },
+         "usage": {
+             "curl_example": "curl -X POST 'http://localhost:8000/analyze' -H 'X-API-Key: your-api-key' -H 'Content-Type: application/json' -d '{\"urls\": [\"https://example.com/song.mp3\"]}'"
+         }
+     }
+
+ if __name__ == "__main__":
+     uvicorn.run(app, host="0.0.0.0", port=8000)
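
For reference, a minimal client sketch for the new /analyze endpoint added in this commit. It assumes the service is reachable at http://localhost:8000 and that the demo key baked into app.py is still active; the base URL, key value, and script name are illustrative assumptions, not part of the commit itself.

# client_example.py - hypothetical usage sketch, not part of this commit
import requests

BASE_URL = "http://localhost:8000"        # assumed local deployment
API_KEY = "madverse-music-api-key-2024"   # demo default from app.py; override via MADVERSE_API_KEY in production

# POST a batch of direct audio URLs (up to 50 per request) with the X-API-Key header
payload = {"urls": ["https://example.com/song.mp3"]}
response = requests.post(
    f"{BASE_URL}/analyze",
    json=payload,
    headers={"X-API-Key": API_KEY},
    timeout=120,
)
response.raise_for_status()

# Each entry in "results" mirrors FileAnalysisResult: classification is "Real" or "Fake"
for item in response.json()["results"]:
    if item["success"]:
        print(item["url"], item["classification"], f'{item["confidence"]:.1%}')
    else:
        print(item["url"], "failed:", item["error"])

The unauthenticated /health endpoint can be polled first to confirm the model has finished loading before sending analysis requests.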