Add produce_with_spectral_coherence() - professional production with spectral analysis

2026-04-13 16:17:02 -03:00
parent dac7ec2a5a
commit c6a1705026
1 changed file with 278 additions and 0 deletions
--- a/AbletonMCP_AI/mcp_server/server.py
+++ b/AbletonMCP_AI/mcp_server/server.py
@@ -192,6 +192,8 @@ TIMEOUTS = {
    "analyze_all_bpm": 600.0,  # 10 minutes for analyzing 800+ samples
    "select_bpm_coherent_pool": 20.0,
    "warp_clip_to_bpm": 30.0,
    # Spectral Coherence Production
    "produce_with_spectral_coherence": 300.0,
 }
@@ -6914,6 +6916,282 @@ def get_production_progress(ctx: Context) -> str:
        return _err(f"Error getting production progress: {str(e)}")
@mcp.tool()
def produce_with_spectral_coherence(ctx: Context,
                                    bpm: int = 100,
                                    key: str = "Am",
                                    style: str = "standard",
                                    coherence_threshold: float = 0.90,
                                    max_samples_per_role: int = 12,
                                    auto_record: bool = True) -> str:
    """
    Build a Session View production from spectrally coherent samples.

    For each role (kick, snare, hihat, perc, bass, drumloop, oneshot, fx) the
    sample database is queried by category, a kit is grown greedily from the
    longest sample by accepting candidates whose average coherence with the
    already accepted samples reaches ``coherence_threshold``, and the kit is
    loaded into a newly created audio track. The first clip of every populated
    track is fired and playback is started.

    Args:
        bpm: Project tempo. Used as the fallback BPM for samples without one
            and echoed in the result; this function does not set the tempo.
        key: Project key. Used as the fallback key for samples without one
            and echoed in the result.
        style: Production style label. Only echoed in the result.
        coherence_threshold: Minimum average coherence score a candidate needs
            to join a kit (documented range 0.0-1.0).
        max_samples_per_role: Upper bound on kit size per role (must be >= 1).
            At most 8 samples per role are actually loaded into clip slots.
        auto_record: Accepted for interface compatibility; not acted upon by
            this function.

    Returns:
        The ``_ok`` payload with per-role coherence scores, created tracks and
        a preview of the loaded samples, or an ``_err`` payload on failure.
    """
    import sqlite3
    from contextlib import closing
    from itertools import combinations

    import numpy as np

    DB_PATH = r"C:\ProgramData\Ableton\Live 12 Suite\Resources\MIDI Remote Scripts\libreria\reggaeton\sample_metadata.db"
    LIBRARY_PATH = r"C:\ProgramData\Ableton\Live 12 Suite\Resources\MIDI Remote Scripts\libreria\reggaeton"

    ROLES = ("kick", "snare", "hihat", "perc", "bass", "drumloop", "oneshot", "fx")
    MAX_SLOTS_PER_TRACK = 8
    # Score reported for a role whose kit has fewer than two samples (no pair
    # exists to measure).
    SINGLE_SAMPLE_COHERENCE = 0.85
    PROFESSIONAL_COHERENCE = 0.90

    # Role -> category substrings matched with SQL LIKE '%<substring>%'.
    ROLE_CATEGORIES = {
        "kick": ["kick", "kicks", "8. KICKS"],
        "snare": ["snare", "snares", "9. SNARE"],
        "hihat": ["hi-hat", "hi_hat", "hihats", "hat", "hats"],
        "perc": ["perc", "percs", "perc loop", "10. PERCS", "PERC"],
        "bass": ["bass", "basses", "Bass", "BASS", "reese"],
        "drumloop": ["drumloop", "drumloops", "4. DRUM LOOPS", "LATINOS - DRUM LOOPS"],
        "oneshot": ["oneshot", "oneshots", "3. ONE SHOTS", "LATINOS  -  ONE SHOTS", "20 One Shots"],
        "fx": ["fx", "FX", "5. FX", "transicion"],
        "vocal": ["vocal", "vocals", "11. VOCALS", "20 Vocals Phrases"],
        "pad": ["pad", "pads", "PAD"],
        "lead": ["lead", "leads", "LEAD"],
    }

    # The JOIN is kept so only samples that also have a samples_bpm row are
    # considered; the blob columns of samples_bpm are not selected because
    # nothing below reads them.
    CANDIDATE_QUERY = """
        SELECT s.path, s.bpm, s.key, s.duration, s.rms,
               s.spectral_centroid, s.spectral_rolloff, s.zero_crossing_rate,
               s.mfcc_1, s.mfcc_2, s.mfcc_3, s.mfcc_4, s.mfcc_5,
               s.mfcc_6, s.mfcc_7, s.mfcc_8, s.mfcc_9, s.mfcc_10,
               s.mfcc_11, s.mfcc_12, s.mfcc_13
        FROM samples s
        JOIN samples_bpm sb ON s.path = sb.path
        WHERE s.category LIKE ?
        AND s.duration > 0
        ORDER BY s.duration DESC
    """

    def cosine_similarity(v1, v2):
        """Return the cosine similarity of two vectors, or 0.0 if undefined."""
        try:
            a = np.asarray(v1, dtype=float)  # NULL (None) entries become NaN
            b = np.asarray(v2, dtype=float)
        except (TypeError, ValueError):
            return 0.0
        if a.size == 0 or a.shape != b.shape:
            return 0.0
        norm = float(np.linalg.norm(a) * np.linalg.norm(b))
        # NaN norm means a missing coefficient; zero norm means a null vector.
        if not np.isfinite(norm) or norm <= 0.0:
            return 0.0
        return float(np.dot(a, b) / norm)

    def calculate_coherence(s1, s2):
        """Return the weighted coherence score of two sample dicts.

        Weights: MFCC cosine similarity 40%, spectral centroid 30%,
        RMS 20%, zero-crossing rate 10%. The score is symmetric in its
        arguments.
        """
        mfcc_sim = cosine_similarity(s1['mfccs'], s2['mfccs'])

        # Normalise by the larger centroid so that swapping the arguments
        # gives the same score.
        c1, c2 = s1['spectral_centroid'], s2['spectral_centroid']
        centroid_sim = max(0, 1 - abs(c1 - c2) / max(c1, c2, 1))

        # A difference of 60 or more counts as fully incompatible
        # (presumably RMS is in dB -- TODO confirm against the analyzer).
        rms_sim = max(0, 1 - abs(s1['rms'] - s2['rms']) / 60)

        zcr_sim = 1 - min(1, abs(s1['zcr'] - s2['zcr']) * 10)

        return (mfcc_sim * 0.40
                + centroid_sim * 0.30
                + rms_sim * 0.20
                + zcr_sim * 0.10)

    def fetch_candidates(cursor, role):
        """Return the candidate sample dicts for a role, one per path."""
        seen_paths = set()
        candidates = []
        for cat in ROLE_CATEGORIES.get(role, [role]):
            cursor.execute(CANDIDATE_QUERY, (f"%{cat}%",))
            for row in cursor.fetchall():
                path = row[0]
                # Category patterns overlap ('%kick%' also matches 'kicks'),
                # so the same row comes back several times; keep the first.
                if path in seen_paths:
                    continue
                seen_paths.add(path)
                candidates.append({
                    'path': path,
                    'bpm': row[1] or bpm,
                    'key': row[2] or key,
                    'duration': row[3],
                    'rms': row[4] or -20,
                    'spectral_centroid': row[5] or 2000,
                    'spectral_rolloff': row[6] or 4000,
                    'zcr': row[7] or 0.1,
                    'mfccs': list(row[8:21]),
                })
        return candidates

    def select_coherent(role, candidates, min_coherence):
        """Greedily pick up to max_samples_per_role mutually coherent samples."""
        if len(candidates) < 2:
            logger.warning(f"[SPECTRAL] Pocos samples para rol {role}: {len(candidates)}")
            return candidates[:max_samples_per_role]

        chosen = [candidates[0]]  # seed the kit with the first candidate
        for candidate in candidates[1:]:
            if len(chosen) >= max_samples_per_role:
                break
            avg_coherence = float(np.mean(
                [calculate_coherence(candidate, member) for member in chosen]
            ))
            if avg_coherence >= min_coherence:
                chosen.append(candidate)
                logger.debug(f"[SPECTRAL] {role}: {candidate['path'][:30]}... coherencia={avg_coherence:.3f}")

        logger.info(f"[SPECTRAL] Rol {role}: {len(chosen)} samples seleccionados (coherencia >= {min_coherence})")
        return chosen

    if max_samples_per_role < 1:
        return _err("max_samples_per_role debe ser >= 1")

    try:
        # sqlite3.connect() would silently create an empty database file.
        if not os.path.isfile(DB_PATH):
            return _err(f"Base de datos no encontrada: {DB_PATH}")

        # closing() guarantees the connection is released on every exit path;
        # the database is only needed for the selection phase.
        with closing(sqlite3.connect(DB_PATH)) as conn:
            cursor = conn.cursor()

            cursor.execute("SELECT COUNT(*) FROM samples")
            total_samples = cursor.fetchone()[0]
            if total_samples == 0:
                return _err("Database vacia. Ejecutar analisis de libreria primero.")
            logger.info(f"[SPECTRAL] {total_samples} samples disponibles en base de datos")

            logger.info("[SPECTRAL] Iniciando seleccion coherente...")
            selected_kits = {}
            for role in ROLES:
                selected_kits[role] = select_coherent(
                    role, fetch_candidates(cursor, role), coherence_threshold
                )

        # Average pairwise coherence per role, converted to built-in floats so
        # the payload contains no NumPy scalar types.
        coherence_scores = {}
        for role, kit in selected_kits.items():
            pair_scores = [calculate_coherence(a, b) for a, b in combinations(kit, 2)]
            role_score = float(np.mean(pair_scores)) if pair_scores else SINGLE_SAMPLE_COHERENCE
            coherence_scores[role] = round(role_score, 3)

        overall_coherence = float(np.mean(list(coherence_scores.values())))
        logger.info(f"[SPECTRAL] Coherencia general: {overall_coherence:.3f}")

        # Create one audio track per non-empty kit and load its samples.
        tracks_created = []
        samples_loaded = []
        for role, kit in selected_kits.items():
            if not kit:
                continue

            track_result = _send_to_ableton(
                "create_audio_track",
                {"index": -1},
                timeout=TIMEOUTS["create_audio_track"]
            )
            if track_result.get("status") != "success":
                continue
            track_index = track_result["result"]["track_index"]

            _send_to_ableton(
                "set_track_name",
                {"track_index": track_index, "name": f"{role.title()} Spectral"},
                timeout=10.0
            )

            loaded_on_track = 0
            for slot_idx, sample in enumerate(kit[:MAX_SLOTS_PER_TRACK]):
                sample_path = os.path.join(LIBRARY_PATH, sample['path'])
                if not os.path.exists(sample_path):
                    continue
                load_result = _send_to_ableton(
                    "load_sample_to_clip",
                    {"track_index": track_index, "clip_index": slot_idx, "sample_path": sample_path},
                    timeout=TIMEOUTS["load_sample_to_clip"]
                )
                if load_result.get("status") != "success":
                    continue
                loaded_on_track += 1
                samples_loaded.append({
                    "role": role,
                    "track": track_index,
                    "slot": slot_idx,
                    "path": sample['path'],
                    "bpm": sample['bpm'],
                    "key": sample['key'],
                    "duration": sample['duration']
                })

            tracks_created.append({
                "role": role,
                "track_index": track_index,
                "samples_count": loaded_on_track
            })

        # Fire the first clip of every populated track, then start playback.
        for track_info in tracks_created:
            if track_info['samples_count'] > 0:
                _send_to_ableton(
                    "fire_clip",
                    {"track_index": track_info['track_index'], "clip_index": 0},
                    timeout=10.0
                )
        _send_to_ableton("start_playback", {}, timeout=10.0)

        return _ok({
            "status": "success",
            "message": "Produccion profesional con coherencia espectral creada",
            "total_samples_analyzed": total_samples,
            "samples_used": len(samples_loaded),
            "tracks_created": len(tracks_created),
            "coherence_threshold": coherence_threshold,
            "coherence_scores_by_role": coherence_scores,
            "overall_coherence": round(overall_coherence, 3),
            # bool() because a NumPy comparison result is not JSON serializable.
            "is_professional": bool(overall_coherence >= PROFESSIONAL_COHERENCE),
            "tracks": tracks_created,
            "samples": samples_loaded[:20],  # first 20 as a preview
            "project_bpm": bpm,
            "project_key": key,
            "style": style
        })

    except Exception as e:
        logger.exception(f"[SPECTRAL] Error: {str(e)}")
        return _err(f"Error en produccion espectral: {str(e)}")
 # ------------------------------------------------------------------
 # MAIN
 # ------------------------------------------------------------------