Source code for lrs.monitoring.dashboard

"""
Real-time Streamlit dashboard for LRS agents.

Provides visualization of:
- Precision trajectories (3-level hierarchy)
- G-space map (epistemic vs pragmatic)
- Prediction error stream
- Adaptation timeline
- Tool usage statistics
"""

import streamlit as st
import matplotlib.pyplot as plt
import pandas as pd
from typing import Optional
from datetime import datetime

from lrs.monitoring.tracker import LRSStateTracker



[docs]
def create_dashboard(tracker: LRSStateTracker):
    """
    Create Streamlit dashboard for LRS agent monitoring.
    
    Args:
        tracker: LRSStateTracker instance with execution history
    
    Examples:
        >>> import streamlit as st
        >>> from lrs.monitoring import create_dashboard
        >>> 
        >>> tracker = LRSStateTracker()
        >>> # ... run agent with tracker ...
        >>> 
        >>> create_dashboard(tracker)
    """
    st.set_page_config(
        page_title="LRS Agent Monitor",
        page_icon="🧠",
        layout="wide"
    )
    
    st.title("🧠 LRS Agent Monitoring Dashboard")
    st.markdown("Real-time Active Inference agent observability")
    
    # Sidebar with summary stats
    _render_sidebar(tracker)
    
    # Main content
    col1, col2 = st.columns(2)
    
    with col1:
        _render_precision_trajectories(tracker)
        _render_prediction_error_stream(tracker)
    
    with col2:
        _render_g_space_map(tracker)
        _render_tool_usage(tracker)
    
    # Full-width sections
    _render_adaptation_timeline(tracker)
    _render_detailed_history(tracker)



def _render_sidebar(tracker: LRSStateTracker):
    """Render sidebar with summary statistics"""
    st.sidebar.header("📊 Summary Statistics")
    
    summary = tracker.get_summary()
    
    st.sidebar.metric("Total Steps", summary['total_steps'])
    st.sidebar.metric("Adaptations", summary['total_adaptations'])
    st.sidebar.metric("Avg Precision", f"{summary['avg_precision']:.3f}")
    
    if summary['final_precision']:
        st.sidebar.subheader("Current Precision")
        for level, value in summary['final_precision'].items():
            st.sidebar.metric(
                level.capitalize(),
                f"{value:.3f}",
                delta=None
            )
    
    # Export button
    if st.sidebar.button("Export History"):
        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        filepath = f"lrs_history_{timestamp}.json"
        tracker.export_history(filepath)
        st.sidebar.success(f"Exported to {filepath}")


def _render_precision_trajectories(tracker: LRSStateTracker):
    """Render precision trajectory chart"""
    st.subheader("📈 Precision Trajectories")
    
    trajectories = tracker.get_all_precision_trajectories()
    
    if not trajectories or not trajectories['execution']:
        st.info("No data yet. Run agent to see precision trajectories.")
        return
    
    fig, ax = plt.subplots(figsize=(10, 6))
    
    steps = range(len(trajectories['execution']))
    
    ax.plot(steps, trajectories['abstract'], 
            label='Abstract', linewidth=2, alpha=0.8, color='blue')
    ax.plot(steps, trajectories['planning'], 
            label='Planning', linewidth=2, alpha=0.8, color='orange')
    ax.plot(steps, trajectories['execution'], 
            label='Execution', linewidth=2, alpha=0.8, color='green')
    
    # Threshold lines
    ax.axhline(y=0.7, color='green', linestyle='--', alpha=0.3, label='High confidence')
    ax.axhline(y=0.4, color='orange', linestyle='--', alpha=0.3, label='Adaptation threshold')
    
    ax.set_xlabel('Step')
    ax.set_ylabel('Precision (γ)')
    ax.set_title('Hierarchical Precision Over Time')
    ax.legend(loc='best')
    ax.grid(alpha=0.3)
    ax.set_ylim([0, 1])
    
    st.pyplot(fig)
    plt.close()
    
    # Current values
    current = tracker.get_current_state()
    if current:
        cols = st.columns(3)
        for i, (level, value) in enumerate(current.precision.items()):
            with cols[i]:
                st.metric(
                    level.capitalize(),
                    f"{value:.3f}",
                    delta=None
                )


def _render_g_space_map(tracker: LRSStateTracker):
    """Render G-space visualization"""
    st.subheader("🎯 G-Space Map")
    
    # This requires G values from candidate policies
    # For now, show a placeholder
    st.info("G-space map shows epistemic vs pragmatic values for candidate policies.")
    st.markdown("""
    **Coming soon**: Scatter plot of:
    - X-axis: Epistemic value (information gain)
    - Y-axis: Pragmatic value (expected reward)
    - Points: Candidate policies
    - Highlight: Selected policy
    """)


def _render_prediction_error_stream(tracker: LRSStateTracker):
    """Render prediction error timeline"""
    st.subheader("⚠️ Prediction Error Stream")
    
    errors = tracker.get_prediction_errors()
    
    if not errors:
        st.info("No prediction errors recorded yet.")
        return
    
    fig, ax = plt.subplots(figsize=(10, 4))
    
    ax.bar(range(len(errors)), errors, color='red', alpha=0.6)
    ax.axhline(y=0.7, color='orange', linestyle='--', alpha=0.5, label='High surprise')
    ax.set_xlabel('Execution Step')
    ax.set_ylabel('Prediction Error (ε)')
    ax.set_title('Surprise Events Over Time')
    ax.legend()
    ax.grid(alpha=0.3)
    ax.set_ylim([0, 1])
    
    st.pyplot(fig)
    plt.close()
    
    # Statistics
    avg_error = sum(errors) / len(errors)
    high_errors = [e for e in errors if e > 0.7]
    
    col1, col2, col3 = st.columns(3)
    col1.metric("Avg Error", f"{avg_error:.3f}")
    col2.metric("High Surprise Events", len(high_errors))
    col3.metric("Max Error", f"{max(errors):.3f}")


def _render_tool_usage(tracker: LRSStateTracker):
    """Render tool usage statistics"""
    st.subheader("🔧 Tool Usage Statistics")
    
    stats = tracker.get_tool_usage_stats()
    
    if not stats:
        st.info("No tool executions yet.")
        return
    
    # Create dataframe
    df = pd.DataFrame([
        {
            'Tool': tool_name,
            'Calls': data['calls'],
            'Success Rate': data['success_rate'],
            'Avg Error': data['avg_error']
        }
        for tool_name, data in stats.items()
    ])
    
    # Display table
    st.dataframe(
        df.style.format({
            'Success Rate': '{:.1%}',
            'Avg Error': '{:.3f}'
        }),
        use_container_width=True
    )
    
    # Visualization
    fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(10, 4))
    
    # Success rates
    ax1.barh(df['Tool'], df['Success Rate'], color='green', alpha=0.7)
    ax1.set_xlabel('Success Rate')
    ax1.set_title('Tool Reliability')
    ax1.set_xlim([0, 1])
    
    # Call counts
    ax2.barh(df['Tool'], df['Calls'], color='blue', alpha=0.7)
    ax2.set_xlabel('Number of Calls')
    ax2.set_title('Tool Usage Frequency')
    
    plt.tight_layout()
    st.pyplot(fig)
    plt.close()


def _render_adaptation_timeline(tracker: LRSStateTracker):
    """Render adaptation events timeline"""
    st.subheader("🔄 Adaptation Timeline")
    
    events = tracker.get_adaptation_events()
    
    if not events:
        st.info("No adaptations occurred yet.")
        return
    
    for i, event in enumerate(events, 1):
        with st.expander(f"Adaptation #{i} - {event.get('timestamp', 'Unknown time')}"):
            col1, col2 = st.columns(2)
            
            with col1:
                st.markdown("**Trigger**")
                st.write(f"Tool: `{event.get('trigger_tool', 'Unknown')}`")
                st.write(f"Error: {event.get('trigger_error', 0.0):.3f}")
            
            with col2:
                st.markdown("**Precision Change**")
                before = event.get('precision_before', {})
                after = event.get('precision_after', {})
                
                for level in ['execution', 'planning', 'abstract']:
                    b = before.get(level, 0.5)
                    a = after.get(level, 0.5)
                    delta = a - b
                    st.write(f"{level}: {b:.3f} → {a:.3f} ({delta:+.3f})")


def _render_detailed_history(tracker: LRSStateTracker):
    """Render detailed execution history"""
    st.subheader("📜 Execution History")
    
    if not tracker.history:
        st.info("No execution history yet.")
        return
    
    # Create detailed log
    history_data = []
    
    for snapshot in tracker.history:
        for entry in snapshot.tool_history:
            history_data.append({
                'Timestamp': snapshot.timestamp.strftime("%H:%M:%S"),
                'Tool': entry.get('tool', 'Unknown'),
                'Success': '✓' if entry.get('success') else '✗',
                'Error': f"{entry.get('prediction_error', 0.0):.3f}",
                'Precision': f"{snapshot.precision.get('execution', 0.5):.3f}"
            })
    
    if history_data:
        df = pd.DataFrame(history_data)
        st.dataframe(df, use_container_width=True)



[docs]
def run_dashboard(tracker: Optional[LRSStateTracker] = None):
    """
    Run dashboard as standalone Streamlit app.
    
    Args:
        tracker: Optional pre-populated tracker
    
    Examples:
        >>> # In terminal:
        >>> # streamlit run lrs/monitoring/dashboard.py
        >>> 
        >>> # Or programmatically:
        >>> from lrs.monitoring import run_dashboard
        >>> run_dashboard()
    """
    if tracker is None:
        # Create demo tracker with sample data
        tracker = _create_demo_tracker()
    
    create_dashboard(tracker)



def _create_demo_tracker() -> LRSStateTracker:
    """Create demo tracker with sample data for testing"""
    tracker = LRSStateTracker()
    
    # Simulate some execution history
    import random
    
    for i in range(20):
        # Simulate precision changing
        precision = {
            'execution': max(0.2, min(0.9, 0.5 + random.gauss(0, 0.1))),
            'planning': max(0.3, min(0.8, 0.5 + random.gauss(0, 0.08))),
            'abstract': max(0.4, min(0.7, 0.5 + random.gauss(0, 0.05)))
        }
        
        # Simulate tool execution
        tool_name = random.choice(['api_fetch', 'cache_fetch', 'parse_json'])
        success = random.random() > 0.3
        pred_error = random.random() * (0.3 if success else 1.0)
        
        state = {
            'precision': precision,
            'tool_history': [{
                'tool': tool_name,
                'success': success,
                'prediction_error': pred_error
            }],
            'adaptation_count': i // 5,  # Adapt every 5 steps
            'belief_state': {}
        }
        
        tracker.track_state(state)
    
    return tracker


# Allow running as standalone app
if __name__ == "__main__":
    run_dashboard()