ria-toolkit-oss/src/ria_toolkit_oss/viz/pytorch_state_dict.py

import torch
import plotly.graph_objects as go
from plotly.graph_objects import Figure
import numpy as np

def model_summary_plot(state_dict: dict) -> Figure:
    """Generate a summary plot of the PyTorch model state dict."""
    if not state_dict:
        # Handle empty state dict
        fig = go.Figure()
        fig.add_annotation(
            text="No parameters found in state dict",
            xref="paper", yref="paper",
            x=0.5, y=0.5, showarrow=False,
            font=dict(size=16)
        )
        fig.update_layout(
            title="Model Layer Parameter Counts",
            xaxis_title="Layer",
            yaxis_title="Number of Parameters",
            template="plotly_dark"
        )
        return fig

    # Count parameters by layer type
    layer_info = []
    for key, tensor in state_dict.items():
        if 'weight' in key:
            try:
                layer_name = key.replace('.weight', '')
                param_count = tensor.numel() if hasattr(tensor, 'numel') else len(tensor.flatten()) if hasattr(tensor, 'flatten') else 0
                shape = list(tensor.shape) if hasattr(tensor, 'shape') else [len(tensor)] if hasattr(tensor, '__len__') else []
                layer_info.append({
                    'layer': layer_name,
                    'parameters': param_count,
                    'shape': shape
                })
            except Exception as e:
                print(f"Warning: Could not process layer {key}: {e}")
                continue

    if not layer_info:
        # Handle case where no weight layers found
        fig = go.Figure()
        fig.add_annotation(
            text="No weight layers found in state dict",
            xref="paper", yref="paper",
            x=0.5, y=0.5, showarrow=False,
            font=dict(size=16)
        )
        fig.update_layout(
            title="Model Layer Parameter Counts",
            xaxis_title="Layer",
            yaxis_title="Number of Parameters",
            template="plotly_dark"
        )
        return fig

    # Create bar chart of parameter counts
    fig = go.Figure(data=[
        go.Bar(
            x=[info['layer'] for info in layer_info],
            y=[info['parameters'] for info in layer_info],
            text=[f"Shape: {info['shape']}" for info in layer_info],
            textposition='auto',
        )
    ])

    fig.update_layout(
        title="Model Layer Parameter Counts",
        xaxis_title="Layer",
        yaxis_title="Number of Parameters",
        template="plotly_dark"
    )

    return fig

def layer_weights_plot(state_dict: dict, layer_name: str = None) -> Figure:
    """Visualize weights for a specific layer."""
    if not state_dict:
        fig = go.Figure()
        fig.add_annotation(
            text="No data in state dict",
            xref="paper", yref="paper",
            x=0.5, y=0.5, showarrow=False,
            font=dict(size=16)
        )
        fig.update_layout(
            title="Layer Weights",
            template="plotly_dark"
        )
        return fig

    if layer_name is None:
        # Get first weight tensor
        weight_keys = [k for k in state_dict.keys() if 'weight' in k]
        if not weight_keys:
            fig = go.Figure()
            fig.add_annotation(
                text="No weight tensors found in state dict",
                xref="paper", yref="paper",
                x=0.5, y=0.5, showarrow=False,
                font=dict(size=16)
            )
            fig.update_layout(
                title="Layer Weights",
                template="plotly_dark"
            )
            return fig
        layer_name = weight_keys[0]

    try:
        weights = state_dict[layer_name]

        # Convert to numpy if it's a torch tensor
        if hasattr(weights, 'numpy'):
            weights_np = weights.detach().numpy() if hasattr(weights, 'detach') else weights.numpy()
        elif hasattr(weights, 'cpu'):
            weights_np = weights.cpu().detach().numpy()
        else:
            weights_np = np.array(weights)

        # For 2D weights, create heatmap
        if len(weights_np.shape) == 2:
            fig = go.Figure(data=go.Heatmap(
                z=weights_np,
                colorscale='RdBu',
                zmid=0
            ))
            fig.update_layout(
                title=f"Weights Heatmap: {layer_name}",
                template="plotly_dark"
            )
        else:
            # For other shapes, flatten and show histogram
            flat_weights = weights_np.flatten()
            fig = go.Figure(data=[go.Histogram(x=flat_weights, nbinsx=50)])
            fig.update_layout(
                title=f"Weight Distribution: {layer_name}",
                template="plotly_dark"
            )

        return fig

    except Exception as e:
        fig = go.Figure()
        fig.add_annotation(
            text=f"Error processing layer {layer_name}: {str(e)}",
            xref="paper", yref="paper",
            x=0.5, y=0.5, showarrow=False,
            font=dict(size=14)
        )
        fig.update_layout(
            title="Layer Weights - Error",
            template="plotly_dark"
        )
        return fig

def weight_distribution_plot(state_dict: dict) -> Figure:
    """Show distribution of weights across all layers."""
    if not state_dict:
        fig = go.Figure()
        fig.add_annotation(
            text="No data in state dict",
            xref="paper", yref="paper",
            x=0.5, y=0.5, showarrow=False,
            font=dict(size=16)
        )
        fig.update_layout(
            title="Overall Weight Distribution",
            xaxis_title="Weight Value",
            yaxis_title="Frequency",
            template="plotly_dark"
        )
        return fig

    all_weights = []
    layer_names = []

    for key, tensor in state_dict.items():
        if 'weight' in key:
            try:
                # Convert to numpy if it's a torch tensor
                if hasattr(tensor, 'numpy'):
                    weights_np = tensor.detach().numpy() if hasattr(tensor, 'detach') else tensor.numpy()
                elif hasattr(tensor, 'cpu'):
                    weights_np = tensor.cpu().detach().numpy()
                else:
                    weights_np = np.array(tensor)

                flat_weights = weights_np.flatten()
                all_weights.extend(flat_weights)
                layer_names.extend([key] * len(flat_weights))
            except Exception as e:
                print(f"Warning: Could not process weights for layer {key}: {e}")
                continue

    if not all_weights:
        fig = go.Figure()
        fig.add_annotation(
            text="No weight data found in state dict",
            xref="paper", yref="paper",
            x=0.5, y=0.5, showarrow=False,
            font=dict(size=16)
        )
        fig.update_layout(
            title="Overall Weight Distribution",
            xaxis_title="Weight Value",
            yaxis_title="Frequency",
            template="plotly_dark"
        )
        return fig

    fig = go.Figure(data=[
        go.Histogram(
            x=all_weights,
            nbinsx=100,
            name="All Weights"
        )
    ])

    fig.update_layout(
        title="Overall Weight Distribution",
        xaxis_title="Weight Value",
        yaxis_title="Frequency",
        template="plotly_dark"
    )

    return fig