Jgray21 committed (verified)
Commit 7e1830a · Parent(s): c01107e

Update src/streamlit_app.py

Files changed (1): src/streamlit_app.py +337 -446

src/streamlit_app.py CHANGED
@@ -7,30 +7,20 @@ from typing import Dict, List, Tuple, Optional
 
  import numpy as np
  import pandas as pd
-
  import torch
  from torch import nn
-
  import networkx as nx
  import streamlit as st
 
- # Transformers: Qwen tokenizer can be AutoTokenizer if Qwen2Tokenizer not present
  from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
-
- # Dimensionality reduction
  import umap
- from umap import UMAP
-
- # Neighbors & clustering
  from sklearn.neighbors import NearestNeighbors, KernelDensity
  from sklearn.cluster import KMeans, DBSCAN
- from sklearn.decomposition import PCA
  from sklearn.metrics import pairwise_distances
-
- # Plotly for interactive 3D
  import plotly.graph_objects as go
 
- import hashlib
 
  # Optional libs (use if present)
  try:
@@ -52,27 +42,20 @@ try:
  except Exception:
      HAS_PYVISTA = False
 
- from scipy.linalg import orthogonal_procrustes  # For optional per-layer orientation alignment
-
- # ====== 1. Configuration =========================================================================
  @dataclass
  class Config:
      # Model
      model_name: str = "Qwen/Qwen1.5-1.8B"
-     ### device: str = "cuda" if torch.cuda.is_available() else "cpu"
-     ### dtype: torch.dtype = torch.float16 if torch.cuda.is_available() else torch.float32
-
-     # Tokenization / generation
-     max_length: int = 64  # truncate inputs for speed/memory
 
      # Data
-     corpus: List[str] = None  # set below
-     # If None, uses DEFAULT_CORPUS defined below
 
-     # Graph building
-     graph_mode: str = "threshold"  # {"knn", "threshold"}
-     knn_k: int = 8  # neighbors per token (used if graph_mode="knn")
-     sim_threshold: float = 0.60  # used if graph_mode="threshold"
      use_cosine: bool = True
 
      # Anchors / LoT-style features (global)
@@ -84,104 +67,147 @@ class Config:
      n_clusters_kmeans: int = 6  # fallback for kmeans
      hdbscan_min_cluster_size: int = 4
 
-     # DR / embeddings
      umap_n_neighbors: int = 30
      umap_min_dist: float = 0.05
-     umap_metric: str = "cosine"  # hidden states are directional → cosine works well
-     use_global_3d_umap: bool = False  # if True, compute a single 3D manifold for all states
-
-     # Pooling for UMAP fit
      fit_pool_per_layer: int = 512  # number of states sampled per layer to fit UMAP
 
-     # Volume grid (MRI view)
-     grid_res: int = 128  # voxel resolution in x/y; z = num_layers
-     kde_bandwidth: float = 0.15  # KDE bandwidth in manifold space (if using KDE)
-     use_hist2d: bool = True  # if True, use histogram2d instead of KDE for speed
 
      # Output
      out_dir: str = "qwen_mri3d_outputs"
      plotly_html: str = "qwen_layers_3d.html"
-     volume_npz: str = "qwen_density_volume.npz"  # saved if PyVista isn't available
-     volume_screenshot: str = "qwen_volume.png"  # if PyVista is available
-
-     def validate(self):
-         if self.graph_mode not in {"knn", "threshold"}:
-             raise ValueError("graph_mode must be 'knn' or 'threshold'")
-         if self.knn_k < 2:
-             raise ValueError("knn_k must be >= 2")
-         if self.anchor_k < 2:
-             raise ValueError("anchor_k must be >= 2")
-         if self.anchor_temp <= 0:
-             raise ValueError("anchor_temp must be > 0")
-
-
 
  # Default corpus (small and diverse; adjust freely)
  DEFAULT_CORPUS = [
-     "The cat sat on the mat and watched.",
-     "Machine learning models process data using neural networks.",
-     "Climate change affects ecosystems around the world.",
-     "Quantum computers use superposition for parallel computation.",
-     "The universe contains billions of galaxies.",
-     "Artificial intelligence transforms how we work.",
-     "DNA stores genetic information in cells.",
-     "Ocean currents regulate Earth's climate system.",
-     "Photosynthesis converts sunlight into chemical energy.",
-     "Blockchain technology enables decentralized systems."
  ]
 
- # ====== 2. Utilities =============================================================================
  def seed_everything(seed: int = 42):
-     """Determinism for reproducibility in layouts/UMAP/kmeans."""
      np.random.seed(seed)
      torch.manual_seed(seed)
 
-
  def cosine_similarity_matrix(X: np.ndarray) -> np.ndarray:
-     """Compute pairwise cosine similarity for rows of X."""
-     # X: (N, D)
      norms = np.linalg.norm(X, axis=1, keepdims=True) + 1e-8
      Xn = X / norms
      return Xn @ Xn.T
 
- def build_knn_graph(coords: np.ndarray, k: int, metric: str = "cosine") -> nx.Graph:
      """
-     Build an undirected kNN graph for the points in coords.
-     coords: (N, D)
      """
-     nbrs = NearestNeighbors(n_neighbors=min(k+1, len(coords)), metric=metric)  # +1 to include self
      nbrs.fit(coords)
      distances, indices = nbrs.kneighbors(coords)
-
      G = nx.Graph()
      G.add_nodes_from(range(len(coords)))
-     # Connect i to its top-k neighbors (skip index 0 which is itself)
      for i in range(len(coords)):
-         for j in indices[i, 1:]:  # skip self
          G.add_edge(int(i), int(j))
      return G
 
-
- def build_threshold_graph(H: np.ndarray, threshold: float, use_cosine: bool = True) -> nx.Graph:
-     """
-     Build graph by thresholding pairwise similarities in the original hidden-state space.
-     H: (N, D) hidden states for a single layer
-     """
      if use_cosine:
          S = cosine_similarity_matrix(H)
      else:
-         S = H @ H.T  # dot product
 
      N = S.shape[0]
      G = nx.Graph()
      G.add_nodes_from(range(N))
-     for i in range(N):
-         for j in range(i + 1, N):
-             if S[i, j] > threshold:
-                 G.add_edge(i, j, weight=float(S[i, j]))
-     return G
 
  def percolation_stats(G: nx.Graph) -> Dict[str, float]:
      """
@@ -210,94 +236,47 @@ def percolation_stats(G: nx.Graph) -> Dict[str, float]:
                  largest_component_size=largest,
                  component_sizes=sorted(sizes, reverse=True))
 
 
  def leiden_communities(G: nx.Graph) -> np.ndarray:
-     """
-     Community detection using Leiden (igraph), if available.
-     Returns an array of cluster ids for nodes 0..N-1.
-     """
-     if not HAS_IGRAPH_LEIDEN:
-         raise RuntimeError("igraph+leidenalg not available")
-
-     # Convert nx → igraph
      mapping = {n: i for i, n in enumerate(G.nodes())}
      edges = [(mapping[u], mapping[v]) for u, v in G.edges()]
      ig_g = ig.Graph(n=len(mapping), edges=edges, directed=False)
-     part = la.find_partition(ig_g, la.RBConfigurationVertexPartition)  # robust default
      labels = np.zeros(len(mapping), dtype=int)
      for cid, comm in enumerate(part):
-         for node in comm:
-             labels[node] = cid
      return labels
 
 
- def cluster_layer(features: np.ndarray,
-                   G: Optional[nx.Graph],
-                   method: str,
-                   n_clusters_kmeans: int = 6,
-                   hdbscan_min_cluster_size: int = 4) -> np.ndarray:
-     """
-     Cluster layer states to get cluster labels.
-     - If Leiden: requires G (graph) and igraph/leidenalg
-     - If HDBSCAN: density-based clustering in feature space
-     - If DBSCAN: fallback density-based (scikit-learn)
-     - If KMeans: fallback centroid clustering
-     """
-     method = method.lower()
-     N = len(features)
-
-     if method == "auto":
-         # Prefer Leiden (graph) → HDBSCAN → KMeans
-         if HAS_IGRAPH_LEIDEN and G is not None and G.number_of_edges() > 0:
-             return leiden_communities(G)
-         elif HAS_HDBSCAN and N >= 5:
-             clusterer = hdbscan.HDBSCAN(min_cluster_size=hdbscan_min_cluster_size,
-                                         metric='euclidean')
-             labels = clusterer.fit_predict(features)
-             # HDBSCAN: -1 = noise. Keep as its own "noise" cluster id or remap
-             return labels
-         else:
-             km = KMeans(n_clusters=min(n_clusters_kmeans, max(2, N // 3)),
-                         n_init="auto", random_state=42)
-             return km.fit_predict(features)
-
-     if method == "leiden":
-         if G is None or not HAS_IGRAPH_LEIDEN:
-             raise RuntimeError("Leiden requires a graph and igraph+leidenalg.")
-         return leiden_communities(G)
-
-     if method == "hdbscan":
-         if not HAS_HDBSCAN:
-             raise RuntimeError("hdbscan not installed")
-         clusterer = hdbscan.HDBSCAN(min_cluster_size=hdbscan_min_cluster_size, metric='euclidean')
-         return clusterer.fit_predict(features)
-
-     if method == "dbscan":
-         db = DBSCAN(eps=0.5, min_samples=4, metric='euclidean')
-         return db.fit_predict(features)
-
-     if method == "kmeans":
-         km = KMeans(n_clusters=min(n_clusters_kmeans, max(2, N // 3)),
-                     n_init="auto", random_state=42)
-         return km.fit_predict(features)
-
-     raise ValueError(f"Unknown cluster method: {method}")
-
-
- def orthogonal_align(A_ref: np.ndarray, B: np.ndarray) -> np.ndarray:
-     """
-     Align B to A_ref by an orthogonal rotation (Procrustes),
-     preserving geometry but removing arbitrary orientation flips.
-     """
-     R, _ = orthogonal_procrustes(B - B.mean(0), A_ref - A_ref.mean(0))
-     return (B - B.mean(0)) @ R + A_ref.mean(0)
-
 
- def entropy_from_probs(p: np.ndarray, eps: float = 1e-12) -> np.ndarray:
-     """Shannon entropy for each row; p is (N, K) with rows summing ~1."""
-     return -np.sum(p * np.log(p + eps), axis=1)
 
- # ====== 3. Model I/O (hidden states) =============================================================
  @dataclass
  class HiddenStatesBundle:
      """
@@ -336,7 +315,8 @@ def extract_hidden_states(model, tokenizer, text: str, max_length: int, device:
      tokens = tokenizer.convert_ids_to_tokens(inputs["input_ids"][0])
      return HiddenStatesBundle(hidden_layers=hs, tokens=tokens)
 
- # ====== 4. LoT-style anchors & features ==========================================================
  def fit_global_anchors(all_states_sampled: np.ndarray, K: int, random_state: int = 42) -> np.ndarray:
      """
      Fit KMeans cluster centroids on a pooled set of states (from many layers/texts).
@@ -348,7 +328,6 @@ def fit_global_anchors(all_states_sampled: np.ndarray, K: int, random_state: int
      kmeans.fit(all_states_sampled)
      return kmeans.cluster_centers_  # (K, D)
 
-
  def anchor_features(H: np.ndarray, anchors: np.ndarray, temperature: float = 1.0) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
      """
      For states H (N,D) and anchors A (K,D):
@@ -367,10 +346,12 @@ def anchor_features(H: np.ndarray, anchors: np.ndarray, temperature: float = 1.0
      P = np.exp(logits)
      P /= P.sum(axis=1, keepdims=True) + 1e-12
      # Uncertainty (entropy)
-     H_unc = entropy_from_probs(P)
      return dists, P, H_unc
 
- # ====== 5. Dimensionality reduction / embeddings ================================================
  def fit_umap_2d(pool: np.ndarray,
                  n_neighbors: int = 30,
                  min_dist: float = 0.05,
@@ -386,63 +367,6 @@ def fit_umap_2d(pool: np.ndarray,
      reducer.fit(pool)
      return reducer
 
- def _corpus_fingerprint(texts, max_items=5, max_chars=4000) -> str:
-     """Stable key so cache invalidates if DEFAULT_CORPUS changes."""
-     joined = "\n".join(texts[:max_items])
-     joined = joined[:max_chars]
-     return hashlib.sha256(joined.encode("utf-8")).hexdigest()
-
- @st.cache_data(show_spinner=False)
- def get_pool_artifacts(
-     model_name: str,
-     max_length: int,
-     anchor_k: int,
-     anchor_temp: float,  # not strictly needed for fitting anchors, but included if you want cache keys aligned
-     umap_n_neighbors: int,
-     umap_min_dist: float,
-     umap_metric: str,
-     fit_pool_per_layer: int,
-     corpus_hash: str,
- ):
-     """
-     Cached: build pooled hidden states on DEFAULT_CORPUS, fit anchors and a UMAP reducer once.
-     Returns:
-         anchors: (K, D) np.ndarray
-         reducer2d: fitted UMAP reducer object (must be pickleable; umap-learn's UMAP is)
-     """
-     # Use cached model loader (resource cache)
-     model, tok, device, dtype = get_model_and_tok(model_name)
-
-     texts = DEFAULT_CORPUS  # pooled set for stability
-
-     pool_states = []
-     for t in texts[: min(5, len(texts))]:
-         b = extract_hidden_states(model, tok, t, max_length, device)
-         for H in b.hidden_layers:
-             T = len(H)
-             take = min(fit_pool_per_layer, T)
-             if take <= 0:
-                 continue
-             idx = np.random.choice(T, size=take, replace=False)
-             pool_states.append(H[idx])
-
-     if not pool_states:
-         # fallback: this should rarely happen
-         raise RuntimeError("Pool construction produced no states.")
-
-     pool_states = np.vstack(pool_states)
-
-     anchors = fit_global_anchors(pool_states, anchor_k)
-
-     reducer2d = fit_umap_2d(
-         pool_states,
-         n_neighbors=umap_n_neighbors,
-         min_dist=umap_min_dist,
-         metric=umap_metric,
-     )
-
-     return anchors, reducer2d
-
 
  def fit_umap_3d(all_states: np.ndarray,
                  n_neighbors: int = 30,
@@ -457,296 +381,244 @@ def fit_umap_3d(all_states: np.ndarray,
                  metric=metric, random_state=random_state)
      return reducer.fit_transform(all_states)
 
- # ====== 6. Volume construction (MRI) ============================================================
- def stack_density_volume(xy_by_layer: List[np.ndarray],
-                          grid_res: int,
-                          use_hist2d: bool = True,
-                          kde_bandwidth: float = 0.15) -> np.ndarray:
-     """
-     Construct a 3D volume by estimating 2D density on the (x,y) manifold per layer (slice).
-     - If use_hist2d: fast uniform binning into grid_res x grid_res
-     - Else: KDE (slower but smoother)
-     Returns volume of shape (grid_res, grid_res, L) where L = #layers.
-     """
-     L = len(xy_by_layer)
-     vol = np.zeros((grid_res, grid_res, L), dtype=np.float32)
-
-     # Determine global bounds across layers to keep axes consistent
-     all_xy = np.vstack([xy for xy in xy_by_layer if len(xy) > 0]) if L > 0 else np.zeros((0, 2))
-     if len(all_xy) == 0:
-         return vol
-     x_min, y_min = all_xy.min(axis=0)
-     x_max, y_max = all_xy.max(axis=0)
-     # Slight padding
-     pad = 1e-6
-     x_edges = np.linspace(x_min - pad, x_max + pad, grid_res + 1)
-     y_edges = np.linspace(y_min - pad, y_max + pad, grid_res + 1)
-
-     for l, XY in enumerate(xy_by_layer):
-         if len(XY) == 0:
-             continue
-
-         if use_hist2d:
-             H, _, _ = np.histogram2d(XY[:, 0], XY[:, 1], bins=[x_edges, y_edges], density=False)
-             vol[:, :, l] = H.T  # histogram2d returns [x_bins, y_bins] → transpose to align
-         else:
-             kde = KernelDensity(bandwidth=kde_bandwidth, kernel="gaussian")
-             kde.fit(XY)
-             # Evaluate KDE on grid centers
-             xs = 0.5 * (x_edges[:-1] + x_edges[1:])
-             ys = 0.5 * (y_edges[:-1] + y_edges[1:])
-             xx, yy = np.meshgrid(xs, ys, indexing='xy')
-             grid_points = np.column_stack([xx.ravel(), yy.ravel()])
-             log_dens = kde.score_samples(grid_points)
-             dens = np.exp(log_dens).reshape(grid_res, grid_res)
-             vol[:, :, l] = dens
-
-     # Normalize volume to [0,1] for rendering convenience
-     if vol.max() > 0:
-         vol = vol / vol.max()
-     return vol
-
-
- def render_volume_with_pyvista(volume: np.ndarray,
-                                out_png: str,
-                                opacity="sigmoid") -> None:
-     """
-     Visualize the 3D volume using PyVista/VTK (if installed); save a screenshot.
-     """
-     if not HAS_PYVISTA:
-         raise RuntimeError("PyVista is not installed; cannot render volume.")
-     pl = pv.Plotter()
-     # Wrap NumPy array as a VTK image data; PyVista expects z as the 3rd axis
-     vol_vtk = pv.wrap(volume)
-     pl.add_volume(vol_vtk, opacity=opacity, shade=True)
-     pl.show(screenshot=out_png)  # headless environments will still save a screenshot (if offscreen support)
-
- # ====== 7. 3D Plotly visualization ==============================================================
  def plotly_3d_layers(xy_layers: List[np.ndarray],
                       layer_tokens: List[List[str]],
                       layer_cluster_labels: List[np.ndarray],
                       layer_uncertainty: List[np.ndarray],
                       layer_graphs: List[nx.Graph],
-                      connect_token_trajectories: bool = True,
-                      title: str = "Qwen: 3D Cluster Formation (UMAP2D + Layer as Z)") -> go.Figure:
-     """
-     Build an interactive 3D Plotly figure:
-     - Nodes per layer at (x, y, z=layer)
-     - Edge segments (kNN or threshold graph) per layer
-     - Trajectory lines: connect same token index across consecutive layers (optional)
-     - Color nodes by cluster label; hover shows token & uncertainty
-     """
      fig_data = []
 
-     # Build a color per layer node trace
-     for l, (xy, tokens, labels, unc, G) in enumerate(zip(xy_layers, layer_tokens, layer_cluster_labels, layer_uncertainty, layer_graphs)):
-         if len(xy) == 0:
-             continue
          x, y = xy[:, 0], xy[:, 1]
          z = np.full_like(x, l, dtype=float)
 
-         # --- Nodes
-         node_text = [f"layer={l} | idx={i}<br>token={tokens[i]}<br>cluster={int(labels[i])}<br>uncertainty={unc[i]:.3f}"
-                      for i in range(len(tokens))]
          node_trace = go.Scatter3d(
              x=x, y=y, z=z,
              mode='markers',
              name=f"Layer {l}",
              marker=dict(
-                 size=4,
-                 opacity=0.7,
-                 color=labels,  # cluster ID → color scale
-                 colorscale='Viridis',
-                 showscale=(l == 0)  # show scale once
              ),
              text=node_text,
              hovertemplate="%{text}<extra></extra>"
          )
          fig_data.append(node_trace)
 
-         # --- Intra-layer edges (kNN or threshold)
          if G is not None and G.number_of_edges() > 0:
              edge_x, edge_y, edge_z = [], [], []
              for u, v in G.edges():
                  edge_x += [x[u], x[v], None]
                  edge_y += [y[u], y[v], None]
                  edge_z += [z[u], z[v], None]
              edge_trace = go.Scatter3d(
                  x=edge_x, y=edge_y, z=edge_z,
                  mode='lines',
-                 line=dict(width=1),
-                 opacity=0.30,
-                 name=f"Edges L{l}"
              )
              fig_data.append(edge_trace)
 
-     # --- Trajectories: connect same token index across layers
-     if connect_token_trajectories:
-         # Only meaningful if tokenization length T is constant across layers (it is)
-         # We'll draw faint polylines for each position i across l=0..L-1
-         L = len(xy_layers)
-         if L > 1:
-             T = min(len(xy_layers[l]) for l in range(L))
-             for i in range(T):
-                 xs = [xy_layers[l][i, 0] for l in range(L)]
-                 ys = [xy_layers[l][i, 1] for l in range(L)]
-                 zs = list(range(L))
-                 traj = go.Scatter3d(
-                     x=xs, y=ys, z=zs,
-                     mode='lines',
-                     line=dict(width=1),
-                     opacity=0.15,
-                     name=f"traj_{i}",
-                     hoverinfo='skip'
                  )
-                 fig_data.append(traj)
 
      fig = go.Figure(data=fig_data)
      fig.update_layout(
-         title=title,
          scene=dict(
              xaxis_title="UMAP X",
             yaxis_title="UMAP Y",
-             zaxis_title="Layer (depth)"
          ),
          height=900,
-         showlegend=False
      )
      return fig
 
- # ====== 8. Orchestration ========================================================================
- def run_pipeline(cfg: Config, model, tok, device, main_text: str, save_artifacts: bool = False):
      seed_everything(42)
 
-     # 8.2 Collect hidden states for one representative text (detailed viz) + for pool
-     # You can extend to many texts; we keep a single text for clarity & speed.
-     texts = cfg.corpus or DEFAULT_CORPUS
-     #print(f"[Input] Example text: {main_text!r}")
 
-     # Hidden states for main text
      main_bundle = extract_hidden_states(model, tok, main_text, cfg.max_length, device)
-     layers_np: List[np.ndarray] = main_bundle.hidden_layers  # list of (T,D), length L_all = num_layers+1
-     tokens = main_bundle.tokens  # list of length T
-
-     # Cached pool artifacts (anchors + fitted UMAP reducer)
-     corpus_hash = _corpus_fingerprint(texts)  # texts is cfg.corpus or DEFAULT_CORPUS
-
-     anchors, reducer2d = get_pool_artifacts(
-         model_name=cfg.model_name,
-         max_length=cfg.max_length,
-         anchor_k=cfg.anchor_k,
-         anchor_temp=cfg.anchor_temp,
-         umap_n_neighbors=cfg.umap_n_neighbors,
-         umap_min_dist=cfg.umap_min_dist,
-         umap_metric=cfg.umap_metric,
-         fit_pool_per_layer=cfg.fit_pool_per_layer,
-         corpus_hash=corpus_hash,
-     )
-
      L_all = len(layers_np)
-     #print(f"[Hidden] Layers (incl. embedding): {L_all}, Tokens: {len(tokens)}")
 
-     """
-     # 8.3 Build a pool of states (across a few texts & layers) to fit anchors + UMAP
-     pool_states = []
-     # Sample across first few texts to improve diversity (lightweight)
-     for t in texts[: min(5, len(texts))]:
-         b = extract_hidden_states(model, tok, t, cfg.max_length, device)
-         # Take a subset from each layer to limit pool size
-         for H in b.hidden_layers:
-             T = len(H)
-             take = min(cfg.fit_pool_per_layer, T)
-             idx = np.random.choice(T, size=take, replace=False)
-             pool_states.append(H[idx])
-     pool_states = np.vstack(pool_states) if len(pool_states) else layers_np[-1]
-     #print(f"[Pool] Pooled states for anchors/UMAP: {pool_states.shape}")
-
-     # 8.4 Fit global anchors (LoT-style features)
-     anchors = fit_global_anchors(pool_states, cfg.anchor_k)
-     # Save anchors for reproducibility
-     """
-
-     # 8.5 Build per-layer features for main text (LoT-style distances & uncertainty)
-     layer_features = []       # list of (T,K)
-     layer_uncertainties = []  # list of (T,)
-     layer_top_anchor = []     # list of (T,) argmin-id
-
-     for l, H in enumerate(layers_np):
-         dists, P, H_unc = anchor_features(H, anchors, cfg.anchor_temp)
-         layer_features.append(dists)        # N x K distances (lower = closer)
-         layer_uncertainties.append(H_unc)   # N
-         layer_top_anchor.append(np.argmin(dists, axis=1))  # closest anchor id per token
 
-     # 8.6 Consistency metric (LoT Eq. (5)): does layer's top anchor match final layer's?
-     final_top = layer_top_anchor[-1]
-     layer_consistency = []
-     for l in range(L_all):
-         cons = (layer_top_anchor[l] == final_top).astype(np.int32)  # 1 if matches, 0 otherwise
-         layer_consistency.append(cons)
 
-     # 8.7 Build per-layer graphs (kNN by default) on FEATURE space for stability
      layer_graphs = []
      for l in range(L_all):
-         feats = layer_features[l]
          if cfg.graph_mode == "knn":
-             G = build_knn_graph(feats, cfg.knn_k, metric="euclidean")  # kNN in feature space
          else:
-             # Threshold graph in original hidden space (as in your notebook)
-             G = build_threshold_graph(layers_np[l], cfg.sim_threshold, use_cosine=cfg.use_cosine)
          layer_graphs.append(G)
 
-     # 8.8 Cluster per layer
-     layer_cluster_labels = []
-     for l in range(L_all):
-         feats = layer_features[l]
-         labels = cluster_layer(
-             feats,
-             layer_graphs[l],
-             method=cfg.cluster_method,
-             n_clusters_kmeans=cfg.n_clusters_kmeans,
-             hdbscan_min_cluster_size=cfg.hdbscan_min_cluster_size
-         )
          layer_cluster_labels.append(labels)
 
-     # 8.9 Percolation statistics (φ, #clusters, χ) per layer (as in your notebook)
-     percolation = []
-     for l in range(L_all):
-         stats = percolation_stats(layer_graphs[l])
-         percolation.append(stats)
 
-     # 8.10 Common 2D manifold via UMAP (fit-once on the pool), then transform each layer
-     """reducer2d = fit_umap_2d(pool_states,
-                                n_neighbors=cfg.umap_n_neighbors,
-                                min_dist=cfg.umap_min_dist,
-                                metric=cfg.umap_metric)"""
-     xy_by_layer = [reducer2d.transform(layers_np[l]) for l in range(L_all)]
 
-     # OPTIONAL: orthogonal alignment across layers (helps if UMAP.transform still drifts)
-     # for l in range(1, L_all):
-     #     xy_by_layer[l] = orthogonal_align(xy_by_layer[l-1], xy_by_layer[l])
 
-     # 8.11 Plotly 3D point+graph view: X,Y from UMAP; Z = layer index
      fig = plotly_3d_layers(
          xy_layers=xy_by_layer,
-         layer_tokens=[tokens for _ in range(L_all)],
          layer_cluster_labels=layer_cluster_labels,
          layer_uncertainty=layer_uncertainties,
          layer_graphs=layer_graphs,
-         connect_token_trajectories=True,
-         title="Qwen: 3D Cluster Formation (UMAP2D + Layer as Z, LoT metrics on hover)"
      )
 
      if save_artifacts:
-         os.makedirs(cfg.out_dir, exist_ok=True)
-         html_path = os.path.join(cfg.out_dir, cfg.plotly_html)
-         fig.write_html(html_path)
-         # Save percolation series
-         with open(os.path.join(cfg.out_dir, "percolation_stats.json"), "w") as f:
-             json.dump(percolation, f, indent=2)
-         np.save(os.path.join(cfg.out_dir, "anchors.npy"), anchors)
-         #print(f"[Percolation] Saved per-layer stats → percolation_stats.json")
-         #print(f"[Plotly] 3D HTML saved → {html_path}")
 
      return fig, {"percolation": percolation, "tokens": tokens}
@@ -754,16 +626,32 @@ def run_pipeline(cfg: Config, model, tok, device, main_text: str, save_artifacts
  def get_model_and_tok(model_name: str):
      device = "cuda" if torch.cuda.is_available() else "cpu"
      dtype = torch.float16 if device == "cuda" else torch.float32
-     model, tok = load_qwen(model_name, device, dtype)
      return model, tok, device, dtype
 
  def main():
-     st.set_page_config(page_title="Layer Explorer", layout="wide")
-     st.title("3D Token Embedding Explorer (Live Hidden States)")
 
      with st.sidebar:
          st.header("Model / Input")
-         model_name = st.selectbox("Model", ["Qwen/Qwen1.5-0.5B", "Qwen/Qwen1.5-1.8B", "Qwen/Qwen1.5-4B"], index=1)
          max_length = st.slider("Max tokens", 16, 256, 64, step=16)
 
          st.header("Graph")
@@ -787,13 +675,16 @@ def main():
          st.header("Outputs")
          save_artifacts = st.checkbox("Save artifacts to disk (HTML/CSV/NPZ)", value=False)
 
-     prompt_col, run_col = st.columns([4, 1])
      with prompt_col:
-         main_text = st.text_area(
-             "Text to visualize (hidden states computed on this text)",
-             value="Explain in one sentence what a transformer attention layer does.",
-             height=140
          )
      with run_col:
          st.write("")
          st.write("")

 
  import numpy as np
  import pandas as pd
  import torch
  from torch import nn
  import networkx as nx
  import streamlit as st
 
  from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
  import umap
  from sklearn.neighbors import NearestNeighbors, KernelDensity
  from sklearn.cluster import KMeans, DBSCAN
  from sklearn.metrics import pairwise_distances
+ from scipy.spatial import procrustes
+ from scipy.linalg import orthogonal_procrustes
  import plotly.graph_objects as go
 
 
  # Optional libs (use if present)
  try:
  ...
  except Exception:
      HAS_PYVISTA = False
 
+ # ====== Configuration =========================================================================
  @dataclass
  class Config:
      # Model
      model_name: str = "Qwen/Qwen1.5-1.8B"
+     max_length: int = 64
 
      # Data
+     corpus: List[str] = None
 
+     # Graph & Clustering
+     graph_mode: str = "threshold"
+     knn_k: int = 8
+     sim_threshold: float = 0.05  # fraction of edges kept: 0.05 = show the top 5% most-similar pairs
      use_cosine: bool = True
 
      # Anchors / LoT-style features (global)
  ...
      n_clusters_kmeans: int = 6  # fallback for kmeans
      hdbscan_min_cluster_size: int = 4
 
+     # UMAP & alignment
      umap_n_neighbors: int = 30
      umap_min_dist: float = 0.05
+     umap_metric: str = "cosine"
      fit_pool_per_layer: int = 512  # number of states sampled per layer to fit UMAP
+     align_layers: bool = True  # Procrustes-align each layer's 2D projection to the previous layer
 
+     # Visualization
+     color_by: str = "pos"  # "cluster" or "pos" (part of speech)
 
      # Output
      out_dir: str = "qwen_mri3d_outputs"
      plotly_html: str = "qwen_layers_3d.html"
 
  # Default corpus (small and diverse; adjust freely)
  DEFAULT_CORPUS = [
+     "Is a Universal Basic Income (UBI) a viable solution to poverty, or does it simply discourage people from working?",
+     "Explain the arguments for and against the independence of Taiwan from the perspective of both the US and China.",
+     "What are the ethical arguments surrounding the use of CRISPR technology to edit human embryos for non-medical enhancements?",
+     "Analyze the effectiveness of strict lockdowns versus herd immunity strategies during the COVID-19 pandemic.",
+     "Why is nuclear energy controversial despite being a low-carbon power source? Present both the safety concerns and the environmental benefits.",
+     "Does the existence of evil in the world disprove the existence of a benevolent God? Summarize the philosophical debate.",
+     "Summarize the main arguments used by gun rights advocates against stricter background checks in the United States.",
+     "Should autonomous weapons systems (killer robots) be banned internationally, even if they could reduce soldier casualties?",
+     "Was the dropping of the atomic bombs on Hiroshima and Nagasaki militarily necessary to end World War II?",
+     "What are the competing arguments regarding transgender women participating in biological women's sports categories?"
  ]
 
+ # Select from 4 different models
+ MODELS = ["Qwen/Qwen1.5-0.5B", "deepseek-ai/deepseek-coder-1.3b-instruct", "openai-community/gpt2", "prem-research/MiniGuard-v0.1"]
+
+
+ # ====== Utilities =========================================================================
  def seed_everything(seed: int = 42):
      np.random.seed(seed)
      torch.manual_seed(seed)
 
  def cosine_similarity_matrix(X: np.ndarray) -> np.ndarray:
      norms = np.linalg.norm(X, axis=1, keepdims=True) + 1e-8
      Xn = X / norms
      return Xn @ Xn.T
 
+ def orthogonal_align(A_ref: np.ndarray, B: np.ndarray) -> np.ndarray:
+     """
+     Align B to A_ref using Procrustes analysis (rotation/reflection only).
+     Preserves local geometry of B, but aligns global orientation to A.
+     """
+     # Center both
+     mu_a = A_ref.mean(0)
+     mu_b = B.mean(0)
+     A0 = A_ref - mu_a
+     B0 = B - mu_b
 
+     # Solve for the rotation R that minimizes ||A0 - B0 @ R||:
+     # M = B0.T @ A0; U, S, Vt = svd(M); R = U @ Vt
+     R, _ = orthogonal_procrustes(B0, A0)
+
+     # B_aligned = (B - mu_b) @ R + mu_a
+     # We essentially rotate B to match A's orientation, then shift to A's center
+     return B0 @ R + mu_a
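A quick way to sanity-check orthogonal_align (a minimal sketch, not part of the commit; the rotated point cloud is synthetic test data):

# Illustrative check: a rotated, shifted copy of a point cloud should map
# back onto the reference, since Procrustes solves for the best rotation.
import numpy as np
from scipy.stats import ortho_group

rng = np.random.default_rng(0)
A = rng.normal(size=(50, 2))            # reference layout
Q = ortho_group.rvs(2, random_state=0)  # random rotation/reflection
B = A @ Q + 3.0                         # rotated and shifted copy
print(np.allclose(orthogonal_align(A, B), A, atol=1e-8))  # expect True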
+
+ def get_pos_tags(text: str, tokenizer, tokens: List[str]) -> List[str]:
      """
+     Map LLM tokens to spaCy POS tags.
+     Heuristic: reconstruct the text, run spaCy, align based on char overlap.
      """
+     try:
+         import spacy  # local import: spaCy and its model are optional
+         nlp = spacy.load("en_core_web_sm")
+     except Exception:
+         # Fallback if spaCy or the model is not installed
+         return ["UNK"] * len(tokens)
+
+     doc = nlp(text)
+
+     # This is a simplified mapping. Real alignment is complex due to subwords.
+     # We approximate: find which word the subword belongs to.
+     pos_tags = []
+
+     # Re-building offsets for tokens would be the robust route:
+     # ideally, use tokenizer(..., return_offsets_mapping=True).
+     # Here we just iterate and approximate for the demo.
+
+     # Fast approximation: tag the token string itself
+     # (not perfect for subwords like "ing", but visually useful)
+     for t_str in tokens:
+         clean_t = t_str.replace("Ġ", "").replace("▁", "").strip()
+         if not clean_t:
+             pos_tags.append("SYM")  # likely special char
+             continue
+
+         # Tag the single token fragment
+         sub_doc = nlp(clean_t)
+         if len(sub_doc) > 0:
+             pos_tags.append(sub_doc[0].pos_)
+         else:
+             pos_tags.append("UNK")
+
+     return pos_tags
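The comments above point at the more robust route via offset mappings; a minimal sketch of that alternative (illustrative only, assuming a fast tokenizer and that en_core_web_sm is installed; get_pos_tags_by_offset is a hypothetical name, not part of the commit):

# Offset-based alignment: map each subword to the spaCy word covering its
# start offset, then reuse that word's POS tag.
def get_pos_tags_by_offset(text, tokenizer):
    import spacy
    nlp = spacy.load("en_core_web_sm")
    doc = nlp(text)
    enc = tokenizer(text, return_offsets_mapping=True, add_special_tokens=False)
    tags = []
    for start, end in enc["offset_mapping"]:
        tag = "UNK"
        for w in doc:
            if w.idx <= start < w.idx + len(w.text):
                tag = w.pos_
                break
        tags.append(tag)
    return tags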
+
+ def build_knn_graph(coords: np.ndarray, k: int, metric: str = "cosine") -> nx.Graph:
+     nbrs = NearestNeighbors(n_neighbors=min(k + 1, len(coords)), metric=metric)
      nbrs.fit(coords)
      distances, indices = nbrs.kneighbors(coords)
      G = nx.Graph()
      G.add_nodes_from(range(len(coords)))
      for i in range(len(coords)):
+         for j in indices[i, 1:]:
              G.add_edge(int(i), int(j))
      return G
 
+ def build_threshold_graph(H: np.ndarray, top_pct: float = 0.05, use_cosine: bool = True, include_ties: bool = True) -> nx.Graph:
      if use_cosine:
          S = cosine_similarity_matrix(H)
      else:
+         S = H @ H.T
 
      N = S.shape[0]
+     iu = np.triu_indices(N, k=1)
+     vals = S[iu]
+
+     # threshold at the (1 - top_pct) quantile
+     q = 1.0 - top_pct
+     thr = float(np.quantile(vals, q))
      G = nx.Graph()
      G.add_nodes_from(range(N))
 
+     if include_ties:
+         mask = vals >= thr
+     else:
+         # strictly greater than the threshold reduces tie-inflation
+         mask = vals > thr
+
+     rows = iu[0][mask]
+     cols = iu[1][mask]
+     wts = vals[mask]
+
+     for r, c, w in zip(rows, cols, wts):
+         G.add_edge(int(r), int(c), weight=float(w))
+     return G
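Concretely, the quantile rule works like this (a minimal sketch using the function above; the sizes are illustrative): N tokens give N·(N−1)/2 candidate pairs, and only the top top_pct fraction of similarities become edges.

# 5 points → 10 upper-triangle pairs; top_pct=0.2 keeps roughly the 2
# most-similar pairs (ties at the quantile can add a few more).
import numpy as np
rng = np.random.default_rng(1)
H = rng.normal(size=(5, 8))
G = build_threshold_graph(H, top_pct=0.2, use_cosine=True)
print(G.number_of_edges())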
 
  def percolation_stats(G: nx.Graph) -> Dict[str, float]:
      """
  ...
                  largest_component_size=largest,
                  component_sizes=sorted(sizes, reverse=True))
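The body of percolation_stats is elided by this hunk; only the docstring opening and the return tail are visible. For orientation, a sketch consistent with that tail and with the per-layer φ/#clusters/χ comment in the removed orchestration code might look like the following (every field except the two visible ones is an assumption):

# Hypothetical reconstruction, not the commit's code: connected-component
# statistics in the spirit of percolation analysis.
import networkx as nx

def percolation_stats_sketch(G: nx.Graph) -> dict:
    N = max(G.number_of_nodes(), 1)
    sizes = [len(c) for c in nx.connected_components(G)]
    largest = max(sizes) if sizes else 0
    rest = sorted(sizes, reverse=True)[1:]
    return dict(phi=largest / N,                   # giant-component fraction
                n_components=len(sizes),
                chi=sum(s * s for s in rest) / N,  # susceptibility-style sum
                largest_component_size=largest,
                component_sizes=sorted(sizes, reverse=True))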
 
+ def cluster_layer(features: np.ndarray, G: Optional[nx.Graph], method: str,
+                   n_clusters_kmeans: int = 6, hdbscan_min_cluster_size: int = 4) -> np.ndarray:
+     # (Same as original)
+     method = method.lower()
+     N = len(features)
+     if method == "auto":
+         if HAS_IGRAPH_LEIDEN and G and G.number_of_edges() > 0: return leiden_communities(G)
+         elif HAS_HDBSCAN: return hdbscan.HDBSCAN(min_cluster_size=hdbscan_min_cluster_size).fit_predict(features)
+         else: return KMeans(n_clusters=min(n_clusters_kmeans, N), n_init="auto").fit_predict(features)
+     # ... (rest of method dispatch unchanged)
+     return KMeans(n_clusters=min(n_clusters_kmeans, N), n_init="auto").fit_predict(features)
 
+ # Helper for Leiden (from original)
  def leiden_communities(G: nx.Graph) -> np.ndarray:
+     if not HAS_IGRAPH_LEIDEN: raise RuntimeError("Missing igraph")
      mapping = {n: i for i, n in enumerate(G.nodes())}
      edges = [(mapping[u], mapping[v]) for u, v in G.edges()]
      ig_g = ig.Graph(n=len(mapping), edges=edges, directed=False)
+     part = la.find_partition(ig_g, la.RBConfigurationVertexPartition)
      labels = np.zeros(len(mapping), dtype=int)
      for cid, comm in enumerate(part):
+         for node in comm: labels[node] = cid
      return labels
 
+ def anchor_features(H: np.ndarray, anchors: np.ndarray, temperature: float = 1.0):
+     dists = pairwise_distances(H, anchors, metric="euclidean")
+     logits = -dists / max(temperature, 1e-6)
+     logits = logits - logits.max(axis=1, keepdims=True)
+     P = np.exp(logits)
+     P /= P.sum(axis=1, keepdims=True) + 1e-12
+     # Entropy calculation
+     H_unc = -np.sum(P * np.log(P + 1e-12), axis=1)
+     return dists, P, H_unc
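The soft assignment is a softmax over negative anchor distances, so the entropy H_unc ranges from 0 (state pinned to one anchor) to ln K (state equidistant from all anchors). A numeric check (a minimal sketch using the function above; the coordinates are illustrative):

# (2, 2) is equidistant from the three anchors → uniform P, entropy ln(3);
# (0.1, 0) sits almost on anchor 0 → peaked P, much lower entropy.
import numpy as np
anchors = np.array([[0.0, 0.0], [4.0, 0.0], [0.0, 4.0]])  # K = 3
H = np.array([[2.0, 2.0], [0.1, 0.0]])
dists, P, H_unc = anchor_features(H, anchors, temperature=1.0)
print(np.log(3), H_unc)  # H_unc[0] ≈ 1.099, H_unc[1] well below it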
 
+ def fit_global_anchors(pool: np.ndarray, K: int) -> np.ndarray:
+     km = KMeans(n_clusters=K, n_init="auto", random_state=42)
+     km.fit(pool)
+     return km.cluster_centers_
 
 
+ # ====== Model I/O (hidden states) =============================================================
  @dataclass
  class HiddenStatesBundle:
      """
  ...
      tokens = tokenizer.convert_ids_to_tokens(inputs["input_ids"][0])
      return HiddenStatesBundle(hidden_layers=hs, tokens=tokens)
 
+
+ # ====== LoT-style anchors & features ==========================================================
  def fit_global_anchors(all_states_sampled: np.ndarray, K: int, random_state: int = 42) -> np.ndarray:
      """
      Fit KMeans cluster centroids on a pooled set of states (from many layers/texts).
  ...
      kmeans.fit(all_states_sampled)
      return kmeans.cluster_centers_  # (K, D)
 
  def anchor_features(H: np.ndarray, anchors: np.ndarray, temperature: float = 1.0) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
      """
      For states H (N,D) and anchors A (K,D):
  ...
      P = np.exp(logits)
      P /= P.sum(axis=1, keepdims=True) + 1e-12
      # Uncertainty (entropy)
+     H_unc = -np.sum(P * np.log(P + 1e-12), axis=1)
+
      return dists, P, H_unc
 
+
+ # ====== Dimensionality reduction / embeddings ================================================
  def fit_umap_2d(pool: np.ndarray,
                  n_neighbors: int = 30,
                  min_dist: float = 0.05,
  ...
      reducer.fit(pool)
      return reducer
 
  def fit_umap_3d(all_states: np.ndarray,
                  n_neighbors: int = 30,
  ...
                  metric=metric, random_state=random_state)
      return reducer.fit_transform(all_states)
 
+ # ====== Visualization ========================================================================
  def plotly_3d_layers(xy_layers: List[np.ndarray],
                       layer_tokens: List[List[str]],
                       layer_cluster_labels: List[np.ndarray],
+                      layer_pos_tags: List[List[str]],
                       layer_uncertainty: List[np.ndarray],
                       layer_graphs: List[nx.Graph],
+                      color_by: str = "cluster",
+                      title: str = "3D Cluster Formation",
+                      prompt: str = None) -> go.Figure:
+
      fig_data = []
 
+     # Define categorical colormap for POS
+     pos_map = {
+         "NOUN": "#1f77b4", "VERB": "#d62728", "ADJ": "#2ca02c",
+         "ADV": "#ff7f0e", "PRON": "#9467bd", "DET": "#8c564b",
+         "ADP": "#e377c2", "NUM": "#7f7f7f", "PUNCT": "#bcbd22",
+         "SYM": "#17becf", "UNK": "#bababa"
+     }
+
+     L = len(xy_layers)
+     for l, (xy, tokens, labels, pos, unc, G) in enumerate(zip(xy_layers, layer_tokens, layer_cluster_labels, layer_pos_tags, layer_uncertainty, layer_graphs)):
+         if len(xy) == 0: continue
          x, y = xy[:, 0], xy[:, 1]
          z = np.full_like(x, l, dtype=float)
 
+         # Color logic
+         if color_by == "pos":
+             # Map POS strings to colors
+             node_colors = [pos_map.get(p, "#333333") for p in pos]
+             show_scale = False
+             colorscale = None
+         else:
+             # Cluster ID
+             node_colors = labels
+             show_scale = (l == 0)
+             colorscale = 'Viridis'
+
+         # Hover text
+         node_text = [
+             f"L{l} | {tok}<br>POS: {p}<br>Cluster: {c}<br>Unc: {u:.2f}"
+             for tok, p, c, u in zip(tokens, pos, labels, unc)
+         ]
+
          node_trace = go.Scatter3d(
              x=x, y=y, z=z,
              mode='markers',
              name=f"Layer {l}",
+             showlegend=False,
              marker=dict(
+                 size=3,
+                 opacity=1,
+                 color=node_colors,
+                 colorscale=colorscale,
+                 showscale=show_scale,
+                 colorbar=dict(title="Cluster ID") if show_scale else None
              ),
              text=node_text,
              hovertemplate="%{text}<extra></extra>"
          )
          fig_data.append(node_trace)
 
+         # Edges
          if G is not None and G.number_of_edges() > 0:
              edge_x, edge_y, edge_z = [], [], []
              for u, v in G.edges():
                  edge_x += [x[u], x[v], None]
                  edge_y += [y[u], y[v], None]
                  edge_z += [z[u], z[v], None]
+
              edge_trace = go.Scatter3d(
                  x=edge_x, y=edge_y, z=edge_z,
                  mode='lines',
+                 line=dict(width=2, color='red'),
+                 opacity=0.6,
+                 hoverinfo='skip',
+                 showlegend=False
              )
              fig_data.append(edge_trace)
 
+     # Trajectories (connect same token across layers)
+     if L > 1:
+         T = len(xy_layers[0])
+         # Sample trajectories to avoid lag if T is huge
+         step = max(1, T // 100)
+         for i in range(0, T, step):
+             xs = [xy_layers[l][i, 0] for l in range(L)]
+             ys = [xy_layers[l][i, 1] for l in range(L)]
+             zs = list(range(L))
+             traj = go.Scatter3d(
+                 x=xs, y=ys, z=zs,
+                 mode='lines',
+                 line=dict(width=3, color='rgba(50,50,50,0.5)'),
+                 hoverinfo='skip',
+                 showlegend=False
+             )
+             fig_data.append(traj)
+     if color_by == "pos":
+         # Add legend-only traces for POS categories actually present
+         present_pos = sorted({p for layer in layer_pos_tags for p in layer})
+
+         for p in present_pos:
+             fig_data.append(
+                 go.Scatter3d(
+                     x=[None], y=[None], z=[None],  # legend-only
+                     mode="markers",
+                     name=p,
+                     marker=dict(size=8, color=pos_map.get(p, "#333333")),
+                     showlegend=True,
+                     hoverinfo="skip"
+                 )
+             )
 
      fig = go.Figure(data=fig_data)
      fig.update_layout(
+         title=dict(
+             text=title,
+             x=0.5,
+             xanchor="center",
+         ),
+         annotations=[
+             dict(
+                 text=f"<b>Prompt:</b> {prompt}",
+                 x=0.5,
+                 y=1.02,
+                 xref="paper",
+                 yref="paper",
+                 showarrow=False,
+                 font=dict(size=13),
+                 align="center"
+             )
+         ] if prompt else [],
          scene=dict(
              xaxis_title="UMAP X",
              yaxis_title="UMAP Y",
+             zaxis_title="Layer Depth",
+             aspectratio=dict(x=1, y=1, z=1.5)
          ),
          height=900,
+         margin=dict(l=0, r=0, b=0, t=40)
      )
      return fig
 
+ def run_pipeline(cfg: Config, model, tok, device, main_text: str, save_artifacts: bool = False):
      seed_everything(42)
 
+     # 1. Extract Hidden States
+     from transformers import logging
+     logging.set_verbosity_error()
 
+     # Extract
      main_bundle = extract_hidden_states(model, tok, main_text, cfg.max_length, device)
+     layers_np = main_bundle.hidden_layers
+     tokens = main_bundle.tokens
      L_all = len(layers_np)
 
+     # 2. Get POS Tags
+     pos_tags = get_pos_tags(main_text, tok, tokens)
 
+     # 3. Pooling & Anchors (LoT)
+     # (Simplified: just pool from the main text for speed in the demo)
+     pool_states = np.vstack([layers_np[l] for l in range(0, L_all, 2)])
+     idx = np.random.choice(len(pool_states), min(len(pool_states), 2000), replace=False)
+     anchors = fit_global_anchors(pool_states[idx], cfg.anchor_k)
 
+     # 4. Process Layers
+     layer_features = []
+     layer_uncertainties = []
      layer_graphs = []
+     layer_cluster_labels = []
+     percolation = []
+
      for l in range(L_all):
+         H = layers_np[l]
+
+         # Features & Uncertainty
+         dists, P, H_unc = anchor_features(H, anchors, cfg.anchor_temp)
+         layer_features.append(dists)
+         layer_uncertainties.append(H_unc)
+
+         # Graphs
          if cfg.graph_mode == "knn":
+             G = build_knn_graph(dists, cfg.knn_k, metric="euclidean")
          else:
+             G = build_threshold_graph(H, cfg.sim_threshold, use_cosine=cfg.use_cosine)
          layer_graphs.append(G)
 
+         # Clusters
+         labels = cluster_layer(dists, G, cfg.cluster_method,
+                                cfg.n_clusters_kmeans, cfg.hdbscan_min_cluster_size)
          layer_cluster_labels.append(labels)
 
+         # Percolation
+         percolation.append(percolation_stats(G))
 
+     # 5. UMAP & Alignment
+     # Fit UMAP on the pool to establish a coordinate system
+     reducer = umap.UMAP(n_components=2, n_neighbors=cfg.umap_n_neighbors,
+                         min_dist=cfg.umap_min_dist, metric=cfg.umap_metric, random_state=42)
+     reducer.fit(pool_states[idx])
+
+     xy_by_layer = []
+     for l in range(L_all):
+         # Transform into 2D
+         xy = reducer.transform(layers_np[l])
 
+         # Procrustes alignment: align layer l to layer l-1
+         if cfg.align_layers and l > 0:
+             xy = orthogonal_align(xy_by_layer[l-1], xy)
 
+         xy_by_layer.append(xy)
 
+     # 6. Plot
      fig = plotly_3d_layers(
          xy_layers=xy_by_layer,
+         layer_tokens=[tokens] * L_all,
          layer_cluster_labels=layer_cluster_labels,
+         layer_pos_tags=[pos_tags] * L_all,
          layer_uncertainty=layer_uncertainties,
          layer_graphs=layer_graphs,
+         color_by=cfg.color_by,
+         title=f"{cfg.model_name.rsplit('/', 1)[-1]} 3D MRI | Color: {cfg.color_by.upper()} | Aligned: {cfg.align_layers}",
+         prompt=main_text
      )
 
+     # 7. Save artifacts
      if save_artifacts:
+         import os
+         # Create the directory if it doesn't exist
+         os.makedirs(cfg.out_dir, exist_ok=True)
+
+         # Construct the full path
+         out_path = os.path.join(cfg.out_dir, cfg.plotly_html)
+
+         # Write the HTML file
+         fig.write_html(out_path)
+         print(f"Successfully saved 3D plot to: {out_path}")
 
      return fig, {"percolation": percolation, "tokens": tokens}
 
 
  def get_model_and_tok(model_name: str):
      device = "cuda" if torch.cuda.is_available() else "cpu"
      dtype = torch.float16 if device == "cuda" else torch.float32
+     config = AutoConfig.from_pretrained(model_name, output_hidden_states=True, trust_remote_code=True)
+     tok = AutoTokenizer.from_pretrained(model_name, use_fast=True, trust_remote_code=True)
+     if tok.pad_token_id is None:
+         tok.pad_token = tok.eos_token
+
+     model = AutoModelForCausalLM.from_pretrained(
+         model_name,
+         trust_remote_code=True,
+         config=config,
+         torch_dtype=dtype if device == "cuda" else None,
+         device_map="auto" if device == "cuda" else None
+     )
+     model.eval()
+
+     if device != "cuda":
+         model = model.to(device)
+
      return model, tok, device, dtype
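Since loading is expensive, a Streamlit app would normally reuse this loader through a resource cache; the removed code indeed referred to get_model_and_tok as a "cached model loader (resource cache)". A minimal sketch of that wiring (the decorator placement is an assumption, since the decorator line itself is outside this hunk):

# Cache the loaded model/tokenizer across Streamlit reruns.
import streamlit as st

@st.cache_resource(show_spinner=False)
def cached_model_and_tok(model_name: str):
    return get_model_and_tok(model_name)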
 
  def main():
+     st.set_page_config(page_title="LLM Hidden Layer Explorer", layout="wide")
+     st.title("Token Embedding Explorer (Live Hidden States)")
 
      with st.sidebar:
          st.header("Model / Input")
+         model_name = st.selectbox("Model", MODELS, index=1)
          max_length = st.slider("Max tokens", 16, 256, 64, step=16)
 
          st.header("Graph")
  ...
          st.header("Outputs")
          save_artifacts = st.checkbox("Save artifacts to disk (HTML/CSV/NPZ)", value=False)
 
+     prompt_col, run_col = st.columns([4, 1])
+
      with prompt_col:
+         main_text = st.selectbox(
+             "Prompt to visualize (hidden states computed on this text)",
+             options=DEFAULT_CORPUS,
+             index=0,
+             help="Select a predefined prompt for analysis"
          )
+
      with run_col:
          st.write("")
          st.write("")