Source code for uchrom.recon.bulk.mds.torch_mds

# PyTorch MDS with GPU acceleration (CUDA / MPS / CPU)

import torch
import numpy as np



[docs]
def get_device(device='auto'):
    """Get appropriate torch device."""
    if device == 'auto':
        if torch.cuda.is_available():
            return torch.device('cuda')
        elif torch.backends.mps.is_available():
            return torch.device('mps')
        else:
            return torch.device('cpu')
    return torch.device(device)




[docs]
def get_dtype(device):
    """MPS only supports float32."""
    if device.type == 'mps':
        return torch.float32
    return torch.float64




[docs]
def compute_stress(coords, dist_mat, weights=None):
    """Compute MDS stress, skipping missing-data pairs (dist_mat == 0)."""
    pred_dist = torch.cdist(coords, coords)
    diff_sq = (pred_dist - dist_mat) ** 2
    if weights is not None:
        diff_sq = weights * diff_sq
    # only sum over pairs with observed distances (nonzero upper triangle)
    mask = torch.triu(dist_mat > 0, diagonal=1)
    stress = (diff_sq * mask).sum()
    return stress




[docs]
def cmds_init(dist_mat):
    """Classical MDS initialization via eigendecomposition."""
    n = dist_mat.shape[0]
    dtype = dist_mat.dtype
    device = dist_mat.device

    D_sq = dist_mat ** 2
    row_mean = D_sq.mean(dim=1, keepdim=True)
    col_mean = D_sq.mean(dim=0, keepdim=True)
    grand_mean = D_sq.mean()
    B = -0.5 * (D_sq - row_mean - col_mean + grand_mean)

    try:
        eigenvalues, eigenvectors = torch.linalg.eigh(B)
        idx = torch.argsort(eigenvalues, descending=True)[:3]
        top_eigenvalues = torch.clamp(eigenvalues[idx], min=1e-10)
        top_eigenvectors = eigenvectors[:, idx]
        coords = top_eigenvectors * torch.sqrt(top_eigenvalues)
    except RuntimeError:
        coords = torch.randn(n, 3, dtype=dtype, device=device)

    return coords




[docs]
def smacof(dist_mat, device='auto', n_iter=1000, tol=1e-6,
           init='cmds', verbose=False):
    """Run SMACOF (Scaling by MAjorizing a Complicated Function) MDS.

    Unlike the Adam-based approach, SMACOF uses a majorization algorithm
    that does not require autograd, resulting in much lower per-iteration
    overhead on CPU."""
    dev = get_device(device)
    dtype = get_dtype(dev)

    if isinstance(dist_mat, np.ndarray):
        dist_mat = torch.from_numpy(dist_mat)
    dist_mat = dist_mat.to(dtype=dtype, device=dev)
    n = dist_mat.shape[0]

    # weight matrix: 1 for observed pairs, 0 for missing (precomputed)
    diag_mask = torch.eye(n, dtype=torch.bool, device=dev)
    W = ((dist_mat > 0) & ~diag_mask).to(dtype=dtype)

    # V diagonal (row sums of W) — used as denominator in Guttman transform
    V_diag = W.sum(dim=1)
    V_diag = torch.clamp(V_diag, min=1.0)  # avoid division by zero

    # initialize coordinates
    if init == 'cmds':
        coords = cmds_init(dist_mat)
    else:
        coords = torch.randn(n, 3, dtype=dtype, device=dev)

    prev_stress = float('inf')
    with torch.no_grad():
        for i in range(n_iter):
            # current pairwise distances
            d_current = torch.cdist(coords, coords)

            # compute stress (only on observed pairs, upper triangle)
            diff_sq = (d_current - dist_mat) ** 2
            mask_upper = torch.triu(W, diagonal=1)
            stress = (diff_sq * mask_upper).sum().item()

            if verbose and i % 100 == 0:
                print(f"Iteration {i}: stress = {stress:.6f}")

            # convergence check (relative)
            if prev_stress != float('inf'):
                rel_change = abs(prev_stress - stress) / max(prev_stress, 1e-12)
                if rel_change < tol:
                    if verbose:
                        print(f"Converged at iteration {i}")
                    break
            prev_stress = stress

            # Guttman transform: B matrix
            # B[i,j] = -W[i,j] * d_target[i,j] / d_current[i,j]
            safe_d = torch.clamp(d_current, min=1e-12)
            B = -W * dist_mat / safe_d
            B.fill_diagonal_(0)
            B.diagonal().copy_(-B.sum(dim=1))

            # update: coords = B @ coords / V_diag
            coords = B @ coords / V_diag.unsqueeze(1)

    coords = coords - coords.mean(dim=0, keepdim=True)
    return coords.cpu().numpy()




[docs]
def torch_mds(dist_mat, device='auto', n_iter=1000, lr=0.01,
              tol=1e-6, init='cmds', verbose=False, method='smacof'):
    """Run iterative MDS.

    Args:
        method: 'smacof' (default, fast) or 'adam' (gradient descent).
    """
    if method == 'smacof':
        return smacof(dist_mat, device=device, n_iter=n_iter,
                      tol=tol, init=init, verbose=verbose)

    # Adam-based gradient descent (original implementation)
    dev = get_device(device)
    dtype = get_dtype(dev)

    if isinstance(dist_mat, np.ndarray):
        dist_mat = torch.from_numpy(dist_mat)
    dist_mat = dist_mat.to(dtype=dtype, device=dev)
    n = dist_mat.shape[0]

    if init == 'cmds':
        coords = cmds_init(dist_mat)
    else:
        coords = torch.randn(n, 3, dtype=dtype, device=dev)
    coords = coords.requires_grad_(True)

    optimizer = torch.optim.Adam([coords], lr=lr)

    prev_loss = float('inf')
    for i in range(n_iter):
        optimizer.zero_grad()
        loss = compute_stress(coords, dist_mat)
        loss.backward()
        optimizer.step()

        current_loss = loss.item()
        if verbose and i % 100 == 0:
            print(f"Iteration {i}: stress = {current_loss:.6f}")
        if abs(prev_loss - current_loss) < tol:
            if verbose:
                print(f"Converged at iteration {i}")
            break
        prev_loss = current_loss

    result = coords.detach()
    result = result - result.mean(dim=0, keepdim=True)
    return result.cpu().numpy()




[docs]
def run_mds(contact_mat, alpha=4.0, device='auto', weight=0.05, **kwargs):
    """Full MDS pipeline: contact matrix -> 3D coordinates.

    Zero-contact bins (rows/columns with no observed contacts) are removed
    before MDS, matching miniMDS behavior. Returns coordinates only for
    non-zero bins.

    Returns:
        coords: np.ndarray of shape (n_nonzero, 3)
        nonzero_mask: np.ndarray boolean mask of shape (n_total,)
            indicating which bins were kept
    """
    from .core import (
        contact_to_distance,
        normalize_distances,
        apply_distance_decay_prior
    )

    dev = get_device(device)
    dtype = get_dtype(dev)
    contact_mat = contact_mat.to(dtype=dtype, device=dev)

    print(f"Processing on device: {dev} (dtype: {dtype})")

    # Identify zero-contact bins BEFORE applying distance decay prior
    row_sums = contact_mat.sum(dim=1)
    nonzero_mask = (row_sums > 0).cpu().numpy()
    n_total = len(nonzero_mask)
    n_nonzero = nonzero_mask.sum()

    if n_nonzero < n_total:
        idx = torch.where(torch.from_numpy(nonzero_mask).to(dev))[0]
        contact_mat = contact_mat[idx][:, idx]
        print(f"  Removed {n_total - n_nonzero} zero-contact bins "
              f"({n_nonzero}/{n_total} kept)")

    if weight > 0:
        contact_mat = apply_distance_decay_prior(contact_mat, weight)

    dist_mat = contact_to_distance(contact_mat, alpha)
    dist_mat = normalize_distances(dist_mat)

    coords = torch_mds(dist_mat, device=device, **kwargs)
    return coords, nonzero_mask