import equinox as eqx
import jax
import jax.numpy as jnp
import matplotlib.pyplot as plt
import numpy as np

from thrml.block_management import Block
from thrml.block_sampling import BlockGibbsSpec, SamplingSchedule, sample_states
from thrml.factor import FactorSamplingProgram
from thrml.models.discrete_ebm import (
    CategoricalEBMFactor,
    CategoricalGibbsConditional,
    SpinEBMFactor,
    SpinGibbsConditional,
)
from thrml.pgm import CategoricalNode, SpinNode

# Problem settings.
#
# First 100 amino acids of the SARS-CoV-2 spike protein.
# One-letter amino-acid codes; every letter is looked up in CODON_TABLE.
SEQ = "MFVFLVLLPLVSSQCVNLTTRTQLPPAYTNSFTRGVYYPDKVFRSSVLHSTQDLFLPFFSNVTWFHAIHVSGTNGTKRFDNPVLPFNDGVYFASTEKSNI"

# Relative weights of the two energy terms (see codon_energy / potts_weights).
WEIGHT_USAGE = 1.0  # how much we care about avoiding rare codons
WEIGHT_REPEAT = 0.5  # how much we care about avoiding nucleotide repeats

N_CHAINS = 512  # number of independent optimization runs (annealed in parallel via vmap)
SEED = 42  # seed for jax.random.key; both the Potts and the Ising anneal use it
K_MAX = 6  # the most synonymous codons any amino acid has (width the lookup tables are padded to)

# Standard genetic code: synonymous codons (DNA) for each amino acid.
# The position of a codon inside its list is the "codon index" k that the rest of the
# file uses as the categorical state (see build_lookups and indices_to_dna), so the
# order of each list must not be changed independently of the lookup tables.
CODON_TABLE = {
    "A": ["GCT", "GCC", "GCA", "GCG"],
    "C": ["TGT", "TGC"],
    "D": ["GAT", "GAC"],
    "E": ["GAA", "GAG"],
    "F": ["TTT", "TTC"],
    "G": ["GGT", "GGC", "GGA", "GGG"],
    "H": ["CAT", "CAC"],
    "I": ["ATT", "ATC", "ATA"],
    "K": ["AAA", "AAG"],
    "L": ["TTA", "TTG", "CTT", "CTC", "CTA", "CTG"],
    "M": ["ATG"],
    "N": ["AAT", "AAC"],
    "P": ["CCT", "CCC", "CCA", "CCG"],
    "Q": ["CAA", "CAG"],
    "R": ["CGT", "CGC", "CGA", "CGG", "AGA", "AGG"],
    "S": ["TCT", "TCC", "TCA", "TCG", "AGT", "AGC"],
    "T": ["ACT", "ACC", "ACA", "ACG"],
    "V": ["GTT", "GTC", "GTA", "GTG"],
    "W": ["TGG"],
    "Y": ["TAT", "TAC"],
}

# E. coli K-12 codon usage frequencies (fraction within each amino acid),
# rounded to 2 decimals. Source: the python_codon_tables package (e_coli_316407).
# Because of the rounding, the fractions of one amino acid need not sum to exactly 1
# (e.g. the "G" row sums to 1.01). Only ratios to the per-amino-acid maximum are used
# (see ecoli_rarity_scores), so this does not need to be renormalized.
ECOLI_FREQ = {
    "A": {"GCT": 0.16, "GCC": 0.27, "GCA": 0.21, "GCG": 0.36},
    "C": {"TGT": 0.44, "TGC": 0.56},
    "D": {"GAT": 0.63, "GAC": 0.37},
    "E": {"GAA": 0.69, "GAG": 0.31},
    "F": {"TTT": 0.57, "TTC": 0.43},
    "G": {"GGT": 0.34, "GGC": 0.41, "GGA": 0.11, "GGG": 0.15},
    "H": {"CAT": 0.57, "CAC": 0.43},
    "I": {"ATT": 0.51, "ATC": 0.42, "ATA": 0.07},
    "K": {"AAA": 0.76, "AAG": 0.24},
    "L": {"TTA": 0.13, "TTG": 0.13, "CTT": 0.10, "CTC": 0.10, "CTA": 0.04, "CTG": 0.50},
    "M": {"ATG": 1.00},
    "N": {"AAT": 0.45, "AAC": 0.55},
    "P": {"CCT": 0.16, "CCC": 0.12, "CCA": 0.19, "CCG": 0.53},
    "Q": {"CAA": 0.35, "CAG": 0.65},
    "R": {"CGT": 0.38, "CGC": 0.40, "CGA": 0.06, "CGG": 0.10, "AGA": 0.04, "AGG": 0.02},
    "S": {"TCT": 0.15, "TCC": 0.15, "TCA": 0.12, "TCG": 0.15, "AGT": 0.15, "AGC": 0.28},
    "T": {"ACT": 0.16, "ACC": 0.44, "ACA": 0.13, "ACG": 0.27},
    "V": {"GTT": 0.26, "GTC": 0.22, "GTA": 0.15, "GTG": 0.37},
    "W": {"TGG": 1.00},
    "Y": {"TAT": 0.57, "TAC": 0.43},
}


def ecoli_rarity_scores():
    """Map every codon in ECOLI_FREQ to its rarity score |log(f / f_max)|.

    f is the codon's usage fraction and f_max the largest fraction among the
    codons of the same amino acid, so the most used codon of each amino acid
    scores 0 and less used codons score higher.
    """
    scores = {}
    for fractions in ECOLI_FREQ.values():
        top = max(fractions.values())
        scores.update({codon: abs(np.log(f / top)) for codon, f in fractions.items()})
    return scores

def longest_run(s):
    """Return the length of the longest run of a single repeated character in s.

    Args:
        s: a sliceable sequence (typically a DNA string).

    Returns:
        The maximal number of equal consecutive elements; 0 for an empty
        sequence (it contains no run at all), at least 1 otherwise.
    """
    # An empty sequence has no run; without this guard the counters below
    # would report a run of length 1 that does not exist.
    if len(s) == 0:
        return 0
    best = run = 1
    # Walk over adjacent pairs: extend the current run on a match, restart it otherwise.
    for prev, cur in zip(s, s[1:]):
        run = run + 1 if prev == cur else 1
        best = max(best, run)
    return best


def repeat_penalty(c1, c2):
    """Repeat penalty for two adjacent codons c1 and c2.

    The codons are concatenated into one window (6 nucleotides for two
    3-letter codons) and the penalty is the squared length of the longest
    single-nucleotide run in that window, minus 1, so a window whose longest
    run has length 1 costs 0.
    """
    window = c1 + c2
    run_length = longest_run(window)
    return run_length**2 - 1

def build_lookups(seq):
    """Tabulate the two energy terms for the amino-acid sequence seq.

    Returns a tuple (rarity_lookup, repeat_lookup, Ks):
      * rarity_lookup: jnp float32 array [len(seq), K_MAX]; entry [p, k] is the
        rarity score of the k-th codon of the amino acid at position p.
      * repeat_lookup: jnp float32 array [len(seq) - 1, K_MAX, K_MAX]; entry
        [p, k, kp] is repeat_penalty of codon k at position p followed by codon
        kp at position p + 1.
      * Ks: list with the number of valid codons at each position.
    Slots beyond the valid codons of a position are left at 0.
    """
    n_positions = len(seq)
    codons_at = [CODON_TABLE[aa] for aa in seq]  # valid codons, position by position
    n_codons = [len(codons) for codons in codons_at]
    scores = ecoli_rarity_scores()

    # Unary term: one padded row of rarity scores per position.
    usage_table = np.zeros((n_positions, K_MAX), dtype=np.float32)
    for pos, codons in enumerate(codons_at):
        usage_table[pos, : len(codons)] = [scores[codon] for codon in codons]

    # Pairwise term: one padded matrix per pair of adjacent positions.
    pair_table = np.zeros((n_positions - 1, K_MAX, K_MAX), dtype=np.float32)
    for pos, (left_codons, right_codons) in enumerate(zip(codons_at, codons_at[1:])):
        for i, left in enumerate(left_codons):
            for j, right in enumerate(right_codons):
                pair_table[pos, i, j] = repeat_penalty(left, right)

    return jnp.array(usage_table), jnp.array(pair_table), n_codons


def codon_energy(indices):
    """Energy of one codon configuration, as the pair (usage term, repeat term).

    indices holds one codon index per position. The usage term sums the
    module-level rarity_lookup entries selected by indices and scales them by
    WEIGHT_USAGE; the repeat term sums the module-level repeat_lookup entries
    of every adjacent pair and scales them by WEIGHT_REPEAT.
    """
    n_positions = indices.shape[-1]
    # Unary part: pick entry [p, indices[p]] for every position p.
    per_position = rarity_lookup[jnp.arange(n_positions), indices]
    # Pairwise part: pick entry [p, indices[p], indices[p + 1]] for every adjacent pair.
    left, right = indices[:-1], indices[1:]
    per_pair = repeat_lookup[jnp.arange(n_positions - 1), left, right]
    usage = WEIGHT_USAGE * per_position.sum()
    repeat = WEIGHT_REPEAT * per_pair.sum()
    return usage, repeat

# Build the module-level lookup tables that codon_energy reads, plus the per-position
# codon counts Ks, for the target sequence.
rarity_lookup, repeat_lookup, Ks = build_lookups(SEQ)
L = len(SEQ)  # number of positions (amino acids); also read inside the anneal functions
print(f"{L} amino acids; number of synonymous codons per position ranges from {min(Ks)} to {max(Ks)}")

100 amino acids; number of synonymous codons per position ranges from 1 to 6

W0601 19:51:55.681127  110732 cuda_executor.cc:1802] GPU interconnect information not available: INTERNAL: NVML doesn't support extracting fabric info or NVLink is not used by the device.
W0601 19:51:55.683414  110608 cuda_executor.cc:1802] GPU interconnect information not available: INTERNAL: NVML doesn't support extracting fabric info or NVLink is not used by the device.

# Weight written into the padded slots (index >= Ks[p]) of the unary bias table by
# potts_weights. The anneal multiplies the biases by beta, so the value has to stay
# hugely negative even at the smallest beta.
INVALID_BIAS = -1e10  # effectively forbids a padded (invalid) codon slot


def potts_weights(rarity_lookup, repeat_lookup, Ks):
    """Turn the energy lookup tables into THRML weights (weight = -energy contribution).

    Returns (biases, pairwise): biases is the negated, WEIGHT_USAGE-scaled
    rarity table as a jnp array, with every slot at index >= Ks[p] of row p
    overwritten by INVALID_BIAS; pairwise is the negated,
    WEIGHT_REPEAT-scaled repeat table.
    """
    # np.array makes a mutable host copy so the padded slots can be overwritten in place.
    unary = np.array(-WEIGHT_USAGE * rarity_lookup)
    for position, n_valid in enumerate(Ks):
        # Slots past the last valid codon are padding: make them effectively unreachable.
        unary[position, n_valid:] = INVALID_BIAS
    coupling = -WEIGHT_REPEAT * repeat_lookup
    return jnp.array(unary), coupling


def build_potts_program(biases, pairwise):
    """Build the Potts FactorSamplingProgram for the codon chain.

    One CategoricalNode is created per row of biases. The program has a
    per-node factor weighted by biases and an adjacent-pair factor weighted by
    pairwise, and its free blocks are the even and the odd positions (a
    2-coloring of the chain).

    Returns (program, block) where block is a Block over all nodes in position
    order.
    """
    n_positions = biases.shape[0]
    nodes = [CategoricalNode() for _ in range(n_positions)]

    usage_factor = CategoricalEBMFactor([Block(nodes)], biases)  # usage (per node)
    left_nodes, right_nodes = Block(nodes[:-1]), Block(nodes[1:])
    repeat_factor = CategoricalEBMFactor([left_nodes, right_nodes], pairwise)  # repeat (adjacent pairs)

    even_positions = Block(nodes[0::2])
    odd_positions = Block(nodes[1::2])
    free_blocks = [even_positions, odd_positions]

    spec = BlockGibbsSpec(free_blocks, [])
    samplers = [CategoricalGibbsConditional(K_MAX) for _ in free_blocks]
    program = FactorSamplingProgram(spec, samplers, [usage_factor, repeat_factor], [])
    return program, Block(nodes)


# Module-level Potts weights; anneal_potts rescales them by beta at every step and
# compile_dwc derives the Ising model from them.
biases, pairwise = potts_weights(rarity_lookup, repeat_lookup, Ks)

# Annealing schedule (defaults taken from the paper's Potts configuration; generous
# for this simplified objective, so you can safely reduce POTTS_STEPS to speed things up).
POTTS_STEPS = 4000  # number of beta values in the schedule
POTTS_SWEEPS_PER_STEP = 10  # Gibbs sweeps run at each beta
# beta is swept log-uniformly from POTTS_BETA_MIN to POTTS_BETA_MAX (see anneal_potts).
POTTS_BETA_MIN, POTTS_BETA_MAX = 0.1, 8.0


@eqx.filter_jit
def anneal_potts(key):
    """Simulated annealing of the Potts model, N_CHAINS chains in parallel.

    beta follows a log-spaced schedule of POTTS_STEPS values from POTTS_BETA_MIN to
    POTTS_BETA_MAX. At each beta the module-level biases/pairwise are scaled by beta,
    a fresh program is built, and every chain is advanced with sample_states from the
    state carried over from the previous step.

    Args:
        key: JAX PRNG key; split once into an initialization key and a scan key.

    Returns:
        (final_state, usage, repeat): the carried state after the last step and the
        two energy terms from codon_energy recorded after every step. Per the inline
        comments, usage and repeat are returned with shape (N_CHAINS, POTTS_STEPS).
    """
    betas = jnp.logspace(jnp.log10(POTTS_BETA_MIN), jnp.log10(POTTS_BETA_MAX), POTTS_STEPS)
    # One annealing step = POTTS_SWEEPS_PER_STEP warmup sweeps, then take a single sample
    # (the configuration we carry into the next, colder step).
    schedule = SamplingSchedule(n_warmup=POTTS_SWEEPS_PER_STEP, n_samples=1, steps_per_sample=1)

    def step(state, step_input):
        # scan body: state is the carry, step_input is one (key, beta) pair of the schedule.
        step_key, beta = step_input
        # Cooling = scaling the energy by beta = scaling the weights by beta.
        program, all_block = build_potts_program(beta * biases, beta * pairwise)
        blocks = [state[:, 0::2], state[:, 1::2]]  # split the carried state into even/odd blocks
        chain_keys = jax.random.split(step_key, N_CHAINS)
        # sample_states returns a list with one array per observed block, each of shape
        # (n_samples, n_nodes). Here there is a single observed block ([all_block]) and
        # n_samples=1, so [0] picks that block and [0] picks its one sample: the codon vector.
        new_state = jax.vmap(lambda k, b: sample_states(k, program, schedule, b, [], [all_block])[0][0])(
            chain_keys, blocks
        )
        # codon_energy returns (usage, repeat); vmap evaluates it once per chain.
        energies = jax.vmap(codon_energy)(new_state)
        return new_state, energies

    # Random valid starting codon at every position, for every chain.
    init_key, scan_key = jax.random.split(key)
    pos_keys = jax.random.split(init_key, L)
    # One key per position; the upper bound Ks[p] keeps the draw inside the valid codon slots.
    init_state = jax.vmap(lambda k, n: jax.random.randint(k, (N_CHAINS,), 0, n, dtype=jnp.uint8))(
        pos_keys, jnp.array(Ks)
    ).T  # shape (N_CHAINS, L)

    final_state, (usage, repeat) = jax.lax.scan(step, init_state, (jax.random.split(scan_key, POTTS_STEPS), betas))
    # usage, repeat have shape (POTTS_STEPS, N_CHAINS); transpose to (N_CHAINS, POTTS_STEPS).
    return final_state, usage.T, repeat.T

# Run the Potts anneal and move the results to NumPy for reporting.
potts_final, potts_usage, potts_repeat = anneal_potts(jax.random.key(SEED))
potts_final = np.array(potts_final)
potts_total = np.array(potts_usage + potts_repeat)  # total energy per chain and annealing step

# Chain with the lowest total energy at the last annealing step.
best_chain = int(np.argmin(potts_total[:, -1]))
print(
    f"final energy: {potts_total[:, -1].mean():.2f} +/- {potts_total[:, -1].std():.2f} "
    f"(mean over {N_CHAINS} chains)"
)
print(f"best energy found: {potts_total[best_chain, -1]:.2f}")

final energy: 107.36 +/- 0.54 (mean over 512 chains)
best energy found: 106.37

def plot_convergence(usage, repeat, color="C0", label=None):
    """Plot total, usage and repeat energy against the annealing step.

    usage and repeat are 2-D arrays with one row per chain and one column per
    annealing step. Each of the three side-by-side panels shows the mean over
    chains as a line and the 5th-95th percentile range as a shaded band. A
    legend is added to the first panel only when label is given.
    """
    total = usage + repeat
    fig, axes = plt.subplots(1, 3, figsize=(14, 4))
    panels = [("Total energy", total), ("Usage term", usage), ("Repeat term", repeat)]
    for ax, (title, series) in zip(axes, panels):
        steps = np.arange(series.shape[1])
        ax.plot(steps, series.mean(0), color=color, label=label)
        # Shaded band: spread across chains at every step.
        lower = np.percentile(series, 5, 0)
        upper = np.percentile(series, 95, 0)
        ax.fill_between(steps, lower, upper, color=color, alpha=0.25)
        ax.set(title=title, xlabel="annealing step", ylabel="energy")
        ax.grid(alpha=0.3)
    if label:
        axes[0].legend()
    fig.tight_layout()


# Energy traces of the Potts anneal (default color, no legend).
plot_convergence(potts_usage, potts_repeat)

def indices_to_dna(seq, indices):
    """Translate codon indices back into a DNA string.

    For each amino acid of seq and its paired entry of indices, the codon at
    that index in CODON_TABLE is looked up; the codons are concatenated in
    order.
    """
    codons = [CODON_TABLE[aa][int(choice)] for aa, choice in zip(seq, indices)]
    return "".join(codons)


# Decode the lowest-energy Potts chain into its DNA sequence and show the beginning.
best_dna = indices_to_dna(SEQ, potts_final[best_chain])
print(f"optimized coding DNA ({len(best_dna)} nucleotides), first 60:\n{best_dna[:60]}...")

# Illustration of the thermometer encoding for one variable with K = 4 states:
# state k is written with K - 1 spins, of which the first k are +1 and the rest -1.
K = 4
for state in range(K):
    spins = ["+1" if j < state else "-1" for j in range(K - 1)]
    print(f"state {state}:  [{', '.join(spins)}]")

state 0:  [-1, -1, -1]
state 1:  [+1, -1, -1]
state 2:  [+1, +1, -1]
state 3:  [+1, +1, +1]

def potts_to_spin(indices, pos_of_spin, spin_pos_index):
    """Encode codon indices [..., L] as thermometer spins [..., n_spins].

    pos_of_spin gives the position each spin belongs to and spin_pos_index its
    index within that position. A spin is True (meaning +1) exactly when its
    within-position index is smaller than the codon index of its position.
    """
    # Broadcast every position's codon index onto the spins that belong to it.
    codon_of_spin = indices[..., pos_of_spin]
    return spin_pos_index < codon_of_spin


def spin_to_potts(spins, pos_matrix):
    """Decode thermometer spins into codon indices [..., L].

    pos_matrix has one row per spin and one column per position; multiplying
    the spins (cast to int32) by it counts the +1 spins of every position.
    The counts are returned as uint8.
    """
    plus_ones = spins.astype(jnp.int32)
    counts = plus_ones @ pos_matrix
    return counts.astype(jnp.uint8)


def compile_dwc(biases, pairwise, Ks):
    """Compile the Potts weights into the static structure of the domain-wall Ising model.

    Position p with Ks[p] valid codons is represented by Ks[p] - 1 spins (a
    thermometer code, see potts_to_spin). Everything that does not depend on
    the annealing parameters is precomputed here; build_ising_program combines
    it with beta and the constraint strength P.

    Args:
        biases: unary Potts weights, indexed [position, codon].
        pairwise: Potts weights between adjacent positions, indexed
            [position, codon at position, codon at position + 1].
        Ks: number of valid codons at each position.

    Returns:
        A dict with:
          * "spin_nodes": one SpinNode per spin, in layout order.
          * "n_constraint": number of within-position constraint edges.
          * "bias_base": per-spin bias that does not depend on P.
          * "first_minus_last": +1 on the first spin of a position's chain,
            -1 on its last spin (0 when the chain has a single spin).
          * "constraint_left" / "constraint_right": endpoint nodes of the
            constraint edges.
          * "inter_left" / "inter_right" / "inter_weights": endpoint nodes and
            weights of the coupling edges between adjacent positions.
          * "free_blocks" / "block_indices": the color groups as Blocks and as
            arrays of spin indices, in the same order.
          * "pos_of_spin" / "spin_pos_index": position and within-position
            index of every spin.
          * "pos_matrix": [n_spins, L] 0/1 matrix mapping spins to positions.
    """
    biases, pairwise = np.asarray(biases), np.asarray(pairwise)
    L = len(Ks)

    # Lay out the spins: position p contributes Ks[p]-1 spins. Record, for each spin,
    # which position it belongs to (pos_of_spin) and its index within that position
    # (spin_pos_index). offset[p] is the first spin index of position p; it is read off
    # the running spin count, so the whole layout is built in a single linear pass.
    pos_of_spin, spin_pos_index, offset = [], [], []
    for p, K in enumerate(Ks):
        offset.append(len(pos_of_spin))
        for j in range(K - 1):
            pos_of_spin.append(p)
            spin_pos_index.append(j)
    pos_of_spin = np.array(pos_of_spin)
    spin_pos_index = np.array(spin_pos_index)
    n_spins = len(pos_of_spin)

    # Per-spin Ising bias, split into a P-independent part (bias_base) and the boundary
    # term that scales with P (first_minus_last is +1 at a chain's start, -1 at its end).
    bias_base = np.zeros(n_spins, dtype=np.float32)
    first_minus_last = np.zeros(n_spins, dtype=np.float32)
    for s, (p, j) in enumerate(zip(pos_of_spin, spin_pos_index)):
        K = Ks[p]
        b = (biases[p, j + 1] - biases[p, j]) / 2  # first difference of the unary bias
        if j == 0:
            first_minus_last[s] += 1.0
        if j == K - 2:
            first_minus_last[s] -= 1.0
        if p > 0:  # contribution from the coupling to the previous position
            W, Kl = pairwise[p - 1], Ks[p - 1]
            b += (W[0, j + 1] - W[0, j] + W[Kl - 1, j + 1] - W[Kl - 1, j]) / 4
        if p < L - 1:  # contribution from the coupling to the next position
            W, Kr = pairwise[p], Ks[p + 1]
            b += (W[j + 1, 0] - W[j, 0] + W[j + 1, Kr - 1] - W[j, Kr - 1]) / 4
        bias_base[s] = b

    # Constraint edges: the ferromagnetic chain inside each position (weight P/4).
    constraint_edges = [(offset[p] + j, offset[p] + j + 1) for p in range(L) for j in range(Ks[p] - 2)]

    # Coupling edges between adjacent positions, with weights from a second difference.
    inter_edges, inter_weights = [], []
    for p in range(L - 1):
        W = pairwise[p]
        for i in range(Ks[p] - 1):
            for j in range(Ks[p + 1] - 1):
                inter_edges.append((offset[p] + i, offset[p + 1] + j))
                inter_weights.append((W[i + 1, j + 1] - W[i, j + 1] - W[i + 1, j] + W[i, j]) / 4)

    spin_nodes = [SpinNode() for _ in range(n_spins)]

    # 4-coloring by (position parity, spin-index parity): no two same-color spins share an edge.
    # Constraint edges join neighbouring spin indices of one position, coupling edges join
    # neighbouring positions, so every edge flips one of the two parities.
    colors = {}
    for s in range(n_spins):
        colors.setdefault((pos_of_spin[s] % 2, spin_pos_index[s] % 2), []).append(s)
    # Both lists iterate colors.values(), so block k and index array k describe the same spins.
    free_blocks = [Block([spin_nodes[s] for s in group]) for group in colors.values()]
    block_indices = [np.array(group, dtype=np.int32) for group in colors.values()]

    return {
        "spin_nodes": spin_nodes,
        "n_constraint": len(constraint_edges),
        "bias_base": jnp.array(bias_base),
        "first_minus_last": jnp.array(first_minus_last),
        "constraint_left": [spin_nodes[a] for a, b in constraint_edges],
        "constraint_right": [spin_nodes[b] for a, b in constraint_edges],
        "inter_left": [spin_nodes[a] for a, b in inter_edges],
        "inter_right": [spin_nodes[b] for a, b in inter_edges],
        "inter_weights": jnp.array(inter_weights, dtype=np.float32),
        "free_blocks": free_blocks,
        "block_indices": block_indices,
        "pos_of_spin": jnp.array(pos_of_spin),
        "spin_pos_index": jnp.array(spin_pos_index),
        "pos_matrix": jnp.array(np.eye(L, dtype=np.int32)[pos_of_spin]),
    }


# Compile the Potts weights once; build_ising_program and anneal_ising read this
# module-level dict.
dwc = compile_dwc(biases, pairwise, Ks)
n_spins = len(dwc["spin_nodes"])
print(
    f"{L} categorical codon variables  ->  {n_spins} binary spins "
    f"({dwc['n_constraint']} constraint edges, {len(dwc['inter_left'])} coupling edges)"
)

100 categorical codon variables  ->  266 binary spins (168 constraint edges, 707 coupling edges)

# Annealing schedule of the Ising model (see anneal_ising).
ISING_STEPS = 500  # number of (beta, P) values in the schedule
ISING_SWEEPS_PER_STEP = 10  # warmup sweeps run at each step before the sample is taken
ISING_BETA_MIN, ISING_BETA_MAX = 2.0, 200.0  # beta is log-spaced between these
ISING_P_MIN, ISING_P_MAX = 2.0, 200.0  # constraint strength P is log-spaced between these
ISING_N_CONST_P = 25  # keep P at its minimum for this many initial steps before ramping it up


def build_ising_program(beta, P):
    """Build the Ising FactorSamplingProgram for temperature beta and constraint strength P.

    Reads the module-level dwc structure. The per-spin bias is the
    P-independent base plus P/4 times the chain-boundary term, all scaled by
    beta. Constraint edges (if any) get the uniform weight P * beta / 4 and
    coupling edges (if any) get their precompiled weights scaled by beta.
    """
    boundary_term = dwc["first_minus_last"] * (P / 4)
    ising_biases = (dwc["bias_base"] + boundary_term) * beta
    factors = [SpinEBMFactor([Block(dwc["spin_nodes"])], ising_biases)]

    n_constraint = dwc["n_constraint"]
    if n_constraint > 0:
        # Ferromagnetic chain inside each position.
        constraint_weights = jnp.full(n_constraint, P * beta / 4)
        chain_ends = [Block(dwc["constraint_left"]), Block(dwc["constraint_right"])]
        factors.append(SpinEBMFactor(chain_ends, constraint_weights))

    if dwc["inter_left"]:
        # Couplings between the spins of adjacent positions.
        coupling_ends = [Block(dwc["inter_left"]), Block(dwc["inter_right"])]
        factors.append(SpinEBMFactor(coupling_ends, dwc["inter_weights"] * beta))

    spec = BlockGibbsSpec(dwc["free_blocks"], [])
    samplers = [SpinGibbsConditional() for _ in spec.free_blocks]
    return FactorSamplingProgram(spec, samplers, factors, [])


@eqx.filter_jit
def anneal_ising(key):
    """Simulated annealing of the domain-wall Ising model, N_CHAINS chains in parallel.

    beta follows a log-spaced schedule of ISING_STEPS values. The constraint strength
    P is held at ISING_P_MIN for the first ISING_N_CONST_P steps and then follows a
    log-spaced ramp up to ISING_P_MAX over the remaining steps. After every step the
    spins are decoded with spin_to_potts and scored with codon_energy.

    Args:
        key: JAX PRNG key; split once into an initialization key and a scan key.

    Returns:
        (final_codons, final_spins, usage, repeat): the decoded codon indices and the
        raw spins after the last step, plus the two energy terms recorded after every
        step, transposed so that the chain axis comes first.
    """
    betas = jnp.logspace(jnp.log10(ISING_BETA_MIN), jnp.log10(ISING_BETA_MAX), ISING_STEPS)
    # Constant-P prefix followed by the ramp; the two pieces together have ISING_STEPS entries.
    Ps = jnp.concatenate(
        [
            jnp.full(ISING_N_CONST_P, ISING_P_MIN),
            jnp.logspace(jnp.log10(ISING_P_MIN), jnp.log10(ISING_P_MAX), ISING_STEPS - ISING_N_CONST_P),
        ]
    )
    schedule = SamplingSchedule(n_warmup=ISING_SWEEPS_PER_STEP, n_samples=1, steps_per_sample=1)
    all_block = Block(dwc["spin_nodes"])

    def step(spins, step_input):
        # scan body: spins is the carry, step_input is one (key, beta, P) triple of the schedule.
        step_key, beta, P = step_input
        program = build_ising_program(beta, P)
        blocks = [spins[:, idx] for idx in dwc["block_indices"]]  # split into the 4 color groups
        chain_keys = jax.random.split(step_key, N_CHAINS)
        # As in the Potts anneal, [0][0] pulls the single observed block's single sample
        # out of sample_states' output — here the new spin vector.
        new_spins = jax.vmap(lambda k, b: sample_states(k, program, schedule, b, [], [all_block])[0][0])(
            chain_keys, blocks
        )
        # Score each chain in codon space: decode the spins first, then evaluate the energy.
        energies = jax.vmap(lambda s: codon_energy(spin_to_potts(s, dwc["pos_matrix"])))(new_spins)
        return new_spins, energies

    # Start from random valid codons, converted to thermometer spins.
    init_key, scan_key = jax.random.split(key)
    pos_keys = jax.random.split(init_key, L)
    init_codons = jax.vmap(lambda k, n: jax.random.randint(k, (N_CHAINS,), 0, n, dtype=jnp.uint8))(
        pos_keys, jnp.array(Ks)
    ).T
    init_spins = potts_to_spin(init_codons, dwc["pos_of_spin"], dwc["spin_pos_index"])

    final_spins, (usage, repeat) = jax.lax.scan(step, init_spins, (jax.random.split(scan_key, ISING_STEPS), betas, Ps))
    final_codons = spin_to_potts(final_spins, dwc["pos_matrix"])
    return final_codons, final_spins, usage.T, repeat.T

# Run the Ising anneal (same seed as the Potts run) and move the results to NumPy.
ising_codons, ising_spins, ising_usage, ising_repeat = anneal_ising(jax.random.key(SEED))
ising_codons, ising_spins = np.array(ising_codons), np.array(ising_spins)
ising_total = np.array(ising_usage + ising_repeat)  # total energy per chain and annealing step

# Chain with the lowest total energy at the last annealing step.
best_ising = int(np.argmin(ising_total[:, -1]))
print(
    f"final energy: {ising_total[:, -1].mean():.2f} +/- {ising_total[:, -1].std():.2f} "
    f"(mean over {N_CHAINS} chains)"
)
print(f"best energy found: {ising_total[best_ising, -1]:.2f}")

# Check that every final state is a valid thermometer (no leftover defects).
# Re-encode the decoded codons as thermometer spins; a chain is defect-free only when
# this matches its actual final spins at every spin.
expected = np.array(dwc["spin_pos_index"]) < ising_codons[:, np.array(dwc["pos_of_spin"])]
valid_fraction = (expected == ising_spins).all(axis=1).mean()
print(f"defect-free final states: {100 * valid_fraction:.1f}%")

final energy: 107.41 +/- 0.68 (mean over 512 chains)
best energy found: 106.37
defect-free final states: 100.0%

# Energy traces of the Ising anneal, drawn in a second color.
plot_convergence(ising_usage, ising_repeat, color="C1")

# Overlaid histograms of the final total energy of every chain, Potts vs. Ising.
plt.figure(figsize=(7, 4))
# Shared bin edges spanning both result sets, so the two histograms are directly comparable.
bins = np.linspace(
    min(potts_total[:, -1].min(), ising_total[:, -1].min()), max(potts_total[:, -1].max(), ising_total[:, -1].max()), 40
)
plt.hist(potts_total[:, -1], bins=bins, alpha=0.6, label=f"Potts ({L} categorical nodes)")
plt.hist(ising_total[:, -1], bins=bins, alpha=0.6, label=f"Ising ({n_spins} spins)")
plt.xlabel("final energy")
plt.ylabel("number of chains")
plt.legend()
plt.tight_layout()

print(f"Potts best: {potts_total[:, -1].min():.2f}    Ising best: {ising_total[:, -1].min():.2f}")

Potts best: 106.37    Ising best: 106.37

Codon Optimization with THRML

The pipeline at a glance

Optimization with energy-based models

The problem: choosing codons

The energy function

Problem settings

The genetic code and host codon usage

Turning the objective into arrays

Building the Potts model

Simulated annealing

From categorical to binary: the Ising model

Building and annealing the Ising model

Comparing the two models

Wrap-up