Experiment 1.2: MLP Autoencoder with 2D Bottleneck

This is an experiment in squashing higher-dimensional data into a lower-dimensional embedding space. We'll start with color: RGB values (3 dimensions), each ranging over $[0, 1]$.

We want to see if this compression forces the model to learn a meaningful representation of the color data. Specifically, since our input data primarily varies by hue (we'll use bright, saturated colors), we hypothesize that the 2D bottleneck will naturally arrange these colors into a structure resembling the familiar color wheel. This is a basic test of whether we can induce desired structures in latent space simply through architectural constraints.

Training Data Setup

We'll use the ColorCube tools developed previously. For this experiment, we want data that emphasizes the hue dimension. We'll generate colors with high saturation (S=1) and high value (V=0.9 and 1.0) across a range of hues. We'll also hold out a slice of hues (between teal and blue) to see if the model leaves a corresponding gap in its learned representation, which would indicate it's not just memorizing but actually structuring the space based on the input distribution.

import numpy as np
from ex_color.data.color import hues
from ex_color.data.color_cube import ColorCube
from ex_color.data.cyclic import arange_cyclic, isbetween_cyclic
from ex_color.vis import plot_colors

all_hues = arange_cyclic(step_size=1 / 360)

cube = ColorCube.from_hsv(
    h=all_hues[~isbetween_cyclic(all_hues, hues.teal, hues.blue)],
    # h=all_hues,
    s=np.array([1]),
    v=np.array([0.9, 1]),
)
plot_colors(cube.permute('svh'))
(Figure: the training colors, covering the full hue range except the held-out teal-to-blue slice.)
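
For reference, the training set we'll feed to the model is just this grid flattened to one RGB row per color. A quick sanity check on its size and range (an illustrative cell, not part of the original run):

rgb = cube.rgb_grid.reshape(-1, 3)
print(rgb.shape)             # (hues × saturations × values, 3) — one row per color
print(rgb.min(), rgb.max())  # every component should lie in [0, 1]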

Model: Simple MLP Autoencoder

The model itself is straightforward: an encoder maps the 3D RGB input down to the 2D bottleneck, and a decoder maps it back up to 3D.

We also include an option to normalize the bottleneck vectors to unit length. This is inspired by observations in language models (e.g. nGPT, which constrains its hidden states to a hypersphere) and might encourage the points to distribute nicely on the surface of a circle (or hypersphere in higher dimensions). Let's try it with normalization enabled.
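
To make that constraint concrete, here's a toy example of the operation the model will apply to its bottleneck: dividing each vector by its norm projects it onto the unit circle, so only its direction survives.

import torch

v = torch.tensor([[3.0, 4.0], [0.1, 0.0]])
unit = v / (v.norm(dim=1, keepdim=True) + 1e-8)  # same epsilon trick as in the model below
print(unit)              # ≈ [[0.6, 0.8], [1.0, 0.0]]
print(unit.norm(dim=1))  # both rows now have length ≈ 1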

Model Definition and Training

Now, let's define the ColorMLP class and a simple training function. We'll use Mean Squared Error (MSE) loss, as is typical for autoencoders reconstructing continuous values.
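Concretely, with the default reduction, nn.MSELoss averages the squared error over every RGB component in the batch: for $N$ input colors $x_i$ and reconstructions $\hat{x}_i$, the loss is $\frac{1}{3N} \sum_{i=1}^{N} \lVert \hat{x}_i - x_i \rVert^2$.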

During training, we'll periodically capture the state of the bottleneck layer ("latents") to visualize how the representation evolves.

import torch
import torch.nn as nn
import numpy as np


class ColorMLP(nn.Module):
    def __init__(self, normalize_bottleneck=False):
        super().__init__()
        # RGB input (3D) → hidden layer → 2D bottleneck → hidden layer → RGB output
        self.encoder = nn.Sequential(
            nn.Linear(3, 16),
            nn.ReLU(),
            nn.Linear(16, 2),  # Our critical 2D bottleneck!
        )

        self.decoder = nn.Sequential(
            nn.Linear(2, 16),
            nn.ReLU(),
            nn.Linear(16, 3),
            nn.Sigmoid(),  # Keep RGB values in [0,1]
        )

        self.normalize = normalize_bottleneck

    def forward(self, x):
        # Get our bottleneck representation
        bottleneck = self.encoder(x)

        # Optionally normalize to unit vectors (like nGPT)
        if self.normalize:
            norm = torch.norm(bottleneck, dim=1, keepdim=True)
            bottleneck = bottleneck / (norm + 1e-8)  # Avoid division by zero

        # Decode back to RGB
        output = self.decoder(bottleneck)
        return output, bottleneck


def train_color_model(model, data: torch.Tensor, epochs=500):
    from torch import optim
    from tqdm import tqdm

    optimizer = optim.Adam(model.parameters(), lr=0.001)
    criterion = nn.MSELoss()

    # Store bottleneck values for visualization
    bottleneck_history = []

    with tqdm(total=epochs) as pbar:
        for epoch in range(epochs):
            pbar.update(1)
            optimizer.zero_grad()

            # Forward pass
            outputs, _latents = model(data)
            loss = criterion(outputs, data)  # Autoencoder loss

            # Backward pass
            loss.backward()
            optimizer.step()

            pbar.set_postfix(loss=loss.item())
            if epoch % 50 == 0 or epoch == epochs - 1:
                # Snapshot the bottleneck representation of the whole training set
                with torch.no_grad():
                    _, latents = model(data)
                    bottleneck_history.append(latents.clone())

    return bottleneck_history


model = ColorMLP(normalize_bottleneck=True)
train_data = torch.tensor(cube.rgb_grid.reshape(-1, 3), dtype=torch.float32)
history = train_color_model(model, train_data, epochs=500)
100%|██████████| 500/500 [00:01<00:00, 441.27it/s, loss=0.0162]

Let's do a quick sanity check on the shapes and values of the final bottleneck representation and the input data.

print(history[-1][:3])
print(train_data[:3])
tensor([[ 0.7351, -0.6779],
        [ 0.7187, -0.6953],
        [ 0.7475, -0.6643]])
tensor([[0.9000, 0.0000, 0.0000],
        [1.0000, 0.0000, 0.0000],
        [0.9000, 0.0150, 0.0000]])
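
We can also push a single color through the trained model to see both halves working together. The exact numbers vary from run to run, so this is illustrative rather than a recorded output:

with torch.no_grad():
    red = torch.tensor([[1.0, 0.0, 0.0]])  # pure red, as RGB
    reconstruction, latent = model(red)

print(latent)          # a 2D point on (approximately) the unit circle
print(reconstruction)  # should be close to the input RGB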

Visualizing the Bottleneck Representation

So, did forcing the bright, saturated RGB values through the 2D bottleneck cause the model to rediscover the color wheel?

Let's create a scatter plot of the final 2D bottleneck vectors, coloring each point by its original RGB value. If our hypothesis holds, we should see a circular arrangement of colors, ordered according to the hue spectrum.

import matplotlib.pyplot as plt

# Get the final bottleneck representations
final_bottleneck = history[-1]

# Convert tensors to numpy arrays for plotting
bottleneck_np = final_bottleneck.detach().numpy()
colors_np = train_data.numpy()

# Create a scatter plot with points colored by their RGB values
plt.figure(figsize=(5, 5))
plt.scatter(bottleneck_np[:, 0], bottleneck_np[:, 1], c=colors_np, s=10, alpha=0.8)

plt.title('Color Space Embedding in 2D Bottleneck')
plt.xlabel('Dimension 1')
plt.ylabel('Dimension 2')
plt.grid(alpha=0.3)

plt.tight_layout()
plt.show()

# Let's also analyze the shape of the distribution
print(f'Bottleneck shape: {bottleneck_np.shape}')
print(f'Range - X: [{bottleneck_np[:, 0].min():.4f}, {bottleneck_np[:, 0].max():.4f}]')
print(f'Range - Y: [{bottleneck_np[:, 1].min():.4f}, {bottleneck_np[:, 1].max():.4f}]')
(Figure: scatter plot of the 2D bottleneck, each point colored by its original RGB value; the points form a hue-ordered ring with a gap between teal and blue.)
Bottleneck shape: (538, 2)
Range - X: [-0.9559, 1.0000]
Range - Y: [-1.0000, 1.0000]

Indeed, the model clearly learned a circular representation very similar to the standard color wheel! The colors are arranged in the correct order by hue. Notice the gap between teal and blue – this corresponds to the hue range we excluded from the training data. This is some evidence that the model is learning a structured representation of hue.

The orientation of the wheel varies with each training run (due to random initialization), but the relative arrangement of colors and the gap are consistent. The normalization we applied likely helped achieve this clean circular shape.
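
As a rough check that the arrangement really tracks hue (rather than merely looking circular), we can plot each training color's hue against the angle of its bottleneck vector. Up to a rotation, a possible reflection, and one wrap-around, the relationship should be monotonic. A minimal sketch, recovering hue from the RGB values with matplotlib:

from matplotlib.colors import rgb_to_hsv

# Hue of each training color, recovered from its RGB value (in turns, 0..1)
hue_np = rgb_to_hsv(colors_np)[:, 0]

# Angle of each bottleneck point around the origin, also expressed in turns
angle_np = (np.arctan2(bottleneck_np[:, 1], bottleneck_np[:, 0]) / (2 * np.pi)) % 1.0

plt.figure(figsize=(5, 3))
plt.scatter(hue_np, angle_np, c=colors_np, s=10)
plt.xlabel('Hue (turns)')
plt.ylabel('Bottleneck angle (turns)')
plt.title('Hue vs. bottleneck angle')
plt.tight_layout()
plt.show()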

Next steps: This worked well for hue, but our data only included fully saturated, bright colors. What happens if we introduce variations in saturation and value? A 2D bottleneck is likely insufficient. In the next experiment (Experiment 1.3), we'll try:

  1. Using a 3D bottleneck.
  2. Introducing curriculum learning: start by training on hues (like here), then gradually introduce colors with varying saturation and value.

Hopefully, the hues will keep the positions they have here, with similar (new) colors placed nearby.