# colors/model.py

import pytorch_lightning as pl
import torch
import torch.nn as nn
from torch.optim.lr_scheduler import ReduceLROnPlateau

from losses import calculate_separation_loss, preservation_loss  # noqa: F401
from utils import PURE_HSV, PURE_RGB

# class ColorTransformerModel(pl.LightningModule):
# def __init__(self, params):
#     super().__init__()
#     self.save_hyperparameters(params)

#     # Model layers
#     self.layers = nn.Sequential(
#         nn.Linear(5, 128, bias=False),
#         nn.Linear(128, 3, bias=False),
#         nn.ReLU(),
#         nn.Linear(3, 64, bias=False),
#         nn.Linear(64, 128, bias=False),
#         nn.Linear(128, 256, bias=False),
#         nn.Linear(256, 128, bias=False),
#         nn.ReLU(),
#         nn.Linear(128, 1, bias=False),
#     )

# def forward(self, x):
#     x = self.layers(x)
#     x = (torch.sin(x) + 1) / 2
#     return x

# class ColorTransformerModel(pl.LightningModule):
#     def __init__(self, params):
#         super().__init__()
#         self.save_hyperparameters(params)

#         # Embedding layer to expand the input dimensions
#         self.embedding = nn.Linear(3, 128, bias=False)

#         # Transformer encoder-decoder
#         encoder = nn.TransformerEncoderLayer(
#             d_model=128, nhead=4, dim_feedforward=512, dropout=0.3
#         )
#         self.transformer_encoder = nn.TransformerEncoder(
#             encoder, num_layers=3
#         )
#         # lower dimensionality decoder
#         decoder = nn.TransformerDecoderLayer(
#             d_model=128, nhead=4, dim_feedforward=512, dropout=0.3
#         )
#         self.transformer_decoder = nn.TransformerDecoder(
#             decoder, num_layers=3
#         )

#         # Final linear layer to map back to 1D space
#         self.final_layer = nn.Linear(128, 1, bias=False)

#     def forward(self, x):
#         # Embedding the input
#         x = self.embedding(x)

#         # Adjusting the shape for the transformer
#         x = x.unsqueeze(1)  # Adding a fake sequence dimension

#         # Passing through the transformer
#         x = self.transformer_encoder(x)

#         # Passing through the decoder
#         x = self.transformer_decoder(x, memory=x)

#         # Reshape back to original shape
#         x = x.squeeze(1)

#         # Final linear layer
#         x = self.final_layer(x)

#         # Apply sigmoid activation to ensure output is in (0, 1)
#         # x = torch.sigmoid(x)
#         x = (torch.sin(x) + 1) / 2
#         return x


class ColorTransformerModel(pl.LightningModule):
    """Small tanh MLP that maps a 5-feature input to one scalar in (0, 1).

    Despite the class name, the active architecture is a plain feed-forward
    network (Linear/Tanh stack) followed by a sigmoid.

    Hyperparameters read from ``self.hparams`` (populated from ``params``):
        width: Size of the second hidden layer.
        alpha: Weight of the anchor loss term (``s_loss``) in the total loss.
        learning_rate: Initial learning rate handed to SGD.
    """

    # Key under which the total loss is logged. The LR scheduler monitors the
    # same key, so both places must agree -- keep it in one spot.
    _MONITORED_METRIC = "hp_metric"

    def __init__(self, params):
        """Store the hyperparameters and build the network.

        Args:
            params: Hyperparameter container forwarded to
                ``save_hyperparameters``; must provide ``width``, ``alpha``
                and ``learning_rate``.
        """
        super().__init__()
        self.save_hyperparameters(params)

        # An earlier variant derived two extra scalar features from a
        # 3-feature input with small sub-networks (``a`` and ``b``) and
        # concatenated them to it (3 + 1 + 1 = 5). Those branches are
        # disabled, so ``network`` now consumes 5 features directly.
        # NOTE(review): training_step describes the inputs as RGB; confirm
        # that the dataset really yields 5 features per sample.
        self.network = nn.Sequential(
            nn.Linear(5, 64),
            nn.Tanh(),
            nn.Linear(64, self.hparams.width),
            nn.Tanh(),
            # 3-unit bottleneck before the scalar output.
            nn.Linear(self.hparams.width, 3),
            nn.Tanh(),
            nn.Linear(3, 1),
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Run ``x`` through the network and squash the result into (0, 1).

        Args:
            x: Input tensor whose last dimension has 5 features.

        Returns:
            Tensor with a last dimension of size 1 and values in (0, 1).
        """
        logits = self.network(x)
        # A circular mapping, (sin(x) + 1) / 2, was tried here previously;
        # sigmoid is the mapping currently in use.
        return torch.sigmoid(logits)

    def training_step(self, batch, batch_idx: int):
        """Compute and log the combined preservation loss for one batch.

        Args:
            batch: Pair ``(inputs, labels)``; only ``inputs`` is used.
            batch_idx: Index of the batch (unused).

        Returns:
            The total loss ``p_loss + alpha * s_loss``.
        """
        # Per the original note, the second item holds string labels; they do
        # not take part in the loss.
        inputs, _ = batch
        # Call the module (not ``.forward``) so registered hooks are honoured.
        outputs = self(inputs)

        # Preserve distance to pure R, G, B. This acts kind of like labeled
        # data: the pure colours are anchored to their known target outputs.
        s_loss = preservation_loss(
            inputs,
            outputs,
            target_inputs=PURE_RGB,
            target_outputs=PURE_HSV,
        )
        # Same loss with default targets (semantics defined in ``losses``).
        p_loss = preservation_loss(
            inputs,
            outputs,
        )

        loss = p_loss + self.hparams.alpha * s_loss
        self.log(self._MONITORED_METRIC, loss)
        self.log("p_loss", p_loss)
        self.log("s_loss", s_loss)
        return loss

    def configure_optimizers(self):
        """Set up SGD with a reduce-on-plateau learning-rate schedule.

        Returns:
            Dict in the Lightning optimizer/scheduler format. The scheduler
            monitors the total loss logged by ``training_step``.
        """
        optimizer = torch.optim.SGD(
            self.parameters(),
            lr=self.hparams.learning_rate,
        )
        # NOTE(review): ``verbose`` is deprecated in recent PyTorch releases;
        # kept here to preserve the existing console output.
        lr_scheduler = ReduceLROnPlateau(
            optimizer, mode="min", factor=0.05, patience=5, cooldown=10, verbose=True
        )
        return {
            "optimizer": optimizer,
            "lr_scheduler": {
                "scheduler": lr_scheduler,
                "monitor": self._MONITORED_METRIC,  # Must match the logged key
            },
        }
initial commit 2023-12-30 04:37:06 +00:00			`import pytorch_lightning as pl`
			`import torch`
			`import torch.nn as nn`
optimizations 2023-12-30 05:30:52 +00:00			`from torch.optim.lr_scheduler import ReduceLROnPlateau`
initial commit 2023-12-30 04:37:06 +00:00
another attempt 2024-01-16 04:37:22 +00:00			`from losses import calculate_separation_loss, preservation_loss # noqa: F401`
			`from utils import PURE_HSV, PURE_RGB`
chkpt 2023-12-30 05:13:50 +00:00
diff arch, optimizer 2024-01-14 06:04:19 +00:00			`# class ColorTransformerModel(pl.LightningModule):`
			`# def __init__(self, params):`
			`# super().__init__()`
			`# self.save_hyperparameters(params)`

			`# # Model layers`
			`# self.layers = nn.Sequential(`
			`# nn.Linear(5, 128, bias=False),`
			`# nn.Linear(128, 3, bias=False),`
			`# nn.ReLU(),`
			`# nn.Linear(3, 64, bias=False),`
			`# nn.Linear(64, 128, bias=False),`
			`# nn.Linear(128, 256, bias=False),`
			`# nn.Linear(256, 128, bias=False),`
			`# nn.ReLU(),`
			`# nn.Linear(128, 1, bias=False),`
			`# )`

			`# def forward(self, x):`
			`# x = self.layers(x)`
			`# x = (torch.sin(x) + 1) / 2`
			`# return x`

			`# class ColorTransformerModel(pl.LightningModule):`
			`# def __init__(self, params):`
			`# super().__init__()`
			`# self.save_hyperparameters(params)`

			`# # Embedding layer to expand the input dimensions`
			`# self.embedding = nn.Linear(3, 128, bias=False)`

			`# # Transformer encoder-decoder`
			`# encoder = nn.TransformerEncoderLayer(`
			`# d_model=128, nhead=4, dim_feedforward=512, dropout=0.3`
			`# )`
			`# self.transformer_encoder = nn.TransformerEncoder(`
			`# encoder, num_layers=3`
			`# )`
			`# # lower dimensionality decoder`
			`# decoder = nn.TransformerDecoderLayer(`
			`# d_model=128, nhead=4, dim_feedforward=512, dropout=0.3`
			`# )`
			`# self.transformer_decoder = nn.TransformerDecoder(`
			`# decoder, num_layers=3`
			`# )`

			`# # Final linear layer to map back to 1D space`
			`# self.final_layer = nn.Linear(128, 1, bias=False)`

			`# def forward(self, x):`
			`# # Embedding the input`
			`# x = self.embedding(x)`

			`# # Adjusting the shape for the transformer`
			`# x = x.unsqueeze(1) # Adding a fake sequence dimension`

			`# # Passing through the transformer`
			`# x = self.transformer_encoder(x)`

			`# # Passing through the decoder`
			`# x = self.transformer_decoder(x, memory=x)`

			`# # Reshape back to original shape`
			`# x = x.squeeze(1)`

			`# # Final linear layer`
			`# x = self.final_layer(x)`

			`# # Apply sigmoid activation to ensure output is in (0, 1)`
			`# # x = torch.sigmoid(x)`
			`# x = (torch.sin(x) + 1) / 2`
			`# return x`

optimizations 2023-12-30 05:30:52 +00:00
initial commit 2023-12-30 04:37:06 +00:00			`class ColorTransformerModel(pl.LightningModule):`
this looks good 2023-12-31 06:17:15 +00:00			`def __init__(self, params):`
initial commit 2023-12-30 04:37:06 +00:00			`super().__init__()`
this looks good 2023-12-31 06:17:15 +00:00			`self.save_hyperparameters(params)`
another attempt 2024-01-16 04:37:22 +00:00			`# self.a = nn.Sequential(`
			`# nn.Linear(3, 3, bias=False),`
			`# nn.ReLU(),`
			`# nn.Linear(3, 3, bias=False),`
			`# nn.ReLU(),`
			`# nn.Linear(3, 1, bias=False),`
			`# nn.ReLU(),`
			`# )`
			`# self.b = nn.Sequential(`
			`# nn.Linear(3, 3, bias=False),`
			`# nn.ReLU(),`
			`# nn.Linear(3, 3, bias=False),`
			`# nn.ReLU(),`
			`# nn.Linear(3, 1, bias=False),`
			`# nn.ReLU(),`
			`# )`
diff arch, optimizer 2024-01-14 06:04:19 +00:00			`# Neural network layers`
			`self.network = nn.Sequential(`
another attempt 2024-01-16 04:37:22 +00:00			`nn.Linear(5, 64),`
			`nn.Tanh(),`
			`nn.Linear(64, self.hparams.width),`
			`nn.Tanh(),`
			`nn.Linear(self.hparams.width, 3),`
			`nn.Tanh(),`
			`nn.Linear(3, 1),`
optimizations 2023-12-30 05:30:52 +00:00			`)`
chkpt 2023-12-30 05:13:50 +00:00
initial commit 2023-12-30 04:37:06 +00:00			`def forward(self, x):`
diff arch, optimizer 2024-01-14 06:04:19 +00:00			`# Pass the input through the network`
another attempt 2024-01-16 04:37:22 +00:00			`# a = self.a(x)`
			`# b = self.b(x)`
			`# a = torch.sigmoid(a)`
			`# b = torch.sigmoid(b)`
			`# x = torch.cat([x, a, b], dim=-1)`
diff arch, optimizer 2024-01-14 06:04:19 +00:00			`x = self.network(x)`
			`# Circular mapping`
			`# x = (torch.sin(x) + 1) / 2`
			`x = torch.sigmoid(x)`
go back to simpler model 2023-12-30 06:35:19 +00:00			`return x`
chkpt 2023-12-30 05:13:50 +00:00
initial commit 2023-12-30 04:37:06 +00:00			`def training_step(self, batch, batch_idx):`
			`inputs, labels = batch # x are the RGB inputs, labels are the strings`
			`outputs = self.forward(inputs)`
another attempt 2024-01-16 04:37:22 +00:00			`# s_loss = calculate_separation_loss(model=self)`
			`# preserve distance to pure R, G, B. this acts kind of like labeled data.`
			`s_loss = preservation_loss(`
			`inputs,`
			`outputs,`
			`target_inputs=PURE_RGB,`
			`target_outputs=PURE_HSV,`
			`)`
this looks good 2023-12-31 06:17:15 +00:00			`p_loss = preservation_loss(`
initial commit 2023-12-30 04:37:06 +00:00			`inputs,`
			`outputs,`
			`)`
this looks good 2023-12-31 06:17:15 +00:00			`alpha = self.hparams.alpha`
slight refactors 2024-01-15 03:26:46 +00:00			`loss = p_loss + alpha * s_loss`
refactor loss functions 2024-01-14 03:11:49 +00:00			`self.log("hp_metric", loss)`
slight refactors 2024-01-15 03:26:46 +00:00			`self.log("p_loss", p_loss)`
			`self.log("s_loss", s_loss)`
initial commit 2023-12-30 04:37:06 +00:00			`return loss`

			`def configure_optimizers(self):`
diff arch, optimizer 2024-01-14 06:04:19 +00:00			`optimizer = torch.optim.SGD(`
			`self.parameters(),`
			`lr=self.hparams.learning_rate,`
go back to simpler model 2023-12-30 06:35:19 +00:00			`)`
			`lr_scheduler = ReduceLROnPlateau(`
use millions of colors 2024-01-15 19:18:28 +00:00			`optimizer, mode="min", factor=0.05, patience=5, cooldown=10, verbose=True`
go back to simpler model 2023-12-30 06:35:19 +00:00			`)`
optimizations 2023-12-30 05:30:52 +00:00			`return {`
go back to simpler model 2023-12-30 06:35:19 +00:00			`"optimizer": optimizer,`
			`"lr_scheduler": {`
			`"scheduler": lr_scheduler,`
slight refactors 2024-01-15 03:26:46 +00:00			`"monitor": "hp_metric", # Specify the metric to monitor`
go back to simpler model 2023-12-30 06:35:19 +00:00			`},`
			`}`