Makefile: add all-mpnet-base-v2 train/eval targets; lengthen the frozen-layer run.

What this patch changes in the Makefile:
  1. train_frozen_layers now runs train.py with --epochs 50 (was 10) and
     additionally passes --num-workers 0.
  2. Adds train_mpnet / eval_mpnet: train.py is invoked with
     --model-name sentence-transformers/all-mpnet-base-v2 and --freeze-encoder,
     writing to output_mpnet; eval.py reads that path and writes
     predictions_mpnet.csv plus two PNGs under plots/.
  3. Adds train_mpnet_finetune / eval_mpnet_finetune: same model name, but with
     --freeze-transformer-layers 10 and --batch-size 32, using output_mpnet_ft
     and the *_mpnet_ft output files.
  4. Appends the four new target names to .PHONY.

Every recipe line must begin with a hard TAB after the diff marker column.
The multi-line recipes rely on backslash-newline continuation inside the
single-quoted bash -c string.

NOTE(review): this patch was reconstructed from a copy whose newlines and tabs
had been collapsed into spaces. Hunk line counts match the hunk headers, but
the exact whitespace of the continuation lines is a best guess, so the blob
ids on the "index" line are carried over unverified -- confirm against the
repository before relying on them.

diff --git a/Makefile b/Makefile
index 4b52ed8..b781e68 100644
--- a/Makefile
+++ b/Makefile
@@ -24,12 +24,49 @@ eval_frozen_encoder: eval.py training.csv
 
 train_frozen_layers: train.py training.csv
 	@echo "Training coordinate regressor with first transformer layers frozen..."
-	@bash -c 'source .venv/bin/activate && python train.py --output-path output_frozen_layers --freeze-transformer-layers 4 --epochs 10'
+	@bash -c 'source .venv/bin/activate && python train.py --output-path output_frozen_layers --freeze-transformer-layers 4 --epochs 50 --num-workers 0'
 
 eval_frozen_layers: eval.py training.csv
 	@echo "Evaluating frozen-layer coordinate regressor..."
 	@bash -c 'source .venv/bin/activate && python eval.py --model-path output_frozen_layers --output-file predictions_frozen_layers.csv --plot-file plots/prediction_map_frozen_layers.png --scatter-plot-file plots/predicted_vs_actual_frozen_layers.png'
 
+train_mpnet: train.py training.csv
+	@echo "Training with all-mpnet-base-v2 (encoder fully frozen, head only)..."
+	@bash -c 'source .venv/bin/activate && python train.py \
+		--model-name sentence-transformers/all-mpnet-base-v2 \
+		--output-path output_mpnet \
+		--freeze-encoder \
+		--hidden-dim 512 \
+		--head-learning-rate 1e-2 \
+		--epochs 50'
+
+train_mpnet_finetune: train.py training.csv
+	@echo "Training with all-mpnet-base-v2 (frozen first 10 of 12 layers)..."
+	@bash -c 'source .venv/bin/activate && python train.py \
+		--model-name sentence-transformers/all-mpnet-base-v2 \
+		--output-path output_mpnet_ft \
+		--freeze-transformer-layers 10 \
+		--hidden-dim 512 \
+		--head-learning-rate 1e-2 \
+		--batch-size 32 \
+		--epochs 50'
+
+eval_mpnet_finetune: eval.py training.csv
+	@echo "Evaluating all-mpnet-base-v2 fine-tuned coordinate regressor..."
+	@bash -c 'source .venv/bin/activate && python eval.py \
+		--model-path output_mpnet_ft \
+		--output-file predictions_mpnet_ft.csv \
+		--plot-file plots/prediction_map_mpnet_ft.png \
+		--scatter-plot-file plots/predicted_vs_actual_mpnet_ft.png'
+
+eval_mpnet: eval.py training.csv
+	@echo "Evaluating all-mpnet-base-v2 coordinate regressor..."
+	@bash -c 'source .venv/bin/activate && python eval.py \
+		--model-path output_mpnet \
+		--output-file predictions_mpnet.csv \
+		--plot-file plots/prediction_map_mpnet.png \
+		--scatter-plot-file plots/predicted_vs_actual_mpnet.png'
+
 lint:
 	@echo "Auto-linting files and performing final style checks..."
 	@bash -c 'source .venv/bin/activate && isort --profile=black *.py'
@@ -41,4 +78,4 @@ clean:
 	@rm -rf output/
 	@rm -f training.csv predictions.csv
 
-.PHONY: data train eval train_frozen_encoder eval_frozen_encoder train_frozen_layers eval_frozen_layers lint clean all
+.PHONY: data train eval train_frozen_encoder eval_frozen_encoder train_frozen_layers eval_frozen_layers train_mpnet eval_mpnet train_mpnet_finetune eval_mpnet_finetune lint clean all