From 6faa9716477fee7d573fcaec280af0cd507e2dc0 Mon Sep 17 00:00:00 2001 From: Filya Geikyan Date: Wed, 28 Aug 2024 15:34:08 +0400 Subject: [PATCH] aim is ready except for resuming part --- .ci/docker/requirements.txt | 1 + train_configs/chemlactica_125m.toml | 6 ++++-- train_configs/debug_model.toml | 4 ++-- train_configs/galactica_125m_hf_to_titan.toml | 6 ++++-- 4 files changed, 11 insertions(+), 6 deletions(-) diff --git a/.ci/docker/requirements.txt b/.ci/docker/requirements.txt index 06e953ff..69e9d89d 100644 --- a/.ci/docker/requirements.txt +++ b/.ci/docker/requirements.txt @@ -6,3 +6,4 @@ sentencepiece tiktoken blobfile tabulate +transformers \ No newline at end of file diff --git a/train_configs/chemlactica_125m.toml b/train_configs/chemlactica_125m.toml index 5f303f55..842946c3 100644 --- a/train_configs/chemlactica_125m.toml +++ b/train_configs/chemlactica_125m.toml @@ -15,8 +15,10 @@ save_memory_snapshot_folder = "memory_snapshot" [metrics] log_freq = 1 enable_color_printing = true -enable_tensorboard = true -save_tb_folder = "tb" +enable_aim = true +save_aim_folder = "aim" +#aim_hash = "c6b4d8b340f74287b82ef928" +#aim_experiment_name = "hello" [model] name = "opt" diff --git a/train_configs/debug_model.toml b/train_configs/debug_model.toml index 3eba5fef..fd2718d2 100644 --- a/train_configs/debug_model.toml +++ b/train_configs/debug_model.toml @@ -17,8 +17,8 @@ log_freq = 1 enable_color_printing = true enable_aim = true save_aim_folder = "aim" -aim_hash = "c6b4d8b340f74287b82ef928" -aim_experiment_name = "hello" +#aim_hash = "c6b4d8b340f74287b82ef928" +#aim_experiment_name = "hello" [model] name = "llama3" diff --git a/train_configs/galactica_125m_hf_to_titan.toml b/train_configs/galactica_125m_hf_to_titan.toml index 1318d4cf..f6e0a314 100644 --- a/train_configs/galactica_125m_hf_to_titan.toml +++ b/train_configs/galactica_125m_hf_to_titan.toml @@ -15,8 +15,10 @@ save_memory_snapshot_folder = "memory_snapshot" [metrics] log_freq = 1 enable_color_printing = true -enable_tensorboard = true -save_tb_folder = "tb" +enable_aim = true +save_aim_folder = "aim" +#aim_hash = "c6b4d8b340f74287b82ef928" +#aim_experiment_name = "hello" [model] name = "opt"