Showing
- output/pretrain/output_pretraining_llama_60m_c4_batch-size-256_galore8bit+lora_2025-04-17_18-51-10.csv 101 additions, 0 deletions...c4_batch-size-256_galore8bit+lora_2025-04-17_18-51-10.csv
- output/pretrain/output_pretraining_llama_60m_c4_batch-size-256_galore8bit_2025-04-17_12-52-31.csv 101 additions, 0 deletions..._60m_c4_batch-size-256_galore8bit_2025-04-17_12-52-31.csv
- output/pretrain/output_pretraining_llama_60m_c4_batch-size-256_galore_2025-04-17_09-58-04.csv 101 additions, 0 deletions...lama_60m_c4_batch-size-256_galore_2025-04-17_09-58-04.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_adamw+lomo_2025-04-21_11-22-09.csv 2 additions, 0 deletions...ama_1b_c4_batch-size-1_adamw+lomo_2025-04-21_11-22-09.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_adamw+lora+lomo_2025-04-21_11-35-11.csv 2 additions, 0 deletions...b_c4_batch-size-1_adamw+lora+lomo_2025-04-21_11-35-11.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_adamw+lora_2025-04-21_11-35-18.csv 2 additions, 0 deletions...ama_1b_c4_batch-size-1_adamw+lora_2025-04-21_11-35-18.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_adamw_2025-04-21_11-35-13.csv 2 additions, 0 deletions...ng_llama_1b_c4_batch-size-1_adamw_2025-04-21_11-35-13.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore+lomo_2025-04-21_11-43-06.csv 2 additions, 0 deletions...ma_1b_c4_batch-size-1_galore+lomo_2025-04-21_11-43-06.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore+lora+lomo_2025-04-21_11-44-13.csv 2 additions, 0 deletions..._c4_batch-size-1_galore+lora+lomo_2025-04-21_11-44-13.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore+lora_2025-04-21_11-44-51.csv 2 additions, 0 deletions...ma_1b_c4_batch-size-1_galore+lora_2025-04-21_11-44-51.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore8bit+lomo_2025-04-21_12-10-32.csv 2 additions, 0 deletions...b_c4_batch-size-1_galore8bit+lomo_2025-04-21_12-10-32.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore8bit+lora+lomo_2025-04-21_11-54-08.csv 2 additions, 0 deletions...batch-size-1_galore8bit+lora+lomo_2025-04-21_11-54-08.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore8bit+lora_2025-04-21_11-54-46.csv 2 additions, 0 deletions...b_c4_batch-size-1_galore8bit+lora_2025-04-21_11-54-46.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore8bit_2025-04-21_12-19-49.csv 2 additions, 0 deletions...ama_1b_c4_batch-size-1_galore8bit_2025-04-21_12-19-49.csv
- output/pretrain_memory/output_pretraining_llama_1b_c4_batch-size-1_galore_2025-04-21_11-53-14.csv 2 additions, 0 deletions...g_llama_1b_c4_batch-size-1_galore_2025-04-21_11-53-14.csv
- output/pretrain_memory/output_pretraining_llama_350m_c4_batch-size-1_adamw+lomo_2025-04-19_10-48-25.csv 2 additions, 0 deletions...a_350m_c4_batch-size-1_adamw+lomo_2025-04-19_10-48-25.csv
- output/pretrain_memory/output_pretraining_llama_350m_c4_batch-size-1_adamw+lora+lomo_2025-04-19_11-58-23.csv 2 additions, 0 deletions...m_c4_batch-size-1_adamw+lora+lomo_2025-04-19_11-58-23.csv
- output/pretrain_memory/output_pretraining_llama_350m_c4_batch-size-1_adamw+lora_2025-04-19_10-19-44.csv 2 additions, 0 deletions...a_350m_c4_batch-size-1_adamw+lora_2025-04-19_10-19-44.csv
- output/pretrain_memory/output_pretraining_llama_350m_c4_batch-size-1_adamw_2025-04-19_09-23-59.csv 2 additions, 0 deletions..._llama_350m_c4_batch-size-1_adamw_2025-04-19_09-23-59.csv
- output/pretrain_memory/output_pretraining_llama_350m_c4_batch-size-1_galore+lomo_2025-04-19_11-03-57.csv 2 additions, 0 deletions..._350m_c4_batch-size-1_galore+lomo_2025-04-19_11-03-57.csv
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.