@@ -839,6 +839,9 @@ def test_training_recipe_for_cpu(sagemaker_session):
839
839
container_log_level = '"logging.INFO"'
840
840
841
841
recipe_overrides = {
842
+ "run" : {
843
+ "results_dir" : "/opt/ml/model" ,
844
+ },
842
845
"exp_manager" : {
843
846
"explicit_log_dir" : "/opt/ml/output/tensorboard" ,
844
847
"checkpoint_dir" : "/opt/ml/checkpoints" ,
@@ -860,7 +863,7 @@ def test_training_recipe_for_cpu(sagemaker_session):
860
863
instance_type = INSTANCE_TYPE ,
861
864
base_job_name = "job" ,
862
865
container_log_level = container_log_level ,
863
- training_recipe = "llama/hf_llama3_8b_seq8192_gpu" ,
866
+ training_recipe = "training/ llama/hf_llama3_8b_seq8192_gpu" ,
864
867
recipe_overrides = recipe_overrides ,
865
868
)
866
869
@@ -877,6 +880,9 @@ def test_training_recipe_for_gpu(sagemaker_session, recipe, model):
877
880
container_log_level = '"logging.INFO"'
878
881
879
882
recipe_overrides = {
883
+ "run" : {
884
+ "results_dir" : "/opt/ml/model" ,
885
+ },
880
886
"exp_manager" : {
881
887
"explicit_log_dir" : "/opt/ml/output" ,
882
888
"checkpoint_dir" : "/opt/ml/checkpoints" ,
@@ -896,7 +902,7 @@ def test_training_recipe_for_gpu(sagemaker_session, recipe, model):
896
902
instance_type = INSTANCE_TYPE_GPU ,
897
903
base_job_name = "job" ,
898
904
container_log_level = container_log_level ,
899
- training_recipe = f"{ model } /{ recipe } " ,
905
+ training_recipe = f"training/ { model } /{ recipe } " ,
900
906
recipe_overrides = recipe_overrides ,
901
907
)
902
908
@@ -922,6 +928,9 @@ def test_training_recipe_with_override(sagemaker_session):
922
928
container_log_level = '"logging.INFO"'
923
929
924
930
recipe_overrides = {
931
+ "run" : {
932
+ "results_dir" : "/opt/ml/model" ,
933
+ },
925
934
"exp_manager" : {
926
935
"explicit_log_dir" : "/opt/ml/output" ,
927
936
"checkpoint_dir" : "/opt/ml/checkpoints" ,
@@ -943,7 +952,7 @@ def test_training_recipe_with_override(sagemaker_session):
943
952
instance_type = INSTANCE_TYPE_GPU ,
944
953
base_job_name = "job" ,
945
954
container_log_level = container_log_level ,
946
- training_recipe = "llama/hf_llama3_8b_seq8192_gpu" ,
955
+ training_recipe = "training/ llama/hf_llama3_8b_seq8192_gpu" ,
947
956
recipe_overrides = recipe_overrides ,
948
957
)
949
958
@@ -956,6 +965,9 @@ def test_training_recipe_for_trainium(sagemaker_session):
956
965
container_log_level = '"logging.INFO"'
957
966
958
967
recipe_overrides = {
968
+ "run" : {
969
+ "results_dir" : "/opt/ml/model" ,
970
+ },
959
971
"exp_manager" : {
960
972
"explicit_log_dir" : "/opt/ml/output" ,
961
973
},
0 commit comments