SageMaker: Fix sagemaker DDP & metric logs (#13181)
* Barrier -> barrier
* added logger for metrics
* removed stream handler in trainer
* moved handler
* removed streamhandler from trainer
* updated test image and instance type added datasets version to test
* Update tests/sagemaker/scripts/pytorch/requirements.txt

Co-authored-by: Stas Bekman <stas00@users.noreply.github.com>
Co-authored-by: Stas Bekman <stas00@users.noreply.github.com>
This commit is contained in:
@@ -27,21 +27,21 @@ if is_sagemaker_available():
|
||||
"framework": "pytorch",
|
||||
"script": "run_glue.py",
|
||||
"model_name_or_path": "distilbert-base-cased",
|
||||
- "instance_type": "ml.p3dn.24xlarge",
|
||||
+ "instance_type": "ml.p3.16xlarge",
|
||||
"results": {"train_runtime": 650, "eval_accuracy": 0.7, "eval_loss": 0.6},
|
||||
},
|
||||
{
|
||||
"framework": "pytorch",
|
||||
"script": "run_ddp.py",
|
||||
"model_name_or_path": "distilbert-base-cased",
|
||||
- "instance_type": "ml.p3dn.24xlarge",
|
||||
+ "instance_type": "ml.p3.16xlarge",
|
||||
"results": {"train_runtime": 600, "eval_accuracy": 0.7, "eval_loss": 0.6},
|
||||
},
|
||||
{
|
||||
"framework": "tensorflow",
|
||||
"script": "run_tf_dist.py",
|
||||
"model_name_or_path": "distilbert-base-cased",
|
||||
- "instance_type": "ml.p3dn.24xlarge",
|
||||
+ "instance_type": "ml.p3.16xlarge",
|
||||
"results": {"train_runtime": 600, "eval_accuracy": 0.6, "eval_loss": 0.7},
|
||||
},
|
||||
]
|
||||
|
||||
Reference in New Issue
Block a user