[s2s] distill: --normalize_hidden --supervise_forward (#6834)
This commit is contained in:
@@ -31,6 +31,8 @@ logging.basicConfig(level=logging.DEBUG)
|
||||
logger = logging.getLogger()
|
||||
CUDA_AVAILABLE = torch.cuda.is_available()
|
||||
CHEAP_ARGS = {
|
||||
"supervise_forward": True,
|
||||
"normalize_hidden": True,
|
||||
"label_smoothing": 0.2,
|
||||
"eval_beams": 1,
|
||||
"val_metric": "loss",
|
||||
|
||||
Reference in New Issue
Block a user