diff --git a/gpt-2/config/train_gpt2_default.py b/gpt-2/config/train_gpt2_default.py index b08e147..ee4df45 100644 --- a/gpt-2/config/train_gpt2_default.py +++ b/gpt-2/config/train_gpt2_default.py @@ -24,4 +24,4 @@ # weight decay weight_decay = 1e-1 -model_type = "gpt2_attn_bias" \ No newline at end of file +model_type = "gpt2_default"