boris committed on
Commit
cdefdd0
1 Parent(s): 0f2cf98

feat(mega): switch to gelu

Browse files
tools/train/config/mega/config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "activation_dropout": 0.0,
3
- "activation_function": "swish",
4
  "attention_dropout": 0.0,
5
  "bos_token_id": 16385,
6
  "d_model": 2048,
 
1
  {
2
  "activation_dropout": 0.0,
3
+ "activation_function": "gelu",
4
  "attention_dropout": 0.0,
5
  "bos_token_id": 16385,
6
  "d_model": 2048,