Convert the weights of all 24 encoder layers instead of only 12
Browse files
- convert.py +1 -1
convert.py
CHANGED
@@ -21,7 +21,7 @@ import torch
|
|
21 |
from paddle import fluid
|
22 |
import numpy as np
|
23 |
|
24 |
-
def build_params_map(attention_num=12):
|
25 |
"""
|
26 |
build params map from paddle-paddle's ERNIE to transformer's BERT
|
27 |
:return:
|
|
|
21 |
from paddle import fluid
|
22 |
import numpy as np
|
23 |
|
24 |
+
def build_params_map(attention_num=24):
|
25 |
"""
|
26 |
build params map from paddle-paddle's ERNIE to transformer's BERT
|
27 |
:return:
|