InternLM-Math
committed on
Commit
•
3e7e1f3
1
Parent(s):
8fd7d8a
Update configuration_internlm.py
Browse files
configuration_internlm.py
CHANGED
@@ -108,6 +108,7 @@ class InternLMConfig(PretrainedConfig):
|
|
108 |
bias=True,
|
109 |
rope_theta=10000,
|
110 |
rope_scaling=None,
|
|
|
111 |
**kwargs,
|
112 |
):
|
113 |
self.vocab_size = vocab_size
|
@@ -129,6 +130,10 @@ class InternLMConfig(PretrainedConfig):
|
|
129 |
self.rope_theta = rope_theta
|
130 |
self.rope_scaling = rope_scaling
|
131 |
self._rope_scaling_validation()
|
|
|
|
|
|
|
|
|
132 |
super().__init__(
|
133 |
pad_token_id=pad_token_id,
|
134 |
bos_token_id=bos_token_id,
|
|
|
108 |
bias=True,
|
109 |
rope_theta=10000,
|
110 |
rope_scaling=None,
|
111 |
+
attn_implementation="eager",
|
112 |
**kwargs,
|
113 |
):
|
114 |
self.vocab_size = vocab_size
|
|
|
130 |
self.rope_theta = rope_theta
|
131 |
self.rope_scaling = rope_scaling
|
132 |
self._rope_scaling_validation()
|
133 |
+
|
134 |
+
self.attn_implementation = attn_implementation
|
135 |
+
if self.attn_implementation is None:
|
136 |
+
self.attn_implementation = "eager"
|
137 |
super().__init__(
|
138 |
pad_token_id=pad_token_id,
|
139 |
bos_token_id=bos_token_id,
|