Update README.md
Browse files
README.md
CHANGED
@@ -87,8 +87,10 @@ set_seed(42)
|
|
87 |
```python
|
88 |
gpt_web_bg("По професия той е ")
|
89 |
|
|
|
90 |
```
|
91 |
[{'generated_text': 'По професия той е строителен работник, който е �'}]
|
|
|
92 |
|
93 |
|
94 |
|
@@ -103,7 +105,39 @@ gpt_web_bg("По професия той е ")
|
|
103 |
|
104 |
<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
|
105 |
|
106 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
107 |
|
108 |
#### Preprocessing [optional]
|
109 |
|
|
|
87 |
```python
|
88 |
gpt_web_bg("По професия той е ")
|
89 |
|
90 |
+
```
|
91 |
```
|
92 |
[{'generated_text': 'По професия той е строителен работник, който е �'}]
|
93 |
+
```
|
94 |
|
95 |
|
96 |
|
|
|
105 |
|
106 |
<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
|
107 |
|
108 |
+
```json
|
109 |
+
{
|
110 |
+
"activation_function": "gelu_new",
|
111 |
+
"architectures": [
|
112 |
+
"GPT2LMHeadModel"
|
113 |
+
],
|
114 |
+
"attn_pdrop": 0.1,
|
115 |
+
"bos_token_id": 50256,
|
116 |
+
"embd_pdrop": 0.1,
|
117 |
+
"eos_token_id": 50256,
|
118 |
+
"initializer_range": 0.02,
|
119 |
+
"layer_norm_epsilon": 1e-05,
|
120 |
+
"model_type": "gpt2",
|
121 |
+
"n_embd": 768,
|
122 |
+
"n_head": 12,
|
123 |
+
"n_inner": null,
|
124 |
+
"n_layer": 12,
|
125 |
+
"n_positions": 1024,
|
126 |
+
"reorder_and_upcast_attn": false,
|
127 |
+
"resid_pdrop": 0.1,
|
128 |
+
"scale_attn_by_inverse_layer_idx": false,
|
129 |
+
"scale_attn_weights": true,
|
130 |
+
"summary_activation": null,
|
131 |
+
"summary_first_dropout": 0.1,
|
132 |
+
"summary_proj_to_labels": true,
|
133 |
+
"summary_type": "cls_index",
|
134 |
+
"summary_use_proj": true,
|
135 |
+
"torch_dtype": "float32",
|
136 |
+
"transformers_version": "4.22.0.dev0",
|
137 |
+
"use_cache": true,
|
138 |
+
"vocab_size": 50257
|
139 |
+
}
|
140 |
+
```
|
141 |
|
142 |
#### Preprocessing [optional]
|
143 |
|