mehmetkeremturkcan committed on
Commit
695acf6
·
verified ·
1 Parent(s): 4eb5142

Upload 7 files

Browse files
input_encoder/README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: WinKawaks/vit-tiny-patch16-224
3
  library_name: peft
4
  ---
5
 
 
1
  ---
2
+ base_model: google/vit-base-patch16-224
3
  library_name: peft
4
  ---
5
 
input_encoder/adapter_config.json CHANGED
@@ -4,7 +4,7 @@
4
  "base_model_class": "ViTForImageClassification",
5
  "parent_library": "transformers.models.vit.modeling_vit"
6
  },
7
- "base_model_name_or_path": "WinKawaks/vit-tiny-patch16-224",
8
  "bias": "none",
9
  "eva_config": null,
10
  "exclude_modules": null,
 
4
  "base_model_class": "ViTForImageClassification",
5
  "parent_library": "transformers.models.vit.modeling_vit"
6
  },
7
+ "base_model_name_or_path": "google/vit-base-patch16-224",
8
  "bias": "none",
9
  "eva_config": null,
10
  "exclude_modules": null,
input_encoder/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:183292dcb45713e81163c0c16c880b20c4a99f2f1c2106fb756ae2de0377b368
3
- size 1779320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08bee08fef6e0f86bedf5c2839296129f0d332a7a73fdac29a07c2cb92d5d7ae
3
+ size 7087824
input_tokenizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b17e4c8096c3ccce8fe7040656dbea93041b7cddd30034ec425f9f4fd8deaf29
3
- size 1773080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f22680395c72b9e061d145dd6e2a474b32c29adb30e9e54edff2fb963d85fef
3
+ size 23615640
language_model/README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: mehmetkeremturkcan/SmollerLM2-100M-Instruct-sft
3
  library_name: peft
4
  ---
5
 
 
1
  ---
2
+ base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
3
  library_name: peft
4
  ---
5
 
language_model/adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "mehmetkeremturkcan/SmollerLM2-100M-Instruct-sft",
5
  "bias": "none",
6
  "eva_config": null,
7
  "exclude_modules": null,
@@ -23,13 +23,13 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "k_proj",
27
- "v_proj",
28
- "o_proj",
29
  "gate_proj",
 
 
30
  "q_proj",
31
  "up_proj",
32
- "down_proj"
 
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
5
  "bias": "none",
6
  "eva_config": null,
7
  "exclude_modules": null,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
 
26
  "gate_proj",
27
+ "k_proj",
28
+ "down_proj",
29
  "q_proj",
30
  "up_proj",
31
+ "o_proj",
32
+ "v_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
language_model/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38b9adbd9e29a5cdf932906c3d3d185f180934bbb83ebfff62f26b80bd371dad
3
- size 7281104
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edd68e64e83b499f8fa146fa4e46c33068fa385ac0309df9a7765e8dcce4b14d
3
+ size 36981072