Commit a31a765 by numen-tech
Parent(s): 2ea4e60

Update model

Files changed:
- ndarray-cache.json (+1, -1)
- private-llm-config.json (+5, -3)
- tokenizer.json (+0, -0)
ndarray-cache.json CHANGED
@@ -2,7 +2,7 @@
   "metadata": {
     "ParamSize": 325,
     "ParamBytes": 3734421760.0,
-    "BitsPerParam":
+    "BitsPerParam": 3.0339086581997106
   },
   "records": [
     {
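The updated "BitsPerParam" value can be sanity-checked against the rest of the cache file. A minimal sketch, assuming the MLC-LLM-style layout in which the top-level "records" list holds weight shards whose nested "records" entries carry per-tensor "shape" and "nbytes" (those field names are an assumption, not shown in this diff):

import json
import math

# Recompute BitsPerParam = total bytes * 8 / total number of weight elements.
with open("ndarray-cache.json") as f:
    cache = json.load(f)

total_bytes = 0
total_elements = 0
for shard in cache["records"]:          # one entry per weight shard file (assumed layout)
    for tensor in shard["records"]:     # per-tensor metadata (assumed layout)
        total_bytes += tensor["nbytes"]
        total_elements += math.prod(tensor["shape"])

print("ParamBytes:", float(total_bytes))
print("BitsPerParam:", total_bytes * 8 / total_elements)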
private-llm-config.json CHANGED
@@ -22,11 +22,12 @@
   "prefill_chunk_size": 128,
   "attention_sink_size": 4,
   "tensor_parallel_shards": 1,
-  "max_batch_size": 80,
   "mean_gen_len": 128,
   "max_gen_len": 512,
   "shift_fill_factor": 0.3,
   "temperature": 0.7,
+  "presence_penalty": 0.0,
+  "frequency_penalty": 0.0,
   "repetition_penalty": 1.0,
   "top_p": 0.95,
   "conv_template": "openchat3.5",
@@ -36,7 +37,8 @@
   "tokenizer_files": [
     "tokenizer.model",
     "added_tokens.json",
-    "tokenizer_config.json"
+    "tokenizer_config.json",
+    "tokenizer.json"
   ],
   "version": "0.1.0"
-}
+}
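The config gains OpenAI-style "presence_penalty" and "frequency_penalty" fields alongside the existing "repetition_penalty". A minimal sketch of how such penalties are conventionally applied to next-token logits; whether this runtime uses exactly this formula is an assumption:

from collections import Counter

def apply_penalties(logits, generated_ids,
                    presence_penalty=0.0,
                    frequency_penalty=0.0,
                    repetition_penalty=1.0):
    """Return penalized logits for tokens that already appeared in the output."""
    counts = Counter(generated_ids)
    out = list(logits)
    for token_id, count in counts.items():
        # Flat penalty for having appeared at all, plus a count-scaled penalty.
        out[token_id] -= presence_penalty + frequency_penalty * count
        # Classic repetition penalty: shrink positive logits, amplify negative ones.
        if out[token_id] > 0:
            out[token_id] /= repetition_penalty
        else:
            out[token_id] *= repetition_penalty
    return out

With both new fields defaulting to 0.0 and repetition_penalty at 1.0, the added keys leave sampling behavior unchanged until a caller overrides them.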
tokenizer.json ADDED
The diff for this file is too large to render.
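The newly added tokenizer.json is typically the serialized Hugging Face tokenizers format, now also listed in "tokenizer_files" above. A minimal sketch of loading it directly with the tokenizers library, assuming the file sits next to the config files; the sample text is illustrative:

from tokenizers import Tokenizer

tok = Tokenizer.from_file("tokenizer.json")
enc = tok.encode("Hello, world!")
print(enc.ids)
print(enc.tokens)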