Devops-hestabit
/

mixtral-instruct-trt

Model card · Files and versions · Community

Devops-hestabit committed on Jul 16, 2024

Commit

4c71db6

verified ·

1 Parent(s): 88372d7

Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

postprocessing/1/__pycache__/model.cpython-310.pyc +0 -0
postprocessing/config.pbtxt +1 -1
preprocessing/1/__pycache__/model.cpython-310.pyc +0 -0
preprocessing/config.pbtxt +1 -1
tensorrt_llm/1/config.json +1 -1
tensorrt_llm/1/rank1.engine +2 -2
tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc +0 -0
tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc +0 -0
tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc +0 -0

postprocessing/1/__pycache__/model.cpython-310.pyc CHANGED Viewed

Binary files a/postprocessing/1/__pycache__/model.cpython-310.pyc and b/postprocessing/1/__pycache__/model.cpython-310.pyc differ

postprocessing/config.pbtxt CHANGED Viewed

@@ -101,7 +101,7 @@ parameters {
 parameters {
   key: "skip_special_tokens"
   value: {
-    string_value: "${skip_special_tokens}"
   }
 }

 parameters {
   key: "skip_special_tokens"
   value: {
+    string_value: "false"
   }
 }

preprocessing/1/__pycache__/model.cpython-310.pyc CHANGED Viewed

Binary files a/preprocessing/1/__pycache__/model.cpython-310.pyc and b/preprocessing/1/__pycache__/model.cpython-310.pyc differ

preprocessing/config.pbtxt CHANGED Viewed

@@ -144,7 +144,7 @@ parameters {
 parameters {
   key: "add_special_tokens"
   value: {
-    string_value: "${add_special_tokens}"
   }
 }

 parameters {
   key: "add_special_tokens"
   value: {
+    string_value: "false"
   }
 }

tensorrt_llm/1/config.json CHANGED Viewed

@@ -129,7 +129,7 @@
             "context_fmha_fp32_acc": false,
             "paged_kv_cache": true,
             "remove_input_padding": true,
-            "use_custom_all_reduce": true,
             "reduce_fusion": false,
             "multi_block_mode": false,
             "enable_xqa": true,

             "context_fmha_fp32_acc": false,
             "paged_kv_cache": true,
             "remove_input_padding": true,
+            "use_custom_all_reduce": false,
             "reduce_fusion": false,
             "multi_block_mode": false,
             "enable_xqa": true,

tensorrt_llm/1/rank1.engine CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1397dbb8fc710907448a5c58da6c17004b8b8fa398780b1e593b383e6b150b6f
-size 46857271996

 version https://git-lfs.github.com/spec/v1
+oid sha256:cce3cc78a466ba00ef6b65fafa85a18c8e8c177b8445ece1ce1d8539e764fcbb
+size 46857273788

tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc CHANGED Viewed

Binary files a/tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc and b/tensorrt_llm_bls/1/__pycache__/model.cpython-310.pyc differ

tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc CHANGED Viewed

Binary files a/tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc and b/tensorrt_llm_bls/1/lib/__pycache__/decode.cpython-310.pyc differ

tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc CHANGED Viewed

Binary files a/tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc and b/tensorrt_llm_bls/1/lib/__pycache__/triton_decoder.cpython-310.pyc differ