Tuchuanhuhuhu committed
Commit 72e1ed6 · 1 Parent(s): 9c45970

Use tiktoken to count input tokens precisely

Files changed (1):
  1. utils.py +5 -4
utils.py CHANGED
@@ -51,7 +51,7 @@ def postprocess(
 def count_token(input_str):
     print("计算输入Token计数中……")
     encoding = tiktoken.encoding_for_model("gpt-3.5-turbo")
-    length = len(encoding.encode("tiktoken is great!"))
+    length = len(encoding.encode(input_str))
     print("计算完成!")
     return length
 
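Note on the first hunk: the old line tokenized the hardcoded sample string "tiktoken is great!", so count_token reported the same length for every input; the fix encodes the actual input_str. A minimal self-contained sketch of the corrected logic (assumes the tiktoken package is installed):

import tiktoken

def count_token(input_str):
    # Pick the tokenizer that matches the target chat model.
    encoding = tiktoken.encoding_for_model("gpt-3.5-turbo")
    # encode() returns a list of token IDs; its length is the token count.
    return len(encoding.encode(input_str))

print(count_token("tiktoken is great!"))  # 6 with the cl100k_base encoding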
@@ -138,7 +138,8 @@ def stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, prev
     history.append(construct_user(inputs))
     user_token_count = 0
     if len(previous_token_count) == 0:
-        user_token_count = count_token(inputs) + count_token(system_prompt)
+        system_prompt_token_count = count_token(system_prompt)
+        user_token_count = count_token(inputs) + system_prompt_token_count
     else:
         user_token_count = count_token(inputs)
     print(f"输入token计数: {user_token_count}")
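Note on the second hunk: the system prompt's tokens are charged only when previous_token_count is empty, i.e. on the first turn of a conversation; later turns count only the new user input. A sketch of that rule in isolation (input_token_count is a hypothetical helper name, not in the commit; count_token is the function above):

def input_token_count(inputs, system_prompt, previous_token_count):
    # First turn: the system prompt enters the context, so count it once.
    if len(previous_token_count) == 0:
        system_prompt_token_count = count_token(system_prompt)
        return count_token(inputs) + system_prompt_token_count
    # Later turns: only the new user input adds tokens.
    return count_token(inputs)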
@@ -200,7 +201,7 @@ def predict_all(openai_api_key, system_prompt, history, inputs, chatbot, previou
 
 
 def predict(openai_api_key, system_prompt, history, inputs, chatbot, token_count, top_p, temperature, stream=False, should_check_token_count = True): # repetition_penalty, top_k
-    print(colorama.Fore.BLUE + f"输入为:{inputs}" + colorama.Style.RESET_ALL)
+    print("输入为:" +colorama.Fore.BLUE + f"{inputs}" + colorama.Style.RESET_ALL)
     if stream:
         print("使用流式传输")
         iter = stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, token_count, top_p, temperature)
@@ -211,7 +212,7 @@ def predict(openai_api_key, system_prompt, history, inputs, chatbot, token_count
         chatbot, history, status_text, token_count = predict_all(openai_api_key, system_prompt, history, inputs, chatbot, token_count, top_p, temperature)
         yield chatbot, history, status_text, token_count
     print(f"传输完毕。当前token计数为{token_count}")
-    print(colorama.Fore.BLUE + f"回答为:{history[-1]['content']}" + colorama.Style.RESET_ALL)
+    print("回答为:" +colorama.Fore.BLUE + f"{history[-1]['content']}" + colorama.Style.RESET_ALL)
     if stream:
         max_token = max_token_streaming
     else:
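Note on the last two hunks: the label text moves outside the ANSI color codes, so only the interpolated value prints in blue while the label keeps the terminal's default color. A minimal sketch of the pattern (assumes colorama is installed; init() enables ANSI handling on Windows and is harmless elsewhere):

import colorama

colorama.init()
inputs = "Hello"
# Only the value between Fore.BLUE and Style.RESET_ALL is colored.
print("Input: " + colorama.Fore.BLUE + f"{inputs}" + colorama.Style.RESET_ALL)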