Create app.py
app.py
ADDED
from huggingface_hub import InferenceClient

# HF Inference Endpoint parameters
endpoint_url = "https://YOUR_ENDPOINT.endpoints.huggingface.cloud"
hf_token = "hf_YOUR_TOKEN"

# streaming client
client = InferenceClient(endpoint_url, token=hf_token)

# generation parameters
gen_kwargs = dict(
    max_new_tokens=512,
    top_k=30,
    top_p=0.9,
    temperature=0.2,
    repetition_penalty=1.02,
    stop_sequences=["\nUser:", "<|endoftext|>", "</s>"],
)

# prompt
prompt = "What can you do in Nuremberg, Germany? Give me 3 Tips"

stream = client.text_generation(prompt, stream=True, details=True, **gen_kwargs)

# print each generated token as it arrives
for r in stream:
    # skip special tokens
    if r.token.special:
        continue
    # stop if we encounter a stop sequence
    if r.token.text in gen_kwargs["stop_sequences"]:
        break
    # print the generated token
    print(r.token.text, end="")
    # yield r.token.text
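For comparison, the same client can also be called without streaming. A minimal sketch, reusing the client, prompt, and gen_kwargs defined above; with stream=False (and details left at its default) text_generation returns the full completion as a single string:

# non-streaming call: returns the complete generated text at once
generated = client.text_generation(prompt, stream=False, **gen_kwargs)
print(generated)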