Spaces:

sailfish
/

lightweight-chat

Running

sailfish committed on Oct 24

Commit

e3be437

•

1 Parent(s): e520569

fix 5

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,8 +6,10 @@ from huggingface_hub import InferenceClient
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
 huggingface_token = os.getenv("SECRET_ENV_VARIABLE")
-client = InferenceClient(api_key=huggingface_token)
 '''
 import requests
@@ -45,8 +47,7 @@ def respond(
     response = ""
     for message in client.chat_completion(
-        model="meta-llama/Llama-3.2-1B",
-        messages=messages,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,

 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
+model_name = "meta-llama/Llama-3.2-1B"
 huggingface_token = os.getenv("SECRET_ENV_VARIABLE")
+#client = InferenceClient(api_key=huggingface_token)
+client = InferenceClient(model=model_name, token=huggingface_token)
 '''
 import requests
     response = ""
     for message in client.chat_completion(
+        messages,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,