Spaces:

GIZ
/

audit_assistant

Running on T4

ppsingh committed on Aug 8, 2024

Commit

620ccce

verified ·

1 Parent(s): 488567e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -185,17 +185,11 @@ async def chat(query,history,sources,reports,subtype,year):
     # llama-3_1 endpoint = https://howaqfw0lpap12sg.us-east-1.aws.endpoints.huggingface.cloud
     # llama-3 endpoint = https://nhe9phsr2zhs0e36.eu-west-1.aws.endpoints.huggingface.cloud
-    callbacks = [StreamingStdOutCallbackHandler()]
     llm_qa = HuggingFaceEndpoint(
         endpoint_url="https://howaqfw0lpap12sg.us-east-1.aws.endpoints.huggingface.cloud",
-        max_new_tokens=1024,
-        top_k=10,
-        top_p=0.95,
-        typical_p=0.95,
-        temperature=0.01,
-        callbacks=callbacks,
-        streaming=True,
-        repetition_penalty=1.03,)
     # create rag chain
     chat_model = ChatHuggingFace(llm=llm_qa)

     # llama-3_1 endpoint = https://howaqfw0lpap12sg.us-east-1.aws.endpoints.huggingface.cloud
     # llama-3 endpoint = https://nhe9phsr2zhs0e36.eu-west-1.aws.endpoints.huggingface.cloud
+    #callbacks = [StreamingStdOutCallbackHandler()]
     llm_qa = HuggingFaceEndpoint(
         endpoint_url="https://howaqfw0lpap12sg.us-east-1.aws.endpoints.huggingface.cloud",
+        task="text-generation",
+        huggingfacehub_api_token=HF_token)
     # create rag chain
     chat_model = ChatHuggingFace(llm=llm_qa)