Update appStore/rag.py
Browse files
- appStore/rag.py +6 -2
appStore/rag.py
CHANGED
|
@@ -56,8 +56,12 @@ def run_query(context, label, model_sel_name):
|
|
| 56 |
#messages = [{"role": "system", "content": chatbot_role},{"role": "user", "content": get_prompt(context, label)}]
|
| 57 |
|
| 58 |
# Initialize the client, pointing it to one of the available models
|
| 59 |
-
client = InferenceClient(model_sel_name, token=hf_token)
|
| 60 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 61 |
# Instantiate ChatCompletion as a generator object (stream is set to True)
|
| 62 |
chat_completion = client.chat.completions.create(
|
| 63 |
messages=messages,
|
|
|
|
| 56 |
#messages = [{"role": "system", "content": chatbot_role},{"role": "user", "content": get_prompt(context, label)}]
|
| 57 |
|
| 58 |
# Initialize the client, pointing it to one of the available models
|
| 59 |
+
#client = InferenceClient(model_sel_name, token=hf_token)
|
| 60 |
+
client = InferenceClient(
|
| 61 |
+
provider='nebius',
|
| 62 |
+
api_key=hf_token,
|
| 63 |
+
bill_to="GIZ",
|
| 64 |
+
)
|
| 65 |
# Instantiate ChatCompletion as a generator object (stream is set to True)
|
| 66 |
chat_completion = client.chat.completions.create(
|
| 67 |
messages=messages,
|