main.py aktualisiert
This commit is contained in:
18
main.py
18
main.py
@@ -123,6 +123,22 @@ async def get_ai_response(user_input, system_prompt):
|
|||||||
messages=messages
|
messages=messages
|
||||||
)
|
)
|
||||||
ai_msg = response.choices[0].message.content
|
ai_msg = response.choices[0].message.content
|
||||||
|
|
||||||
|
elif AI_PROVIDER == "nvidia":
|
||||||
|
if not NVIDIA_API_KEY:
|
||||||
|
return "Fehler: NVIDIA_API_KEY fehlt!"
|
||||||
|
|
||||||
|
# NVIDIA nutzt ebenfalls das OpenAI Interface
|
||||||
|
client = openai.OpenAI(
|
||||||
|
base_url="https://integrate.api.nvidia.com/v1",
|
||||||
|
api_key=NVIDIA_API_KEY
|
||||||
|
)
|
||||||
|
messages = [{"role": "system", "content": system_prompt}] + chat_history
|
||||||
|
response = client.chat.completions.create(
|
||||||
|
model=NVIDIA_MODEL,
|
||||||
|
messages=messages
|
||||||
|
)
|
||||||
|
ai_msg = response.choices[0].message.content
|
||||||
|
|
||||||
elif AI_PROVIDER == "google":
|
elif AI_PROVIDER == "google":
|
||||||
# Für Google Gemini
|
# Für Google Gemini
|
||||||
@@ -430,14 +446,12 @@ async def get_models(provider: str, url: str = None):
|
|||||||
|
|
||||||
elif provider == "nvidia":
|
elif provider == "nvidia":
|
||||||
if not NVIDIA_API_KEY or "hier" in NVIDIA_API_KEY: return {"models": []}
|
if not NVIDIA_API_KEY or "hier" in NVIDIA_API_KEY: return {"models": []}
|
||||||
|
|
||||||
# NVIDIA nutzt das OpenAI SDK!
|
# NVIDIA nutzt das OpenAI SDK!
|
||||||
import openai
|
import openai
|
||||||
client = openai.AsyncOpenAI(
|
client = openai.AsyncOpenAI(
|
||||||
api_key=NVIDIA_API_KEY,
|
api_key=NVIDIA_API_KEY,
|
||||||
base_url="https://integrate.api.nvidia.com/v1"
|
base_url="https://integrate.api.nvidia.com/v1"
|
||||||
)
|
)
|
||||||
|
|
||||||
try:
|
try:
|
||||||
response = await client.models.list()
|
response = await client.models.list()
|
||||||
# Bei NVIDIA heißen die Modelle oft nach dem Schema "nvidia/llama-3.1-405b"
|
# Bei NVIDIA heißen die Modelle oft nach dem Schema "nvidia/llama-3.1-405b"
|
||||||
|
|||||||
Reference in New Issue
Block a user