import os
from openai import OpenAI
client = OpenAI(
base_url = "https://integrate.api.nvidia.com/v1",
api_key = os.getenv("NVIDIA_API_KEY", "$NVIDIA_API_KEY")
)
completion = client.chat.completions.create(
model="nvidia/nemotron-3-nano-omni-30b-a3b-reasoning",
messages=[{"role":"user","content":""}],
temperature=0.6,
top_p=0.95,
max_tokens=65536,
extra_body={"chat_template_kwargs":{"enable_thinking":True},"reasoning_budget":16384},
stream=False
)
reasoning = getattr(completion.choices[0].message, "reasoning_content", None)
if reasoning:
print(reasoning)
print(completion.choices[0].message.content)Deploy this model now on your endpoint provider of choice