2d:["$","div",null,{"className":"px-4 mx-auto flex max-w-screen-xl flex-col pt-0 lg:px-0","children":["$","section",null,{"className":"flex w-full flex-col justify-between rounded-4 border-manitoulinBorderColor bg-manitoulinDarkBlack sm:rounded-6 lg:rounded-8 p-ms lg:p-lg","children":["$","$L33",null,{"artifact":{"artifactType":"ENDPOINT","name":"llama-3_1-nemotron-70b-reward","displayName":"llama-3.1-nemotron-70b-reward","publisher":"nvidia","shortDescription":"Leaderboard topping reward model supporting RLHF for better alignment with human preferences.","logo":"https://assets.ngc.nvidia.com/products/api-catalog/images/llama-3_1-nemotron-70b-reward.jpg","labels":"$2c:props:children:1:props:children:props:children:props:children:3:props:children:0:props:children:props:labels","attributes":[{"key":"DEPRECATION","value":"04/15/2026"},{"key":"PREVIEW","value":"true"}],"updatedDate":"2024-11-18T22:31:06.314Z","bias":"Field | Response\n:---------------------------------------------------------------------------------------------------|:---------------\nParticipation considerations from adversely impacted groups [protected classes](https://www.senate.ca.gov/content/protected-classes) in model design and testing: | None\nMeasures taken to mitigate against unwanted bias: | None","canGuestDownload":true,"createdDate":"2024-09-30T16:45:05.774Z","description":"$34","explainability":"$35","isPublic":true,"isReadOnly":true,"orgName":"qc69jvmznzxy","privacy":"$36","safetyAndSecurity":"Field | Response\n:---------------------------------------------------|:----------------------------------\nModel Application(s): | Conversation, Question Answering, Summarization\nDescribe the life-critical impact (if present). | None Known\nUse Case Restrictions: | See https://github.com/meta-llama/llama-models/blob/main/models/llama3_1/LICENSE \nModel and dataset restrictions: | The Principle of least privilege (PoLP) is applied limiting access for dataset generation and model development. 
Restrictions enforce dataset access during training, and dataset license constraints adhered to."},"endpointName":"llama-3_1-nemotron-70b-reward","endpointSpec":{"openAPISpec":{"openapi":"3.1.0","info":{"title":"NVIDIA NIM API for nvidia/llama-3.1-nemotron-70b-reward","description":"The NVIDIA NIM REST API. Please see https://docs.api.nvidia.com/nim/reference/nvidia-llama-3_1-nemotron-70b-reward for more details.","version":"1.0.0","termsOfService":"https://www.nvidia.com/en-us/data-center/products/nvidia-ai-enterprise/eula/","contact":{"name":"NVIDIA Enterprise Support","url":"https://www.nvidia.com/en-us/support/enterprise/"},"license":{"name":"NVIDIA AI Foundation Models Community License Agreement","url":"https://www.nvidia.com/en-us/agreements/enterprise-software/nvidia-ai-foundation-models-community-license-agreement/"}},"servers":[{"url":"https://integrate.api.nvidia.com/v1/"}],"tags":[{"name":"NVCF API","description":"Run inference on the model"}],"paths":{"/chat/completions":{"post":{"operationId":"create_chat_completion_v1_chat_completions_post","tags":["Chat"],"summary":"Creates a model response for the given chat conversation.","description":"Given a list of messages comprising a conversation, the model will return a response. Compatible with OpenAI. See https://platform.openai.com/docs/api-reference/chat/create","requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/ChatRequest"}}},"required":true},"responses":{"200":{"description":"Invocation is fulfilled","content":{"application/json":{"schema":{"$ref":"#/components/schemas/ChatCompletion"}}}},"202":{"description":"Result is pending. 
Client should poll using the requestId.","content":{"application/json":{"example":{},"schema":{}}},"headers":{"NVCF-REQID":{"description":"requestId required for polling","schema":{"type":"string","format":"uuid"}},"NVCF-STATUS":{"description":"Invocation status","schema":{"type":"string"}}}},"422":{"description":"Validation failed, provided entity could not be processed.","content":{"application/json":{"schema":{"$ref":"#/components/schemas/Errors"},"example":{"type":"urn:nvcf-worker-service:problem-details:unprocessable-entity","title":"Unprocessable Entity","status":422,"detail":"string","instance":"/v2/nvcf/pexec/functions/c53ee0e9-bad9-4e09-b365-52c9d6b71254","requestId":"3fa85f64-5717-4562-b3fc-2c963f66afa6"}}}},"500":{"description":"The invocation ended with an error.","content":{"application/json":{"schema":{"$ref":"#/components/schemas/Errors"},"example":{"type":"urn:nvcf-worker-service:problem-details:internal-server-error","title":"Internal Server Error","status":500,"detail":"string","instance":"/v2/nvcf/pexec/functions/c53ee0e9-bad9-4e09-b365-52c9d6b71254","requestId":"3fa85f64-5717-4562-b3fc-2c963f66afa6"}}}}},"x-nvai-meta":{"name":"Create chat completion","returns":"Returns a [chat completion](/docs/api-reference/chat/object) object\n","path":"create","examples":[{"name":"Grade the assistant response","requestJson":"{\n \"model\": \"nvidia/llama-3.1-nemotron-70b-reward\",\n \"messages\": [\n {\n \"role\": \"user\",\n \"content\": \"I am going to Paris, what should I see?\"\n },\n {\n \"role\": \"assistant\",\n \"content\": \"Ah, Paris, the City of Light! 
There are so many amazing things to see and do in this beautiful city ...\"\n }\n ]\n}\n","responseJson":"{\n \"id\": \"id-123\",\n \"choices\": [\n {\n \"index\": 0,\n \"message\": {\n \"content\": \"reward:-19.875\",\n \"role\": \"assistant\"\n },\n \"finish_reason\": \"length\"\n }\n ],\n \"usage\": {\n \"completion_tokens\": 1,\n \"prompt_tokens\": 78,\n \"total_tokens\": 79\n }\n}\n"},{"name":"Grade the assistant response in multiturn","requestJson":"{\n \"model\": \"nvidia/llama-3.1-nemotron-70b-reward\",\n \"messages\": [\n {\n \"role\": \"user\",\n \"content\": \"I am going to Paris, what should I see?\"\n },\n {\n \"role\": \"assistant\",\n \"content\": \"Ah, Paris, the City of Light! There are so many amazing things to see and do in this beautiful city ...\"\n },\n {\n \"role\": \"user\",\n \"content\": \"What cafes do you recommend?\"\n },\n {\n \"role\": \"assistant\",\n \"content\": \"A very popular cafe in the heart of Paris is ...\"\n }\n ]\n}\n","responseJson":"{\n \"id\": \"id-123\",\n \"choices\": [\n {\n \"index\": 0,\n \"message\": {\n \"content\": \"reward:-27.375\",\n \"role\": \"assistant\"\n },\n \"finish_reason\": \"length\"\n }\n ],\n \"usage\": {\n \"completion_tokens\": 1,\n \"prompt_tokens\": 103,\n \"total_tokens\": 104\n }\n}\n"}],"templates":[{"title":"No Streaming","requestEjs":{"python":"from openai import OpenAI\n\nclient = OpenAI(\n base_url = \"https://integrate.api.nvidia.com/v1\",\n api_key = \"$NVIDIA_API_KEY\"\n)\n\ncompletion = client.chat.completions.create(\n model=\"<%- request.model %>\",\n messages=<%- JSON.stringify(request.messages) %>,\n)\nprint(completion)\n","node.js":"import OpenAI from 'openai';\n\nconst openai = new OpenAI({\n apiKey: '$NVIDIA_API_KEY',\n baseURL: 'https://integrate.api.nvidia.com/v1',\n})\n\nasync function main() {\n const completion = await openai.chat.completions.create({\n model: \"<%- request.model %>\",\n messages: <%- JSON.stringify(request.messages) %>,\n })\n 
process.stdout.write(JSON.stringify(completion));\n}\n\nmain();","curl":"curl https://integrate.api.nvidia.com/v1/chat/completions \\\n -H \"Content-Type: application/json\" \\\n -H \"Authorization: Bearer $NVIDIA_API_KEY\" \\\n -d '{\n \"model\": \"nvidia/llama-3.1-nemotron-70b-reward\",\n \"messages\": <%- JSON.stringify(request.messages).replaceAll(\"'\", \"'\\\"'\\\"'\") %> }'\n"},"response":"{\n \"id\": \"id-123\",\n \"choices\": [\n {\n \"index\": 0,\n \"message\": {\n \"content\": \"reward:-27.375\",\n \"role\": \"assistant\"\n },\n \"finish_reason\": \"length\"\n }\n ],\n \"usage\": {\n \"completion_tokens\": 1,\n \"prompt_tokens\": 67,\n \"total_tokens\": 68\n }\n}\n"}]}}}},"security":[{"Token":[]}],"components":{"securitySchemes":{"Token":{"type":"http","scheme":"bearer"}},"schemas":{"Errors":{"properties":{"type":{"type":"string","description":"Error type"},"title":{"type":"string","description":"Error title"},"status":{"type":"integer","description":"Error status code"},"detail":{"type":"string","description":"Detailed information about the error"},"instance":{"type":"string","description":"Function instance used to invoke the request"},"requestId":{"type":"string","format":"uuid","description":"UUID of the request"}},"type":"object","required":["type","title","status","detail","instance","requestId"],"title":"InvokeError"},"ChatCompletion":{"properties":{"id":{"description":"A unique identifier for the completion.","format":"uuid","title":"Id","type":"string"},"choices":{"description":"The list of completion choices the model generated for the input prompt.","items":{"$ref":"#/components/schemas/Choice"},"title":"Choices","type":"array"},"usage":{"allOf":[{"$ref":"#/components/schemas/Usage"}],"description":"Usage statistics for the completion request."}},"required":["id","choices","usage"],"title":"ChatCompletion","type":"object"},"ChatCompletionMessage":{"properties":{"content":{"anyOf":[{"type":"string"},{"type":"null"}],"description":"The contents 
of the message.","title":"Content"},"role":{"const":"assistant","description":"The role of the author of this message.","enum":["assistant"],"title":"Role","type":"string"}},"required":["content","role"],"title":"ChatCompletionMessage","type":"object"},"ChatRequest":{"additionalProperties":false,"properties":{"model":{"type":"string","title":"Model","default":"nvidia/llama-3.1-nemotron-70b-reward"},"messages":{"description":"A list of messages comprising the conversation so far that is to be graded. The roles of the messages must be alternating between `user` and `assistant`. The last input message should have role `assistant`.","examples":[[{"content":"I am going to Paris, what should I see?","role":"user"},{"content":"Ah, Paris, the City of Light! There are so many amazing things to see and do in this beautiful city ...","role":"assistant"}]],"items":{"$ref":"#/components/schemas/Message"},"title":"Messages","type":"array"}},"required":["messages"],"title":"ChatRequest","type":"object"},"Choice":{"properties":{"index":{"description":"The index of the choice in the list of choices (always 0).","title":"Index","type":"integer"},"message":{"description":"The score key:value pairs separated by a comma.","examples":[{"content":"reward:-19.875","role":"assistant"}],"items":{"$ref":"#/components/schemas/ChatCompletionMessage"},"title":"Message","type":"array"},"finish_reason":{"anyOf":[{"enum":["stop","length"],"type":"string"},{"type":"null"}],"default":null,"description":"The reason the model stopped generating tokens. 
This will be `stop` if the model hit a natural stop point or a provided stop sequence, or `length` if the maximum number of tokens specified in the request was reached.","examples":["stop"],"title":"Finish Reason"}},"required":["index","message"],"title":"Choice","type":"object"},"Message":{"additionalProperties":false,"properties":{"role":{"description":"The role of the message author.","enum":["user","assistant"],"title":"Role","type":"string"},"content":{"description":"The contents of the message.","title":"Content","type":"string"}},"required":["role","content"],"title":"Message","type":"object"},"Usage":{"properties":{"completion_tokens":{"description":"Number of tokens in the generated completion.","examples":[1],"title":"Completion Tokens","type":"integer"},"prompt_tokens":{"description":"Number of tokens in the prompt.","examples":[9],"title":"Prompt Tokens","type":"integer"},"total_tokens":{"description":"Total number of tokens used in the request (prompt + completion).","examples":[10],"title":"Total Tokens","type":"integer"}},"required":["completion_tokens","prompt_tokens","total_tokens"],"title":"Usage","type":"object"}}}},"namespace":"qc69jvmznzxy","updatedDate":"2026-04-15T11:24:09.523Z","nvcfFunctionId":"2d732656-1ffd-4125-9e29-20e2180a736f","createdDate":"2024-09-30T16:45:06.041Z","attributes":{"apiDocsUrl":"https://docs.api.nvidia.com/nim/reference/nvidia-llama-3_1-nemotron-70b-reward","termsOfUse":"GOVERNING TERMS: The trial service is governed by the NVIDIA API Service Agreement; and the use of this model is governed by the NVIDIA AI Foundation Models Community License Agreement.\n","deprecationNotice":"This API will be deprecated on 04/15/2026. It will no longer be supported after 04/15/2026. Please use openai/gpt-oss-120b instead. 
For more information, visit our API Reference.","showUnavailableBanner":false,"cta":"$2c:props:children:1:props:children:props:children:props:children:3:props:children:1:props:children:1:props:cta","playground":{"type":"reward","options":{"reward":{"outputToolTip":""}}}},"artifactName":"llama-3_1-nemotron-70b-reward"},"hasAcceptedLicense":false,"isLoginRequired":true,"license":"$undefined","playgroundElement":"$undefined","publisherName":"nvidia","searchParams":{},"tabs":[{"label":"Experience","bare":true,"icon":"play","kind":"default","id":"experience","href":"/nvidia/llama-3_1-nemotron-70b-reward","aliases":["/nvidia/llama-3_1-nemotron-70b-reward/experience"]}]}]}]}]