2d:["$","div",null,{"className":"px-4 mx-auto flex max-w-screen-xl flex-col pt-0 lg:px-0","children":["$","section",null,{"className":"flex w-full flex-col justify-between rounded-4 border-manitoulinBorderColor bg-manitoulinDarkBlack sm:rounded-6 lg:rounded-8 p-ms lg:p-lg","children":["$","$L33",null,{"artifact":{"artifactType":"ENDPOINT","name":"vila","displayName":"vila","publisher":"nvidia","shortDescription":"Multi-modal vision-language model that understands text/img/video and creates informative responses","logo":"https://assets.ngc.nvidia.com/products/api-catalog/images/vila.jpg","labels":"$2c:props:children:1:props:children:props:children:props:children:3:props:children:0:props:children:props:labels","attributes":[{"key":"AVAILABLE","value":"false"},{"key":"DEPRECATION","value":"12/19/2025"},{"key":"PREVIEW","value":"true"}],"updatedDate":"2025-04-25T18:45:34.460Z","bias":"| Field | Response |\n| -- | -- |\n|Participation considerations from adversely impacted groups [(protected classes)](https://www.senate.ca.gov/content/protected-classes) in model design and testing: | None of the Above |\n| Measures taken to mitigate against unwanted bias: | No measures taken to mitigate against unwanted bias.|","canGuestDownload":true,"createdDate":"2024-09-09T17:13:43.347Z","description":"$34","explainability":"$35","isPublic":true,"isReadOnly":true,"orgName":"qc69jvmznzxy","privacy":"$36","safetyAndSecurity":"| Field | Response |\n| -- | -- |\n| Model Application(s): | Visual Question Answering and Conversation. Agent to understand and answer the scene. |\n| Describe the life-critical application (if present). | None: Not within Operational Design Domain |\n| Use Case Restrictions: | Abide by [https://www.nvidia.com/en-us/data-center/products/nvidia-ai-enterprise/eula/\"](https://www.nvidia.com/en-us/data-center/products/nvidia-ai-enterprise/eula/). |\n| Describe access restrictions (if any): | The Principle of least privilege (PoLP) is applied limiting access for dataset generation and model development. Restrictions enforce dataset access during training, and dataset license constraints adhered to. |"},"endpointName":"vila","endpointSpec":{"openAPISpec":{"openapi":"3.1.0","info":{"title":"NVIDIA NIM API for nvidia/vila","description":"The NVIDIA NIM REST API. Please see https://docs.api.nvidia.com/nim for more details.","version":"1.0.0","termsOfService":"https://nvidia.com/legal/terms-of-use","contact":{"name":"NVIDIA Support","url":"https://help.nvidia.com/"},"license":{"name":"NVIDIA AI Foundation Models Community License","url":"https://docs.nvidia.com/ai-foundation-models-community-license.pdf"}},"servers":[{"url":"https://ai.api.nvidia.com/v1"}],"tags":[{"name":"Multimodal API","description":"This API performs inference using visual language understanding models"}],"paths":{"/vlm/nvidia/vila":{"post":{"tags":["Multimodal API"],"summary":"Request response from the model","description":"Invokes inference using the model chat parameters. If uploading large images, this POST should be used in conjunction with the NVCF API which allows for the upload of large assets. \nYou can find details on how to use NVCF Asset APIs here: https://docs.api.nvidia.com/cloud-functions/reference/createasset","operationId":"invokeFunction","parameters":[{"in":"header","name":"NVCF-INPUT-ASSET-REFERENCES","schema":{"type":"string","maxLength":370,"format":"uuid"},"required":false,"description":"String of asset IDs separated by commas. Data is uploaded to AWS S3 using NVCF Asset APIs and associated with these asset IDs.If the size of an image is more than 180KB, it needs to be uploaded to a presigned S3 URL bucket. The presigned URL allows for secure and temporary access to the S3 bucket for uploading the image. Once the asset is requested, an asset ID is generated for it. Please include this asset ID in this header and to use the uploaded image in a prompt, you need to refer to it using the following format: `

`."}],"requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/NIMLLMChatCompletionRequest"}}},"required":true},"responses":{"200":{"description":"Invocation is fulfilled","content":{"application/json":{"schema":{"$ref":"#/components/schemas/NIMLLMChatCompletionResponse"}},"text/event-stream":{"schema":{"$ref":"#/components/schemas/NIMLLMChatCompletionStreamResponse"}}}},"202":{"description":"Result is pending. Client should poll using the requestId.\n","content":{"application/json":{"example":{},"schema":{}}},"headers":{"NVCF-REQID":{"description":"requestId required for pooling","schema":{"type":"string","format":"uuid","maxLength":36}},"NVCF-STATUS":{"description":"Invocation status","schema":{"type":"string","format":"^[a-zA-Z-]{1,64}$","maxLength":64}}}},"422":{"description":"Validation failed, provided entity could not be processed.","content":{"application/json":{"schema":{"$ref":"#/components/schemas/Errors"},"example":{"type":"urn:nvcf-worker-service:problem-details:unprocessable-entity","title":"Unprocessable Entity","status":422,"detail":"string","instance":"/v2/nvcf/pexec/functions/bc205f8e-1740-40df-8d32-c4321763498a","requestId":"3fa85f64-5717-4562-b3fc-2c963f66afa6"}}}},"500":{"description":"The invocation ended with an error.","content":{"application/json":{"schema":{"$ref":"#/components/schemas/Errors"},"example":{"type":"urn:nvcf-worker-service:problem-details:internal-server-error","title":"Internal Server Error","status":500,"detail":"string","instance":"/v2/nvcf/pexec/functions/bc205f8e-1740-40df-8d32-c4321763498a","requestId":"3fa85f64-5717-4562-b3fc-2c963f66afa6"}}}}},"x-nvai-meta":{"name":"Create chat completion","returns":"Returns a [chat completion](/docs/api-reference/chat/object) object.\n","path":"create","examples":[{"name":"warehouse_warning_tape.mp4","input":{"text":"Elaborate what the worker is doing, why he would be taking this action and also provide information on what he is wearing.","image":"https://assets.ngc.nvidia.com/products/api-catalog/vila/warehouse_warning_tape.jpeg","video":"https://assets.ngc.nvidia.com/products/api-catalog/vila/warehouse_warning_tape.mp4"},"output":{"text":"The worker, who is wearing a neon vest, black pants, and a yellow hard hat, is pulling a yellow caution tape across the aisle. This action suggests that he is cordoning off the area, likely for safety or maintenance reasons. The caution tape is a common safety measure used to block off areas that are not safe to enter or that require special attention."},"requestJson":"{ \"max_tokens\": 1024, \"temperature\": 0.2, \"top_p\": 0.7, \"seed\": 50, \"model\": \"nvidia/vila\", \"messages\": [ { \"role\": \"user\", \"content\": \"<%- input.text %>: