17:["$","$L30",null,{"state":{"mutations":[],"queries":[{"state":{"data":null,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/rerank/chat-v2.enabled"],"queryHash":"[\"killswitches/rerank/chat-v2.enabled\"]"},{"state":{"data":false,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/chatWithTools/chat-v2.enabled"],"queryHash":"[\"killswitches/chatWithTools/chat-v2.enabled\"]"},{"state":{"data":false,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/chatWithFeatures/chat-v2.enabled"],"queryHash":"[\"killswitches/chatWithFeatures/chat-v2.enabled\"]"},{"state":{"data":null,"dataUpdateCount":1,"dataUpdatedAt":1752392850393,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/nv-rerankqa-mistral-4b-v3/playground.enabled"],"queryHash":"[\"killswitches/nv-rerankqa-mistral-4b-v3/playground.enabled\"]"},{"state":{"data":false,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/chat-metrics.enabled"],"queryHash":"[\"killswitches/chat-metrics.enabled\"]"},{"state":{"data":true,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/vss-2.enabled"],"queryHash":"[\"killswitches/vss-2.enabled\"]"},{"state":{"data":true,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/mega-2.enabled"],"queryHash":"[\"killswitches/mega-2.enabled\"]"},{"state":{"data":true,"dataUpdateCount":1,"dataUpdatedAt":1752392850389,"error":null,"errorUpdateCount":0,"errorUpdatedAt":0,"fetchFailureCount":0,"fetchFailureReason":null,"fetchMeta":null,"isInvalidated":false,"status":"success","fetchStatus":"idle"},"queryKey":["killswitches/riva-magpie-2.enabled"],"queryHash":"[\"killswitches/riva-magpie-2.enabled\"]"}]},"children":["$undefined",["$","div",null,{"className":"px-4 pt-4 md:px-8 mx-auto flex max-w-[1600px] flex-col gap-md","children":[["$","div",null,{"className":"relative flex min-h-[150px] flex-col overflow-hidden rounded-4 border-sm border-solid border-n700 bg-manitoulinDarkBlack p-md sm:rounded-6 md:rounded-8 md:px-ml md:py-ml","children":[["$","$L31",null,{"alt":"","className":"object-cover object-center !left-1/2 z-10 !w-1/2 brightness-20 md:brightness-100","fill":true,"priority":true,"src":"https://assets.ngc.nvidia.com/products/api-catalog/images/nv-rerankqa-mistral-4b-v3.jpg","style":{"maskImage":"linear-gradient(to left, rgba(0,0,0,1), rgba(0,0,0,0))"}}],["$","div",null,{"className":"z-20 flex min-w-0 flex-1 flex-col justify-between gap-ml md:flex-row","children":[["$","div",null,{"className":"flex min-w-0 flex-1 flex-col","children":["$","div",null,{"className":"flex flex-col gap-0.5 whitespace-pre-wrap","children":[["$","h2",null,{"className":"text-ml lowercase text-n300 hover:text-n050","children":["$","$L26",null,{"href":"/nvidia","children":"nvidia"}]}],["$","div",null,{"className":"flex items-center gap-3","children":[["$","h1",null,{"className":"text-lg font-medium leading-heading","data-testid":"resource-name","children":"nv-rerankqa-mistral-4b-v3"}],["$","span",null,{"className":"inline-flex h-5 w-fit items-center gap-1 rounded-1 px-2 align-bottom text-xs font-bold uppercase leading-caps tracking-more border-0 bg-p300 text-p700","children":["$undefined","Run Anywhere"]}],"$undefined"]}],["$","p",null,{"className":"text-ms","children":"Multilingual text reranking model."}],["$","div",null,{"className":"mt-2 flex flex-wrap gap-sm","children":["$","$L32",null,{"density":"standard","labels":["Reranking","nemo retriever","Retrieval Augmented Generation"]}]}]]}]}],["$","div",null,{"className":"mt-auto flex gap-ms","children":["$undefined",["$","$L33",null,{"cta":{"text":"Apply to Self-Host","url":"https://www.nvidia.com/en-us/ai/nim-notifyme/"},"isNIMAvailable":true}]]}]]}]]}],["$","section",null,{"className":"flex w-full flex-col justify-between rounded-4 border-manitoulinBorderColor bg-manitoulinDarkBlack sm:rounded-6 md:rounded-8 p-ms md:p-lg","children":["$","$L34",null,{"artifact":{"artifactType":"ENDPOINT","name":"nv-rerankqa-mistral-4b-v3","displayName":"nv-rerankqa-mistral-4b-v3","publisher":"nvidia","shortDescription":"Multilingual text reranking model.","logo":"https://assets.ngc.nvidia.com/products/api-catalog/images/nv-rerankqa-mistral-4b-v3.jpg","labels":"$35","attributes":[{"key":"AVAILABLE","value":"true"},{"key":"PREVIEW","value":"false"}],"bias":"| Field | Response |\n|:-------------------|:---------|\n| Participation considerations from adversely impacted groups [protected classes](https://www.senate.ca.gov/content/protected-classes) in model design and testing | None |\n| Measures taken to mitigate against unwanted bias | None |","canGuestDownload":true,"createdDate":"2024-07-17T21:20:00.445Z","description":"$36","explainability":"$37","isPublic":true,"isReadOnly":true,"orgName":"qc69jvmznzxy","privacy":"$38","safetyAndSecurity":"| Field | Response |\n|:-------------------|:---------|\n|Verified to have met prescribed quality standards: | Yes |\n|Target Key Performance Indicator(s) (KPI(s)): | Accuracy, Latency, Throughput |\n|Model Application(s): | Text Reranking for Retrieval |\n|Describe the physical safety impact (if present). | Not Applicable |\n|Use Case Restrictions:| Commercial license available from NVIDIA AI Enterprise. |\n|Model and dataset restrictions:| The Principle of least privilege (PoLP) is applied limiting access for dataset generation and model development. Restrictions enforce dataset access during training, and dataset license constraints adhered to. |","updatedDate":"2025-03-21T13:13:39.852Z"},"endpointName":"nv-rerankqa-mistral-4b-v3","endpointSpec":{"openAPISpec":{"openapi":"3.1.0","info":{"title":"NVIDIA NIM API for nvidia/nv-rerankqa-mistral-4b-v3","description":"The NVIDIA NIM REST API. Please see https://docs.api.nvidia.com/nim/reference/nvidia-nv-rerankqa-mistral-4b-v3 for more details.","version":"1.0.0","termsOfService":"https://nvidia.com/legal/terms-of-use","contact":{"name":"NVIDIA Support","url":"https://help.nvidia.com/"},"license":{"name":"CC-BY-NC-4.0","url":"https://spdx.org/licenses/CC-BY-NC-4.0"}},"servers":[{"url":"https://ai.api.nvidia.com/v1"}],"paths":{"/retrieval/nvidia/nv-rerankqa-mistral-4b-v3/reranking":{"post":{"tags":["Reranking"],"summary":"Rank passages by their relation to a query.","description":"Order a list of passages by their relation to a query.\n\nNote that if a given query + passage pair is longer than the ranking model's context window,\nit will be automatically truncated.","operationId":"rank","requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/RankRequest"}}},"required":true},"x-nvai-meta":{"name":"Passage Reranking","description":"Ranks a list of passages based on their relevance to a provided query using a specific model.","path":"create","examples":[{"name":"Passage Reranking","description":"Ranks a list of passages based on their relevance to a provided query using a specific model.","requestJson":"$39","responseJson":"{\n \"rankings\": [\n {\n \"index\": 2,\n \"logit\": 4.74609375\n },\n {\n \"index\": 1,\n \"logit\": -6.11328125\n },\n {\n \"index\": 0,\n \"logit\": -7.25390625\n }\n ]\n}\n"},{"name":"Passage Reranking","description":"Ranks a list of passages based on their relevance to a provided query using a specific model.","requestJson":"$3a","responseJson":"{\n \"rankings\": [\n {\n \"index\": 0,\n \"logit\": 5.3046875\n },\n {\n \"index\": 2,\n \"logit\": 4.7890625\n },\n {\n \"index\": 1,\n \"logit\": 2.671875\n },\n {\n \"index\": 4,\n \"logit\": -12.0859375\n },\n {\n \"index\": 3,\n \"logit\": -12.3359375\n },\n {\n \"index\": 5,\n \"logit\": -15.9296875\n }\n ]\n}\n"}],"templates":[{"title":"Synchronous requests","requestEjs":{"python":"","langchain":"from langchain_nvidia_ai_endpoints import NVIDIARerank\nfrom langchain_core.documents import Document\n\nquery = <%- JSON.stringify(request.query.text) %>\npassages = [<% request.passages.forEach(function(passage) { %>\n \"<%- passage.text %>\", <% }); %>\n]\n\nclient = NVIDIARerank(\n model=\"<%- request.model %>\", \n api_key=\"$NVIDIA_API_KEY\",\n)\n\nresponse = client.compress_documents(\n query=query,\n documents=[Document(page_content=passage) for passage in passages]\n)\n\nprint(f\"Most relevant: {response[0].page_content}\\nLeast relevant: {response[-1].page_content}\")\n","node.js":"","curl":""}}]},"responses":{"200":{"description":"The ranked list of texts.","content":{"application/json":{"schema":{"$ref":"#/components/schemas/RankResponse"}}}},"402":{"description":"Payment Required","content":{"application/json":{"schema":{"$ref":"#/components/schemas/PaymentRequiredError"}}}},"422":{"description":"The request was invalid.","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}}},"security":[{"Token":[]}],"components":{"securitySchemes":{"Token":{"type":"http","scheme":"bearer"}},"schemas":{"MultiModalData":{"properties":{"text":{"type":"string","maxLength":14598366,"minLength":1,"pattern":".*","title":"Text"}},"additionalProperties":false,"type":"object","required":["text"],"title":"MultiModalData","description":"A type signifier for multimodal data.\n\nSupported data types: text."},"Rank":{"properties":{"index":{"type":"integer","maximum":512,"minimum":0,"format":"int32","title":"Index"},"logit":{"type":"number","title":"Logit"}},"type":"object","required":["index","logit"],"title":"Rank","description":"A single ranked text."},"RankRequest":{"properties":{"model":{"description":"Model identifier","type":"string","maxLength":128,"minLength":1,"pattern":".*","title":"Model","default":"nvidia/nv-rerankqa-mistral-4b-v3","examples":["nvidia/nv-rerankqa-mistral-4b-v3"]},"query":{"allOf":[{"$ref":"#/components/schemas/MultiModalData"}],"description":"A text query for ranking the passages","examples":[{"text":"What is the GPU memory bandwidth of H100 SXM?"}]},"passages":{"items":{"$ref":"#/components/schemas/MultiModalData"},"type":"array","maxItems":512,"minItems":1,"title":"Passages","description":"Text passages to rank based on the query","examples":[[{"text":"The Hopper GPU is paired with the Grace CPU using NVIDIA's ultra-fast chip-to-chip interconnect, delivering 900GB/s of bandwidth, 7X faster than PCIe Gen5. This innovative design will deliver up to 30X higher aggregate system memory bandwidth to the GPU compared to today's fastest servers and up to 10X higher performance for applications running terabytes of data."},{"text":"A100 provides up to 20X higher performance over the prior generation and can be partitioned into seven GPU instances to dynamically adjust to shifting demands. The A100 80GB debuts the world's fastest memory bandwidth at over 2 terabytes per second (TB/s) to run the largest models and datasets."},{"text":"Accelerated servers with H100 deliver the compute power—along with 3 terabytes per second (TB/s) of memory bandwidth per GPU and scalability with NVLink and NVSwitch™."}]]},"truncate":{"type":"string","enum":["END","NONE"],"title":"Truncate","default":"NONE"}},"type":"object","required":["model","query","passages"],"title":"RankRequest","description":"A request to the rank endpoint."},"RankResponse":{"properties":{"rankings":{"items":{"$ref":"#/components/schemas/Rank"},"type":"array","maxItems":512,"minItems":1,"title":"Rankings","examples":[[{"index":2,"logit":4.74609375},{"index":1,"logit":-6.11328125},{"index":0,"logit":-7.25390625}]]}},"type":"object","required":["rankings"],"title":"RankResponse","description":"A response from the rank endpoint."},"ValidationError":{"properties":{"loc":{"items":{"anyOf":[{"type":"string"},{"type":"integer"}]},"type":"array","title":"Location"},"msg":{"type":"string","title":"Message"},"type":{"type":"string","title":"Error Type"}},"type":"object","required":["loc","msg","type"],"title":"ValidationError"},"HTTPValidationError":{"properties":{"detail":{"items":{"$ref":"#/components/schemas/ValidationError"},"type":"array","title":"Detail"}},"type":"object","title":"HTTPValidationError"},"PaymentRequiredError":{"properties":{"detail":{"type":"string","description":"Contains specific information related to the error and why it occurred.","example":"You have reached your limit of credits."}},"type":"object","title":"PaymentRequiredError"}}},"tags":[{"name":"Reranking","description":"Rank passages by their relation to a query."}]},"namespace":"qc69jvmznzxy","updatedDate":"2025-03-21T13:13:40.470Z","nvcfFunctionId":"98b83903-f595-48c4-b727-b69067b7c069","createdDate":"2024-07-17T21:20:00.670Z","attributes":{"apiDocsUrl":"https://docs.api.nvidia.com/nim/reference/nvidia-nv-rerankqa-mistral-4b-v3","termsOfUse":"GOVERNING TERMS: Your use of this API is governed by the NVIDIA API Trial Service Terms of Use; and the use of this model is governed by the Apache 2.0 License.\n","showUnavailableBanner":false,"cta":"$3b","playground":{"type":"rerank"},"deploy":[{"label":"Linux with Docker","filename":"linux.md","contents":"$3c"}]},"artifactName":"nv-rerankqa-mistral-4b-v3"},"hasAcceptedLicense":false,"isLoginRequired":true,"license":null,"playgroundElement":"$undefined","publisherName":"nvidia","searchParams":{}}]}]]}],["$","$L3d",null,{"spec":"$3e"}]]}]