import * as z from "zod/v4";
import { OpenEnum } from "../types/enums.js";
import { Result as SafeParseResult } from "../types/fp.js";
import { EndpointStatus } from "./endpointstatus.js";
import { SDKValidationError } from "./errors/sdkvalidationerror.js";
import { Parameter } from "./parameter.js";
import { PercentileStats } from "./percentilestats.js";
import { ProviderName } from "./providername.js";

/**
 * Pricing fields attached to an endpoint.
 *
 * Only `completion` and `prompt` are required; every other field is optional.
 * All amounts are typed as strings except `discount`, which is a number.
 * Units and currency are not specified by this declaration.
 */
export type Pricing = {
  audio?: string | undefined;
  audioOutput?: string | undefined;
  completion: string;
  discount?: number | undefined;
  image?: string | undefined;
  imageOutput?: string | undefined;
  imageToken?: string | undefined;
  inputAudioCache?: string | undefined;
  inputCacheRead?: string | undefined;
  inputCacheWrite?: string | undefined;
  internalReasoning?: string | undefined;
  prompt: string;
  request?: string | undefined;
  webSearch?: string | undefined;
};

/**
 * Known quantization identifiers, keyed by a PascalCase member name.
 */
export declare const PublicEndpointQuantization: {
  readonly Int4: "int4";
  readonly Int8: "int8";
  readonly Fp4: "fp4";
  readonly Fp6: "fp6";
  readonly Fp8: "fp8";
  readonly Fp16: "fp16";
  readonly Bf16: "bf16";
  readonly Fp32: "fp32";
  readonly Unknown: "unknown";
};
/**
 * Open enum over the values of the `PublicEndpointQuantization` constant.
 *
 * NOTE(review): the type argument ties the alias to the constant above;
 * confirm the arity of `OpenEnum` against `../types/enums.js`.
 */
export type PublicEndpointQuantization = OpenEnum<
  typeof PublicEndpointQuantization
>;

/**
 * Information about a specific model endpoint
 */
export type PublicEndpoint = {
  contextLength: number;
  /**
   * Latency percentiles in milliseconds over the last 30 minutes. Latency measures time to first token. Only visible when authenticated with an API key or cookie; returns null for unauthenticated requests.
   */
  latencyLast30m: PercentileStats | null;
  maxCompletionTokens: number | null;
  maxPromptTokens: number | null;
  /**
   * The unique identifier for the model (permaslug)
   */
  modelId: string;
  modelName: string;
  name: string;
  pricing: Pricing;
  providerName: ProviderName;
  quantization: PublicEndpointQuantization | null;
  status?: EndpointStatus | undefined;
  /**
   * Parameters supported by this endpoint.
   */
  supportedParameters: Array<Parameter>;
  supportsImplicitCaching: boolean;
  tag: string;
  /**
   * Throughput percentiles over the last 30 minutes; null when unavailable.
   * NOTE(review): units and visibility rules are not stated here — confirm against the API spec.
   */
  throughputLast30m: PercentileStats | null;
  /**
   * Uptime percentage over the last 1 day, calculated as successful requests / (successful + error requests) * 100. Rate-limited requests are excluded. Returns null if insufficient data.
   */
  uptimeLast1d: number | null;
  /**
   * Uptime over the last 30 minutes.
   * NOTE(review): presumably computed like `uptimeLast1d` and `uptimeLast5m` — confirm against the API spec.
   */
  uptimeLast30m: number | null;
  /**
   * Uptime percentage over the last 5 minutes, calculated as successful requests / (successful + error requests) * 100. Rate-limited requests are excluded. Returns null if insufficient data.
   */
  uptimeLast5m: number | null;
};

/** @internal */
export declare const Pricing$inboundSchema: z.ZodType<Pricing, unknown>;
/**
 * Parses a JSON string into a `Pricing`.
 *
 * @param jsonString - Raw JSON text to parse.
 * @returns A result holding either the parsed `Pricing` or an `SDKValidationError`.
 */
export declare function pricingFromJSON(
  jsonString: string,
): SafeParseResult<Pricing, SDKValidationError>;

/** @internal */
export declare const PublicEndpointQuantization$inboundSchema: z.ZodType<
  PublicEndpointQuantization,
  unknown
>;

/** @internal */
export declare const PublicEndpoint$inboundSchema: z.ZodType<
  PublicEndpoint,
  unknown
>;
/**
 * Parses a JSON string into a `PublicEndpoint`.
 *
 * @param jsonString - Raw JSON text to parse.
 * @returns A result holding either the parsed `PublicEndpoint` or an `SDKValidationError`.
 */
export declare function publicEndpointFromJSON(
  jsonString: string,
): SafeParseResult<PublicEndpoint, SDKValidationError>;
//# sourceMappingURL=publicendpoint.d.ts.map