/**
 * Describes a single quantization and its availability for a node type.
 */
interface ModelSupportedQuantization {
    /** Whether this quantization is allowed for this node type. */
    allowed: boolean;
    /** Maximum inference context size available for this node type and quantization. */
    maxContextSize: number;
    /** Number of bits for this supported quantization. */
    quantizationBits: number;
}

Properties

allowed: boolean

Indicates whether this quantization is allowed for this node type.

maxContextSize: number

Maximum inference context size available for this node type and quantization.

quantizationBits: number

Number of bits used by this supported quantization.