{ "dtype": "int8_int8_int8", "input_info": null, "optimum_version": "1.26.1", "quantization_config": { "dataset": "contextual", "ignored_scope": null, "num_samples": 50, "processor": null, "quantization_configs": { "lm_model": { "bits": 8, "dataset": null, "dtype": "int8", "fast_bias_correction": true, "ignored_scope": null, "model_type": "transformer", "num_samples": null, "overflow_fix": "disable", "processor": null, "smooth_quant_alpha": null, "sym": false, "tokenizer": null, "trust_remote_code": false }, "text_embeddings_model": { "all_layers": null, "backup_precision": null, "bits": 8, "dataset": null, "dtype": "int8", "gptq": null, "group_size": -1, "ignored_scope": null, "lora_correction": null, "num_samples": null, "processor": null, "quant_method": "default", "ratio": 1.0, "scale_estimation": null, "sensitivity_metric": null, "sym": false, "tokenizer": null, "trust_remote_code": false }, "vision_embeddings_model": { "all_layers": null, "backup_precision": null, "bits": 8, "dataset": null, "dtype": "int8", "gptq": null, "group_size": -1, "ignored_scope": null, "lora_correction": null, "num_samples": null, "processor": null, "quant_method": "default", "ratio": 1.0, "scale_estimation": null, "sensitivity_metric": null, "sym": false, "tokenizer": null, "trust_remote_code": false } }, "tokenizer": null, "trust_remote_code": false }, "save_onnx_model": false, "transformers_version": "4.52.4" }