Add MLX 8-bit quantized model with KV cache compression

cfb84ae verified about 2 months ago

660 Bytes

	{
	"image_break_token": "[IMG_BREAK]",
	"image_end_token": "[IMG_END]",
	"image_processor": {
	"do_convert_rgb": true,
	"do_normalize": true,
	"do_rescale": true,
	"do_resize": true,
	"image_mean": [
	0.48145466,
	0.4578275,
	0.40821073
	],
	"image_processor_type": "PixtralImageProcessor",
	"image_std": [
	0.26862954,
	0.26130258,
	0.27577711
	],
	"patch_size": 14,
	"resample": 3,
	"rescale_factor": 0.00392156862745098,
	"size": {
	"longest_edge": 1540
	}
	},
	"image_token": "[IMG]",
	"patch_size": 14,
	"processor_class": "PixtralProcessor",
	"spatial_merge_size": 2
	}