{
  "_commit_hash": null,
  "compression": {
    "algorithm": "quantization",
    "ignored_scopes": [
      "{re}.*Embeddings.*",
      "{re}.*__add___[0-1]",
      "{re}.*layer_norm_0",
      "{re}.*matmul_1",
      "{re}.*__truediv__*"
    ],
    "initializer": {
      "batchnorm_adaptation": {
        "num_bn_adaptation_samples": 0
      },
      "range": {
        "num_init_samples": 300,
        "type": "mean_min_max"
      }
    },
    "overflow_fix": "disable",
    "preset": "mixed",
    "scope_overrides": {
      "activations": {
        "{re}.*matmul_0": {
          "mode": "symmetric"
        }
      }
    }
  },
  "input_info": [
    {
      "sample_size": [
        8,
        128
      ],
      "type": "long"
    },
    {
      "sample_size": [
        8,
        128
      ],
      "type": "long"
    },
    {
      "sample_size": [
        8,
        128
      ],
      "type": "long"
    }
  ],
  "optimum_version": "1.4.0",
  "transformers_version": "4.23.0"
}