Instructions to use ApacheOne/expimodel with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use ApacheOne/expimodel with Transformers:
```python
# Load model directly
from transformers import AutoModel

model = AutoModel.from_pretrained("ApacheOne/expimodel", dtype="auto")
```
- Notebooks
- Google Colab
- Kaggle
| { | |
| "quant_cfg": { | |
| "*weight_quantizer": { | |
| "num_bits": [ | |
| 2, | |
| 1 | |
| ], | |
| "block_sizes": { | |
| "-1": 16, | |
| "type": "dynamic", | |
| "scale_bits": [ | |
| 4, | |
| 3 | |
| ] | |
| }, | |
| "enable": true | |
| }, | |
| "*input_quantizer": { | |
| "enable": false | |
| }, | |
| "nn.BatchNorm1d": { | |
| "*": { | |
| "enable": false | |
| } | |
| }, | |
| "nn.BatchNorm2d": { | |
| "*": { | |
| "enable": false | |
| } | |
| }, | |
| "nn.BatchNorm3d": { | |
| "*": { | |
| "enable": false | |
| } | |
| }, | |
| "nn.LeakyReLU": { | |
| "*": { | |
| "enable": false | |
| } | |
| }, | |
| "*lm_head*": { | |
| "enable": false | |
| }, | |
| "*proj_out.*": { | |
| "enable": false | |
| }, | |
| "*block_sparse_moe.gate*": { | |
| "enable": false | |
| }, | |
| "*router*": { | |
| "enable": false | |
| }, | |
| "*mlp.gate.*": { | |
| "enable": false | |
| }, | |
| "*mlp.shared_expert_gate.*": { | |
| "enable": false | |
| }, | |
| "*linear_attn.conv1d*": { | |
| "enable": false | |
| }, | |
| "*mixer.conv1d*": { | |
| "enable": false | |
| }, | |
| "*output_layer*": { | |
| "enable": false | |
| }, | |
| "output.*": { | |
| "enable": false | |
| }, | |
| "default": { | |
| "enable": false | |
| }, | |
| "*embed_tokens*": { | |
| "enable": false | |
| }, | |
| "*norm*": { | |
| "enable": false | |
| }, | |
| "*layernorm*": { | |
| "enable": false | |
| }, | |
| "*LayerNorm*": { | |
| "enable": false | |
| }, | |
| "*rotary*": { | |
| "enable": false | |
| }, | |
| "*pos_embed*": { | |
| "enable": false | |
| }, | |
| "*patch_embed*": { | |
| "enable": false | |
| }, | |
| "*bias*": { | |
| "enable": false | |
| }, | |
| "*final_layer2*": { | |
| "enable": false | |
| }, | |
| "*t_embedder1*": { | |
| "enable": false | |
| }, | |
| "*x_embedder*": { | |
| "enable": false | |
| }, | |
| "*visual*": { | |
| "enable": false | |
| }, | |
| "*visual.*": { | |
| "enable": false | |
| }, | |
| "model.visual*": { | |
| "enable": false | |
| }, | |
| "model.visual.*": { | |
| "enable": false | |
| }, | |
| "*model.visual*": { | |
| "enable": false | |
| }, | |
| "*model.visual.*": { | |
| "enable": false | |
| }, | |
| "*visual*weight_quantizer": { | |
| "enable": false | |
| }, | |
| "*visual*input_quantizer": { | |
| "enable": false | |
| }, | |
| "model.visual*weight_quantizer": { | |
| "enable": false | |
| }, | |
| "model.visual*input_quantizer": { | |
| "enable": false | |
| }, | |
| "*visual.blocks*": { | |
| "enable": false | |
| }, | |
| "*visual.blocks.*": { | |
| "enable": false | |
| }, | |
| "*visual.blocks.*.attn.qkv*": { | |
| "enable": false | |
| } | |
| }, | |
| "algorithm": null | |
| } |