{ "$schema": "https://huggingface.co/software-mansion/react-native-executorch-spec/resolve/main/config.schema.json", "model": "phi_4_mini", "family": "phi", "capabilities": [ "text-generation" ], "backend": "xnnpack", "license": "mit", "variants": [ { "file": "phi_4_mini_xnnpack_bf16.pte", "precision": "bf16", "quantized": false, "default": true, "methods": { "enable_dynamic_shape": { "inputs": [], "outputs": [] }, "forward": { "inputs": [ { "shape": [ 1, 127 ], "dtype": "int64" }, { "shape": [ 1 ], "dtype": "int64" } ], "outputs": [ { "shape": [ 1, 200064 ], "dtype": "bfloat16" } ] }, "get_bos_id": { "inputs": [], "outputs": [] }, "get_eos_ids": { "inputs": [], "outputs": [] }, "get_max_context_len": { "inputs": [], "outputs": [] }, "get_max_seq_len": { "inputs": [], "outputs": [] }, "get_n_layers": { "inputs": [], "outputs": [] }, "get_vocab_size": { "inputs": [], "outputs": [] }, "use_kv_cache": { "inputs": [], "outputs": [] }, "use_sdpa_with_kv_cache": { "inputs": [], "outputs": [] } } }, { "file": "phi_4_mini_xnnpack_8da4w.pte", "precision": "8da4w", "quantized": true, "default": true, "methods": { "enable_dynamic_shape": { "inputs": [], "outputs": [] }, "forward": { "inputs": [ { "shape": [ 1, 2047 ], "dtype": "int64" }, { "shape": [ 1 ], "dtype": "int64" } ], "outputs": [ { "shape": [ 1, 200064 ], "dtype": "float32" } ] }, "get_bos_id": { "inputs": [], "outputs": [] }, "get_eos_ids": { "inputs": [], "outputs": [] }, "get_max_context_len": { "inputs": [], "outputs": [] }, "get_max_seq_len": { "inputs": [], "outputs": [] }, "get_n_layers": { "inputs": [], "outputs": [] }, "get_vocab_size": { "inputs": [], "outputs": [] }, "use_kv_cache": { "inputs": [], "outputs": [] }, "use_sdpa_with_kv_cache": { "inputs": [], "outputs": [] } } } ] }