{
"model_type": "depthformer_base_decoder_step",
"inputs": [
{
"name": "target_token",
"shape": [
1,
1
],
"dtype": "int32"
},
{
"name": "encoder_hidden_states",
"shape": [
1,
1006,
768
],
"dtype": "float32"
},
{
"name": "kv_cache_keys",
"shape": "dynamic",
"dtype": "float32"
},
{
"name": "kv_cache_values",
"shape": "dynamic",
"dtype": "float32"
}
],
"outputs": [
{
"name": "logits",
"shape": [
1,
16384
],
"dtype": "float32"
},
{
"name": "new_kv_cache_keys",
"shape": "dynamic",
"dtype": "float32"
},
{
"name": "new_kv_cache_values",
"shape": "dynamic",
"dtype": "float32"
}
],
"model_config": {
"embed_dim": 768,
"num_heads": 12,
"num_decoder_layers": 12,
"mlp_dim": 2048
},
"kv_cache": {
"max_length": 1806,
"num_heads": 12,
"head_dim": 64
},
"opset_version": 18,
"ir_version": 8,
"precision": "fp16"
}