mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-17 21:10:43 +00:00
Use components = 4 if possible. llama3.2-1B becomes 20 tokens/s from 18 tokens/s on my iGPUs.
260 lines
5.5 KiB
Text
260 lines
5.5 KiB
Text
[
|
|
{
|
|
"name": "Expand 1 - float32",
|
|
"operator": "Expand",
|
|
"attributes": [],
|
|
"cases": [
|
|
{
|
|
"name": "Expand 1 - float32",
|
|
"inputs": [
|
|
{
|
|
"data": [1],
|
|
"dims": [1, 1],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [1, 4],
|
|
"dims": [2],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [1, 1, 1, 1],
|
|
"dims": [1, 4],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand 2 - float32",
|
|
"operator": "Expand",
|
|
"attributes": [],
|
|
"cases": [
|
|
{
|
|
"name": "Expand 2 - float32",
|
|
"inputs": [
|
|
{
|
|
"data": [1],
|
|
"dims": [1, 1],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [1, 6],
|
|
"dims": [2],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [1, 1, 1, 1, 1, 1],
|
|
"dims": [1, 6],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand 1D - float32",
|
|
"operator": "Expand",
|
|
"attributes": [],
|
|
"cases": [
|
|
{
|
|
"name": "Expand 1D - float32",
|
|
"inputs": [
|
|
{
|
|
"data": [1],
|
|
"dims": [1],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [4],
|
|
"dims": [1],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [1, 1, 1, 1],
|
|
"dims": [4],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand 5D - float32",
|
|
"operator": "Expand",
|
|
"attributes": [],
|
|
"cases": [
|
|
{
|
|
"name": "Expand 5 - float32",
|
|
"inputs": [
|
|
{
|
|
"data": [1],
|
|
"dims": [1, 1, 1, 1, 1],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [1, 1, 1, 1, 6],
|
|
"dims": [5],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [1, 1, 1, 1, 1, 1],
|
|
"dims": [1, 1, 1, 1, 6],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand 5 - shape < input.size()",
|
|
"inputs": [
|
|
{
|
|
"data": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12],
|
|
"dims": [1, 1, 1, 2, 6],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [2, 1, 6],
|
|
"dims": [3],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12],
|
|
"dims": [1, 1, 2, 2, 6],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand in components = 1, out components = 4",
|
|
"inputs": [
|
|
{
|
|
"data": [1, 2, 3, 4, 5, 6],
|
|
"dims": [3, 2, 1],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [3, 1, 8],
|
|
"dims": [3],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [
|
|
1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5,
|
|
5, 5, 5, 5, 5, 6, 6, 6, 6, 6, 6, 6, 6
|
|
],
|
|
"dims": [3, 2, 8],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand in components = 4, out components = 4",
|
|
"inputs": [
|
|
{
|
|
"data": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16],
|
|
"dims": [1, 1, 2, 8],
|
|
"type": "float32"
|
|
},
|
|
{
|
|
"data": [2, 1, 8],
|
|
"dims": [3],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [
|
|
1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,
|
|
16
|
|
],
|
|
"dims": [1, 2, 2, 8],
|
|
"type": "float32"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand - bool",
|
|
"operator": "Expand",
|
|
"attributes": [],
|
|
"cases": [
|
|
{
|
|
"name": "Expand - last dim is divisible by 4",
|
|
"inputs": [
|
|
{
|
|
"data": [true, false, false, true],
|
|
"dims": [4],
|
|
"type": "bool"
|
|
},
|
|
{
|
|
"data": [2, 4],
|
|
"dims": [2],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [true, false, false, true, true, false, false, true],
|
|
"dims": [2, 4],
|
|
"type": "bool"
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"name": "Expand - last dim is not divisible by 4",
|
|
"inputs": [
|
|
{
|
|
"data": [true, false, false, true, true, true],
|
|
"dims": [1, 6],
|
|
"type": "bool"
|
|
},
|
|
{
|
|
"data": [3, 1],
|
|
"dims": [2],
|
|
"type": "int64"
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"data": [
|
|
true,
|
|
false,
|
|
false,
|
|
true,
|
|
true,
|
|
true,
|
|
true,
|
|
false,
|
|
false,
|
|
true,
|
|
true,
|
|
true,
|
|
true,
|
|
false,
|
|
false,
|
|
true,
|
|
true,
|
|
true
|
|
],
|
|
"dims": [3, 6],
|
|
"type": "bool"
|
|
}
|
|
]
|
|
}
|
|
]
|
|
}
|
|
]
|