Skip to content

Commit d9591f2

Browse files
authored
[xnn update prep] Update Dtypes for XNNPACK (#11505)
Update our dtypes table in XNNPACK.
1 parent acc3e25 commit d9591f2

File tree

4 files changed

+30
-0
lines changed

4 files changed

+30
-0
lines changed

backends/xnnpack/runtime/XNNCompiler.cpp

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -121,6 +121,14 @@ xnn_datatype getDataType(const DataType& data_type) {
121121
return xnn_datatype::xnn_datatype_qdint8;
122122
case DataType::xnn_datatype_qbint4:
123123
return xnn_datatype::xnn_datatype_qbint4;
124+
case DataType::xnn_datatype_qpint8:
125+
return xnn_datatype::xnn_datatype_qpint8;
126+
case DataType::xnn_datatype_int32:
127+
return xnn_datatype::xnn_datatype_int32;
128+
case DataType::xnn_datatype_pfp32:
129+
return xnn_datatype::xnn_datatype_pfp32;
130+
case DataType::xnn_datatype_bf16:
131+
return xnn_datatype::xnn_datatype_bf16;
124132
default:
125133
return xnn_datatype::xnn_datatype_invalid;
126134
}

backends/xnnpack/serialization/runtime_schema.fbs

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -29,6 +29,15 @@ enum XNNDatatype : short {
2929
xnn_datatype_qdint8 = 9,
3030
/// Quantized 4-bit signed integer with shared blockwise quantization parameters.
3131
xnn_datatype_qbint4 = 10,
32+
/// Dynamically quantized 8-bit signed integers packed with their per-row
33+
/// quantization parameters.
34+
xnn_datatype_qpint8 = 11,
35+
/// 32-bit signed integers.
36+
xnn_datatype_int32 = 12,
37+
/// IEEE754 single-precision packed floating-point.
38+
xnn_datatype_pfp32 = 13,
39+
/// BFloat16, i.e. the upper 16 bits of a float32.
40+
xnn_datatype_bf16 = 14,
3241
}
3342

3443
// type of quantization

backends/xnnpack/serialization/schema.fbs

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -29,6 +29,15 @@ enum XNNDatatype : short {
2929
xnn_datatype_qdint8 = 9,
3030
/// Quantized 4-bit signed integer with shared blockwise quantization parameters.
3131
xnn_datatype_qbint4 = 10,
32+
/// Dynamically quantized 8-bit signed integers packed with their per-row
33+
/// quantization parameters.
34+
xnn_datatype_qpint8 = 11,
35+
/// 32-bit signed integers.
36+
xnn_datatype_int32 = 12,
37+
/// IEEE754 single-precision packed floating-point.
38+
xnn_datatype_pfp32 = 13,
39+
/// BFloat16, i.e. the upper 16 bits of a float32.
40+
xnn_datatype_bf16 = 14,
3241
}
3342

3443
// type of quantization

backends/xnnpack/serialization/xnnpack_graph_schema.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -430,6 +430,10 @@ class XNNDatatype(IntEnum):
430430
xnn_datatype_qcint4 = 8
431431
xnn_datatype_qdint8 = 9
432432
xnn_datatype_qbint4 = 10
433+
xnn_datatype_qpint8 = 11
434+
xnn_datatype_int32 = 12
435+
xnn_datatype_pfp32 = 13
436+
xnn_datatype_bf16 = 14
433437

434438

435439
@dataclass

0 commit comments

Comments
 (0)