Skip to content

Commit 49a9438

Browse files
committed
Bump dependency versions; Bump ONNX version; Update README
1 parent e36ed46 commit 49a9438

File tree

4 files changed

+79
-20
lines changed

4 files changed

+79
-20
lines changed

README.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -89,7 +89,7 @@ If your input shapes are static, feel free to wrap your calls into it in a facad
8989

9090
ONNX-Scala is cross-built against Scala JVM, Scala.js/JavaScript and Scala Native (for Scala 3 / Dotty )
9191

92-
Currently at ONNX 1.14.1 (Backward compatible to at least 1.2.0 for the full model API, 1.7.0 for the fine-grained API), ONNX Runtime 1.16.3.
92+
Currently at ONNX 1.17.0 (Backward compatible to at least 1.2.0 for the full model API, 1.7.0 for the fine-grained API), ONNX Runtime 1.20.0.
9393

9494
### Fine-grained API
9595
A complete\*, versioned, numerically generic, type-safe / typeful API to ONNX(Open Neural Network eXchange, an open format to represent deep learning and classical machine learning models), derived from the Protobuf definitions and the operator schemas (defined in C++).

build.sbt

+2-2
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ import scala.sys.process.Process
33
import sbtcrossproject.CrossPlugin.autoImport.{crossProject, CrossType}
44

55
//val dottyVersion = dottyLatestNightlyBuild.get
6-
val dottyVersion = "3.6.2"
6+
val dottyVersion = "3.6.3"
77
val spireVersion = "0.18.0"
88
val scalaTestVersion = "3.2.19"
99

@@ -30,7 +30,7 @@ lazy val commonSettings = Seq(
3030
"-deprecation",
3131
// "-release:21",
3232
"-rewrite",
33-
"-source:3.4-migration"
33+
"-source:3.6-migration"
3434
),
3535
versionPolicyIntention := Compatibility.BinaryCompatible, // As long as we are pre 1.0.0, BinaryCompatible for a patch version bump and None for a minor version bump
3636
versionScheme := Some("early-semver"),

project/plugins.sbt

+1-1
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ addDependencyTreePlugin
22
addSbtPlugin("ch.epfl.scala" % "sbt-version-policy" % "3.2.1")
33
addSbtPlugin("org.portable-scala" % "sbt-scalajs-crossproject" % "1.3.2")
44
addSbtPlugin("org.portable-scala" % "sbt-scala-native-crossproject" % "1.3.2")
5-
addSbtPlugin("org.scala-js" % "sbt-scalajs" % "1.18.1")
5+
addSbtPlugin("org.scala-js" % "sbt-scalajs" % "1.18.2")
66
addSbtPlugin("org.scala-native" % "sbt-scala-native" % "0.5.6")
77
addSbtPlugin("ch.epfl.scala" % "sbt-scalafix" % "0.13.0")
88
addSbtPlugin("org.scalameta" % "sbt-scalafmt" % "2.5.2")

proto/src/main/protobuf/onnx.proto

+75-16
Original file line numberDiff line numberDiff line change
@@ -96,13 +96,21 @@ enum Version {
9696
// - Implicitly add inference graph into each TrainingInfoProto's algorithm.
9797
IR_VERSION_2020_5_8 = 0x0000000000000007;
9898

99-
// IR VERSION 8 published on <TBD>
99+
// IR VERSION 8 published on July 30, 2021
100100
// Introduce TypeProto.SparseTensor
101101
// Introduce TypeProto.Optional
102102
// Added a list of FunctionProtos local to the model
103103
// Deprecated since_version and operator status from FunctionProto
104-
IR_VERSION = 0x0000000000000008;
104+
IR_VERSION_2021_7_30 = 0x0000000000000008;
105105

106+
// IR VERSION 9 published on May 5, 2023
107+
// Added AttributeProto to FunctionProto so that default attribute values can be set.
108+
// Added FLOAT8E4M3FN, FLOAT8E4M3FNUZ, FLOAT8E5M2, FLOAT8E5M2FNUZ.
109+
IR_VERSION_2023_5_5 = 0x0000000000000009;
110+
111+
// IR VERSION 10 published on TBD
112+
// Added UINT4, INT4.
113+
IR_VERSION = 0x000000000000000A;
106114
}
107115

108116
// Attributes
@@ -112,6 +120,8 @@ enum Version {
112120
// An AttributeProto MUST contain the name field, and *only one* of the
113121
// following content fields, effectively enforcing a C/C++ union equivalent.
114122
message AttributeProto {
123+
reserved 12, 16 to 19;
124+
reserved "v";
115125

116126
// Note: this enum is structurally identical to the OpSchema::AttrType
117127
// enum defined in schema.h. If you rev one, you likely need to rev the other.
@@ -184,6 +194,8 @@ message ValueInfoProto {
184194
optional TypeProto type = 2;
185195
// A human-readable documentation for this value. Markdown is allowed.
186196
optional string doc_string = 3;
197+
// Named metadata values; keys should be distinct.
198+
repeated StringStringEntryProto metadata_props = 4;
187199
}
188200

189201
// Nodes
@@ -198,19 +210,24 @@ message NodeProto {
198210
repeated string output = 2; // namespace Value
199211

200212
// An optional identifier for this node in a graph.
201-
// This field MAY be absent in ths version of the IR.
213+
// This field MAY be absent in this version of the IR.
202214
optional string name = 3; // namespace Node
203215

204216
// The symbolic identifier of the Operator to execute.
205217
optional string op_type = 4; // namespace Operator
206218
// The domain of the OperatorSet that specifies the operator named by op_type.
207219
optional string domain = 7; // namespace Domain
220+
// Overload identifier, used only to map this to a model-local function.
221+
optional string overload = 8;
208222

209223
// Additional named attributes.
210224
repeated AttributeProto attribute = 5;
211225

212226
// A human-readable documentation for this node. Markdown is allowed.
213227
optional string doc_string = 6;
228+
229+
// Named metadata values; keys should be distinct.
230+
repeated StringStringEntryProto metadata_props = 9;
214231
}
215232

216233
// Training information
@@ -255,7 +272,7 @@ message TrainingInfoProto {
255272
//
256273
// An execution of the training algorithm step is performed by executing the
257274
// graph obtained by combining the inference graph (namely "ModelProto.graph")
258-
// and the "algorithm" graph. That is, the actual the actual
275+
// and the "algorithm" graph. That is, the actual
259276
// input/initializer/output/node/value_info/sparse_initializer list of
260277
// the training graph is the concatenation of
261278
// "ModelProto.graph.input/initializer/output/node/value_info/sparse_initializer"
@@ -395,9 +412,9 @@ message ModelProto {
395412

396413
// A list of function protos local to the model.
397414
//
398-
// Name of the function "FunctionProto.name" should be unique within the domain "FunctionProto.domain".
415+
// The (domain, name, overload) tuple must be unique across the function protos in this list.
399416
// In case of any conflicts the behavior (whether the model local functions are given higher priority,
400-
// or standard opserator sets are given higher priotity or this is treated as error) is defined by
417+
// or standard operator sets are given higher priotity or this is treated as error) is defined by
401418
// the runtimes.
402419
//
403420
// The operator sets imported by FunctionProto should be compatible with the ones
@@ -469,6 +486,9 @@ message GraphProto {
469486
// which means, tensor 'a_scale' and tensor 'a_zero_point' are scale and zero point of tensor 'a' in the model.
470487
repeated TensorAnnotation quantization_annotation = 14;
471488

489+
// Named metadata values; keys should be distinct.
490+
repeated StringStringEntryProto metadata_props = 16;
491+
472492
reserved 3, 4, 6 to 9;
473493
reserved "ir_version", "producer_version", "producer_tag", "domain";
474494
}
@@ -505,6 +525,21 @@ message TensorProto {
505525
// This format has 1 sign bit, 8 exponent bits, and 7 mantissa bits.
506526
BFLOAT16 = 16;
507527

528+
// Non-IEEE floating-point format based on papers
529+
// FP8 Formats for Deep Learning, https://arxiv.org/abs/2209.05433,
530+
// 8-bit Numerical Formats For Deep Neural Networks, https://arxiv.org/pdf/2206.02915.pdf.
531+
// Operators supported FP8 are Cast, CastLike, QuantizeLinear, DequantizeLinear.
532+
// The computation usually happens inside a block quantize / dequantize
533+
// fused by the runtime.
534+
FLOAT8E4M3FN = 17; // float 8, mostly used for coefficients, supports nan, not inf
535+
FLOAT8E4M3FNUZ = 18; // float 8, mostly used for coefficients, supports nan, not inf, no negative zero
536+
FLOAT8E5M2 = 19; // follows IEEE 754, supports nan, inf, mostly used for gradients
537+
FLOAT8E5M2FNUZ = 20; // follows IEEE 754, supports nan, not inf, mostly used for gradients, no negative zero
538+
539+
// 4-bit data-types
540+
UINT4 = 21; // Unsigned integer in range [0, 15]
541+
INT4 = 22; // Signed integer in range [-8, 7], using two's-complement representation
542+
508543
// Future extensions go here.
509544
}
510545

@@ -538,11 +573,13 @@ message TensorProto {
538573
// When this field is present, the data_type field MUST be FLOAT or COMPLEX64.
539574
repeated float float_data = 4 [packed = true];
540575

541-
// For int32, uint8, int8, uint16, int16, bool, and float16 values
542-
// float16 values must be bit-wise converted to an uint16_t prior
576+
// For int32, uint8, int8, uint16, int16, uint4, int4, bool, float8 and float16 values
577+
// float16 and float8 values must be bit-wise converted to an uint16_t prior
543578
// to writing to the buffer.
579+
// uint4 and int4 values must be packed to 4bitx2 prior to writing to the buffer, the first element is stored in
580+
// the 4 LSB and the second element is stored in the 4 MSB.
544581
// When this field is present, the data_type field MUST be
545-
// INT32, INT16, INT8, UINT16, UINT8, BOOL, or FLOAT16
582+
// INT32, INT16, INT8, INT4, UINT16, UINT8, UINT4, BOOL, FLOAT16, BFLOAT16, FLOAT8E4M3FN, FLOAT8E4M3FNUZ, FLOAT8E5M2, FLOAT8E5M2FNUZ
546583
repeated int32 int32_data = 5 [packed = true];
547584

548585
// For strings.
@@ -572,6 +609,7 @@ message TensorProto {
572609
// Complex64 elements must be written as two consecutive FLOAT values, real component first.
573610
// Complex128 elements must be written as two consecutive DOUBLE values, real component first.
574611
// Boolean type MUST be written one byte per tensor element (00000001 for true, 00000000 for false).
612+
// uint4 and int4 values must be packed to 4bitx2, the first element is stored in the 4 LSB and the second element is stored in the 4 MSB.
575613
//
576614
// Note: the advantage of specific field rather than the raw_data field is
577615
// that in some cases (e.g. int data), protobuf does a better packing via
@@ -614,6 +652,9 @@ message TensorProto {
614652
// When this field is present, the data_type field MUST be
615653
// UINT32 or UINT64
616654
repeated uint64 uint64_data = 11 [packed = true];
655+
656+
// Named metadata values; keys should be distinct.
657+
repeated StringStringEntryProto metadata_props = 16;
617658
}
618659

619660
// A serialized sparse-tensor value
@@ -760,9 +801,8 @@ enum OperatorStatus {
760801
}
761802

762803
message FunctionProto {
763-
// The name of the function, similar usage of op_type in OperatorProto.
764-
// Combined with FunctionProto.domain, this forms the unique identity of
765-
// the FunctionProto.
804+
// The name of the function, similar to op_type in NodeProto.
805+
// This is part of the unique-id (domain, name, overload) of FunctionProtos in a model.
766806
optional string name = 1;
767807

768808
// Deprecated since IR Version 8
@@ -779,9 +819,16 @@ message FunctionProto {
779819
repeated string input = 4;
780820
repeated string output = 5;
781821

782-
// The attributes of the function.
822+
// The attribute parameters of the function.
823+
// It is for function parameters without default values.
783824
repeated string attribute = 6;
784825

826+
// The attribute protos of the function.
827+
// It is for function attributes with default values.
828+
// A function attribute shall be represented either as
829+
// a string attribute or an AttributeProto, not both.
830+
repeated AttributeProto attribute_proto = 11;
831+
785832
// The nodes in the function.
786833
repeated NodeProto node = 7;
787834
// A human-readable documentation for this function. Markdown is allowed.
@@ -802,11 +849,23 @@ message FunctionProto {
802849

803850
repeated OperatorSetIdProto opset_import = 9;
804851

805-
// The domain which this function belongs to. Combined with FunctionProto.name, this forms the unique identity of
806-
// the FunctionProto.
852+
// The domain which this function belongs to.
853+
// This is part of the unique-id (domain, name, overload) of FunctionProtos in a model.
807854
optional string domain = 10;
808-
}
809855

856+
// The overload identifier of the function.
857+
// This is part of the unique-id (domain, name, overload) of FunctionProtos in a model.
858+
optional string overload = 13;
859+
860+
// Information for the values in the function. The ValueInfoProto.name's
861+
// must be distinct and refer to names in the function (including inputs,
862+
// outputs, and intermediate values). It is optional for a value to appear
863+
// in value_info list.
864+
repeated ValueInfoProto value_info = 12;
865+
866+
// Named metadata values; keys should be distinct.
867+
repeated StringStringEntryProto metadata_props = 14;
868+
}
810869

811870
// For using protobuf-lite
812871
option optimize_for = LITE_RUNTIME;

0 commit comments

Comments
 (0)