This is an automated email from the ASF dual-hosted git repository.

dongjoon pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/orc-format.git


The following commit(s) were added to refs/heads/main by this push:
     new 3fecd70  MINOR: Add missing proto definition to spec (#22)
3fecd70 is described below

commit 3fecd7005111119bf873c128c81ee8f72823c989
Author: Gang Wu <[email protected]>
AuthorDate: Wed Apr 9 11:05:33 2025 +0800

    MINOR: Add missing proto definition to spec (#22)
    
    ### What changes were proposed in this pull request?
    
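    - Add the missing `bytes_on_disk` and `collection_statistics` fields of `ColumnStatistics` to the v1/v2 spec docs.
    - Fix the indentation of the `Type.Kind` enum values in the v0/v1/v2 spec docs.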
    
    
    ### Why are the changes needed?
    
    To keep the spec documents consistent with the protobuf definition.
    
    ### How was this patch tested?
    
    N/A
---
 specification/ORCv0.md | 36 ++++++++++++++++++------------------
 specification/ORCv1.md | 40 +++++++++++++++++++++-------------------
 specification/ORCv2.md | 40 +++++++++++++++++++++-------------------
 3 files changed, 60 insertions(+), 56 deletions(-)

diff --git a/specification/ORCv0.md b/specification/ORCv0.md
index 5c36cf6..daccb58 100644
--- a/specification/ORCv0.md
+++ b/specification/ORCv0.md
@@ -180,24 +180,24 @@ that contains the list of their children's type ids.
 ```
 message Type {
  enum Kind {
- BOOLEAN = 0;
- BYTE = 1;
- SHORT = 2;
- INT = 3;
- LONG = 4;
- FLOAT = 5;
- DOUBLE = 6;
- STRING = 7;
- BINARY = 8;
- TIMESTAMP = 9;
- LIST = 10;
- MAP = 11;
- STRUCT = 12;
- UNION = 13;
- DECIMAL = 14;
- DATE = 15;
- VARCHAR = 16;
- CHAR = 17;
+  BOOLEAN = 0;
+  BYTE = 1;
+  SHORT = 2;
+  INT = 3;
+  LONG = 4;
+  FLOAT = 5;
+  DOUBLE = 6;
+  STRING = 7;
+  BINARY = 8;
+  TIMESTAMP = 9;
+  LIST = 10;
+  MAP = 11;
+  STRUCT = 12;
+  UNION = 13;
+  DECIMAL = 14;
+  DATE = 15;
+  VARCHAR = 16;
+  CHAR = 17;
  }
  // the kind of this type
  required Kind kind = 1;
diff --git a/specification/ORCv1.md b/specification/ORCv1.md
index a6b12d6..83b1357 100644
--- a/specification/ORCv1.md
+++ b/specification/ORCv1.md
@@ -222,25 +222,25 @@ that contains the list of their children's type ids.
 ```
 message Type {
  enum Kind {
- BOOLEAN = 0;
- BYTE = 1;
- SHORT = 2;
- INT = 3;
- LONG = 4;
- FLOAT = 5;
- DOUBLE = 6;
- STRING = 7;
- BINARY = 8;
- TIMESTAMP = 9;
- LIST = 10;
- MAP = 11;
- STRUCT = 12;
- UNION = 13;
- DECIMAL = 14;
- DATE = 15;
- VARCHAR = 16;
- CHAR = 17;
- TIMESTAMP_INSTANT = 18;
+  BOOLEAN = 0;
+  BYTE = 1;
+  SHORT = 2;
+  INT = 3;
+  LONG = 4;
+  FLOAT = 5;
+  DOUBLE = 6;
+  STRING = 7;
+  BINARY = 8;
+  TIMESTAMP = 9;
+  LIST = 10;
+  MAP = 11;
+  STRUCT = 12;
+  UNION = 13;
+  DECIMAL = 14;
+  DATE = 15;
+  VARCHAR = 16;
+  CHAR = 17;
+  TIMESTAMP_INSTANT = 18;
  }
  // the kind of this type
  required Kind kind = 1;
@@ -281,6 +281,8 @@ message ColumnStatistics {
  optional BinaryStatistics binaryStatistics = 8;
  optional TimestampStatistics timestampStatistics = 9;
  optional bool hasNull = 10;
+ optional uint64 bytes_on_disk = 11;
+ optional CollectionStatistics collection_statistics = 12;
 }
 ```
 
diff --git a/specification/ORCv2.md b/specification/ORCv2.md
index 3411485..73daf6e 100644
--- a/specification/ORCv2.md
+++ b/specification/ORCv2.md
@@ -242,25 +242,25 @@ that contains the list of their children's type ids.
 ```
 message Type {
  enum Kind {
- BOOLEAN = 0;
- BYTE = 1;
- SHORT = 2;
- INT = 3;
- LONG = 4;
- FLOAT = 5;
- DOUBLE = 6;
- STRING = 7;
- BINARY = 8;
- TIMESTAMP = 9;
- LIST = 10;
- MAP = 11;
- STRUCT = 12;
- UNION = 13;
- DECIMAL = 14;
- DATE = 15;
- VARCHAR = 16;
- CHAR = 17;
- TIMESTAMP_INSTANT = 18;
+  BOOLEAN = 0;
+  BYTE = 1;
+  SHORT = 2;
+  INT = 3;
+  LONG = 4;
+  FLOAT = 5;
+  DOUBLE = 6;
+  STRING = 7;
+  BINARY = 8;
+  TIMESTAMP = 9;
+  LIST = 10;
+  MAP = 11;
+  STRUCT = 12;
+  UNION = 13;
+  DECIMAL = 14;
+  DATE = 15;
+  VARCHAR = 16;
+  CHAR = 17;
+  TIMESTAMP_INSTANT = 18;
  }
  // the kind of this type
  required Kind kind = 1;
@@ -301,6 +301,8 @@ message ColumnStatistics {
  optional BinaryStatistics binaryStatistics = 8;
  optional TimestampStatistics timestampStatistics = 9;
  optional bool hasNull = 10;
+ optional uint64 bytes_on_disk = 11;
+ optional CollectionStatistics collection_statistics = 12;
 }
 ```
 

Reply via email to