apache · simhadri-g · Aug 1, 2023 · Aug 2, 2023 · Aug 17, 2023 · Aug 17, 2023
diff --git a/core/src/main/java/org/apache/iceberg/puffin/StandardBlobTypes.java b/core/src/main/java/org/apache/iceberg/puffin/StandardBlobTypes.java
@@ -27,6 +27,20 @@ private StandardBlobTypes() {}
    */
   public static final String APACHE_DATASKETCHES_THETA_V1 = "apache-datasketches-theta-v1";
 
+  /**
+   * A serialized form of a Hive column statistics object. The full list of available statistics is
+   * provided in the <a
+   * href="https://cwiki.apache.org/confluence/display/Hive/StatsDev#StatsDev-ColumnStatistics">Hive
+   * column statistics wiki</a>.
+   */
+  public static final String HIVE_COLUMN_STATS_OBJ = "hive-column-statistics-obj";
+
+  /**
+   * A serialized form of a "compact" KLL sketch produced by the <a
+   * href="https://datasketches.apache.org/">Apache DataSketches</a> library.
+   */
+  public static final String APACHE_DATASKETCHES_KLL_SKETCH = "apache-datasketches-kll-sketch";
+
   /** A serialized deletion vector according to the Iceberg spec */
   public static final String DV_V1 = "deletion-vector-v1";
 }
diff --git a/format/puffin-spec.md b/format/puffin-spec.md
@@ -181,6 +181,23 @@ for Puffin v1.
 [roaring-bitmap-portable-serialization]: https://github.com/RoaringBitmap/RoaringFormatSpec?tab=readme-ov-file#extension-for-64-bit-implementations
 [roaring-bitmap-general-layout]: https://github.com/RoaringBitmap/RoaringFormatSpec?tab=readme-ov-file#general-layout
 
+#### `hive-column-statistics-obj` blob type
+
+A serialized form of a Hive ColumnStatsObject.
+
+The ColumnStatsObject carries the column name and type together with statistics such as histograms, NDV (number of distinct values), min and max values, number of nulls, and number of trues.
+The full list of supported statistics is given in the Hive
+[ColumnStatistics](https://cwiki.apache.org/confluence/display/Hive/StatsDev#StatsDev-ColumnStatistics) table.
+
+#### `apache-datasketches-kll-sketch` blob type
+
+A serialized form of a "compact" KLL sketch produced by the [Apache
+DataSketches](https://datasketches.apache.org/) library.
+The KLL sketch is a very compact quantiles sketch with a lazy compaction
+scheme and nearly optimal accuracy per bit.
+
+Histograms are derived from this sketch.
+
 ### Compression codecs
 
 The data can also be uncompressed. If it is compressed the codec should be one of