vespa-engine · arnej27959 · Dec 15, 2025 · Dec 11, 2025 · Dec 11, 2025 · Dec 11, 2025
diff --git a/application/pom.xml b/application/pom.xml
@@ -53,6 +53,10 @@
           <groupId>javax.annotation</groupId>
           <artifactId>javax.annotation-api</artifactId>
         </exclusion>
+        <exclusion>
+          <groupId>com.dev-smart</groupId>
+          <artifactId>ubjson</artifactId>
+        </exclusion>
       </exclusions>
     </dependency>
     <dependency>

diff --git a/config-model-fat/pom.xml b/config-model-fat/pom.xml
@@ -186,6 +186,7 @@
 
                     <!-- 3rd party artifacts embedded -->
                     <i>aopalliance:aopalliance:*:*</i>
+                    <i>com.dev-smart:ubjson:*:*</i>
                     <i>com.google.errorprone:error_prone_annotations:*:*</i>
                     <i>com.google.guava:failureaccess:*:*</i>
                     <i>com.google.guava:guava:*:*</i>

diff --git a/container-dev/pom.xml b/container-dev/pom.xml
@@ -94,6 +94,10 @@
           <groupId>org.lz4</groupId>
           <artifactId>lz4-java</artifactId>
         </exclusion>
+        <exclusion>
+          <groupId>com.dev-smart</groupId>
+          <artifactId>ubjson</artifactId>
+        </exclusion>
       </exclusions>
     </dependency>
     <dependency>

diff --git a/dependency-versions/pom.xml b/dependency-versions/pom.xml
@@ -33,6 +33,7 @@
 
         <!-- DO NOT UPGRADE THESE TO A NEW MAJOR VERSION WITHOUT CHECKING FOR BINARY COMPATIBILITY -->
         <aopalliance.vespa.version>1.0</aopalliance.vespa.version>
+        <dev-smart-ubjson.vespa.version>0.1.8</dev-smart-ubjson.vespa.version>
         <error-prone-annotations.vespa.version>2.30.0</error-prone-annotations.vespa.version>
         <guava.vespa.version>33.2.1-jre</guava.vespa.version>
         <guice.vespa.version>6.0.0</guice.vespa.version>

diff --git a/model-integration/pom.xml b/model-integration/pom.xml
@@ -376,6 +376,10 @@
       <version>${testcontainers.vespa.version}</version>
       <scope>test</scope>
     </dependency>
+    <dependency>
+      <groupId>com.dev-smart</groupId>
+      <artifactId>ubjson</artifactId>
+    </dependency>
   </dependencies>
   <build>
     <plugins>

diff --git a/...tion/src/main/java/ai/vespa/rankingexpression/importer/xgboost/AbstractXGBoostParser.java b/...tion/src/main/java/ai/vespa/rankingexpression/importer/xgboost/AbstractXGBoostParser.java
@@ -0,0 +1,66 @@
+// Copyright Vespa.ai. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
+package ai.vespa.rankingexpression.importer.xgboost;
+
+/**
+ * Base class for XGBoost parsers containing shared tree-to-expression conversion logic.
+ *
+ * @author arnej
+ */
+abstract class AbstractXGBoostParser {
+
+    /**
+     * Converts an XGBoostTree node to a Vespa ranking expression string.
+     * This method handles both leaf nodes and split nodes recursively.
+     *
+     * @param node XGBoost tree node to convert.
+     * @return Vespa ranking expression for input node.
+     */
+    protected String treeToRankExp(XGBoostTree node) {
+        if (node.isLeaf()) {
+            return Double.toString(node.getLeaf());
+        } else {
+            assert node.getChildren().size() == 2;
+            String trueExp;
+            String falseExp;
+            if (node.getYes() == node.getChildren().get(0).getNodeid()) {
+                trueExp = treeToRankExp(node.getChildren().get(0));
+                falseExp = treeToRankExp(node.getChildren().get(1));
+            } else {
+                trueExp = treeToRankExp(node.getChildren().get(1));
+                falseExp = treeToRankExp(node.getChildren().get(0));
+            }
+            // xgboost uses float only internally, so round to closest float
+            float xgbSplitPoint = (float)node.getSplit_condition();
+            // but Vespa expects rank profile literals in double precision:
+            double vespaSplitPoint = xgbSplitPoint;
+            String formattedSplit = formatSplit(node.getSplit());
+            String condition;
+            if (node.getMissing() == node.getYes()) {
+                // Note: this is for handling missing features, as the backend handles comparison with NaN as false.
+                condition = "!(" + formattedSplit + " >= " + vespaSplitPoint + ")";
+            } else {
+                condition = formattedSplit + " < " + vespaSplitPoint;
+            }
+            return "if (" + condition + ", " + trueExp + ", " + falseExp + ")";
+        }
+    }
+
+    /**
+     * Formats a split field value for use in ranking expressions.
+     * If the split is a plain integer, wraps it with xgboost_input_X format.
+     * Otherwise, uses the split value as-is (for backward compatibility with JSON format).
+     *
+     * @param split The split field value from the tree node
+     * @return Formatted split expression for use in conditions
+     */
+    protected String formatSplit(String split) {
+        try {
+            Integer.parseInt(split);
+            return "xgboost_input_" + split;
+        } catch (NumberFormatException e) {
+            // Not a plain integer, use as-is (JSON format already has full attribute name)
+            return split;
+        }
+    }
+
+}
diff --git a/...ntegration/src/main/java/ai/vespa/rankingexpression/importer/xgboost/XGBoostImporter.java b/...ntegration/src/main/java/ai/vespa/rankingexpression/importer/xgboost/XGBoostImporter.java
@@ -25,6 +25,9 @@ public boolean canImport(String modelPath) {
         File modelFile = new File(modelPath);
         if ( ! modelFile.isFile()) return false;
 
+        if (modelFile.toString().endsWith(".ubj")) {
+            return XGBoostUbjParser.probe(modelPath);
+        }
         return modelFile.toString().endsWith(".json") && probe(modelFile);
     }
 
@@ -52,9 +55,15 @@ private boolean probe(File modelFile) {
     public ImportedModel importModel(String modelName, String modelPath) {
         try {
             ImportedModel model = new ImportedModel(modelName, modelPath, ImportedMlModel.ModelType.XGBOOST);
-            XGBoostParser parser = new XGBoostParser(modelPath);
-            RankingExpression expression = new RankingExpression(parser.toRankingExpression());
-            model.expression(modelName, expression);
+            if (modelPath.endsWith(".ubj")) {
+                XGBoostUbjParser parser = new XGBoostUbjParser(modelPath);
+                RankingExpression expression = new RankingExpression(parser.toRankingExpression());
+                model.expression(modelName, expression);
+            } else {
+                XGBoostParser parser = new XGBoostParser(modelPath);
+                RankingExpression expression = new RankingExpression(parser.toRankingExpression());
+                model.expression(modelName, expression);
+            }
             return model;
         } catch (IOException e) {
             throw new IllegalArgumentException("Could not import XGBoost model from '" + modelPath + "'", e);

diff --git a/...-integration/src/main/java/ai/vespa/rankingexpression/importer/xgboost/XGBoostParser.java b/...-integration/src/main/java/ai/vespa/rankingexpression/importer/xgboost/XGBoostParser.java
@@ -13,7 +13,7 @@
 /**
  * @author grace-lam
  */
-class XGBoostParser {
+class XGBoostParser extends AbstractXGBoostParser {
 
     private final List<XGBoostTree> xgboostTrees;
 
@@ -49,39 +49,4 @@ String toRankingExpression() {
         return ret.toString();
     }
 
-    /**
-     * Recursive helper function for toRankingExpression().
-     *
-     * @param node XGBoost tree node to convert.
-     * @return Vespa ranking expression for input node.
-     */
-    private String treeToRankExp(XGBoostTree node) {
-        if (node.isLeaf()) {
-            return Double.toString(node.getLeaf());
-        } else {
-            assert node.getChildren().size() == 2;
-            String trueExp;
-            String falseExp;
-            if (node.getYes() == node.getChildren().get(0).getNodeid()) {
-                trueExp = treeToRankExp(node.getChildren().get(0));
-                falseExp = treeToRankExp(node.getChildren().get(1));
-            } else {
-                trueExp = treeToRankExp(node.getChildren().get(1));
-                falseExp = treeToRankExp(node.getChildren().get(0));
-            }
-            // xgboost uses float only internally, so round to closest float
-            float xgbSplitPoint = (float)node.getSplit_condition();
-            // but Vespa expects rank profile literals in double precision:
-            double vespaSplitPoint = xgbSplitPoint;
-            String condition;
-            if (node.getMissing() == node.getYes()) {
-                // Note: this is for handling missing features, as the backend handles comparison with NaN as false.
-                condition = "!(" + node.getSplit() + " >= " + vespaSplitPoint + ")";
-            } else {
-                condition = node.getSplit() + " < " + vespaSplitPoint;
-            }
-            return "if (" + condition + ", " + trueExp + ", " + falseExp + ")";
-        }
-    }
-
 }