5353import java .util .stream .Stream ;
5454
5555import static org .apache .hudi .common .testutils .RawTripTestPayload .recordToString ;
56+ import static org .apache .hudi .config .HoodieBootstrapConfig .DATA_QUERIES_ONLY ;
5657import static org .junit .jupiter .api .Assertions .assertEquals ;
5758
5859/**
@@ -78,6 +79,7 @@ public class TestBootstrapRead extends HoodieSparkClientTestBase {
7879
// Columns that the table comparison drops from both DataFrames before the
// full-row comparison, and selects together with "_row_key" for a separate
// key/partition-value comparison.
7980 protected String [] partitionCols ;
// Columns dropped from both the regular Hudi read and the bootstrap read before
// their rows are compared: four "_hoodie_*" columns plus "city_to_state".
8081 protected static String [] dropColumns = {"_hoodie_commit_time" , "_hoodie_commit_seqno" , "_hoodie_record_key" , "_hoodie_file_name" , "city_to_state" };
// NOTE(review): not referenced in the visible part of this file -- the
// DATA_QUERIES_ONLY comparisons drop "city_to_state" by literal instead.
// Presumably consumed elsewhere (e.g. by a subclass); confirm it is actually used.
82+ protected static String [] fastBootstrapDropCols = {"city_to_state" , "partition_path" };
8183
8284 @ BeforeEach
8385 public void setUp () throws Exception {
@@ -227,12 +229,16 @@ protected void compareTables() {
227229 }
228230 Dataset <Row > hudiDf = sparkSession .read ().options (readOpts ).format ("hudi" ).load (hudiBasePath );
229231 Dataset <Row > bootstrapDf = sparkSession .read ().format ("hudi" ).load (bootstrapTargetPath );
232+ Dataset <Row > fastBootstrapDf = sparkSession .read ().format ("hudi" ).option (DATA_QUERIES_ONLY .key (), "true" ).load (bootstrapTargetPath );
230233 if (nPartitions == 0 ) {
234+ compareDf (fastBootstrapDf .drop ("city_to_state" ), bootstrapDf .drop (dropColumns ).drop ("_hoodie_partition_path" ));
231235 compareDf (hudiDf .drop (dropColumns ), bootstrapDf .drop (dropColumns ));
232236 return ;
233237 }
234238 compareDf (hudiDf .drop (dropColumns ).drop (partitionCols ), bootstrapDf .drop (dropColumns ).drop (partitionCols ));
239+ compareDf (fastBootstrapDf .drop ("city_to_state" ).drop (partitionCols ), bootstrapDf .drop (dropColumns ).drop ("_hoodie_partition_path" ).drop (partitionCols ));
235240 compareDf (hudiDf .select ("_row_key" ,partitionCols ), bootstrapDf .select ("_row_key" ,partitionCols ));
241+ compareDf (fastBootstrapDf .select ("_row_key" ,partitionCols ), bootstrapDf .select ("_row_key" ,partitionCols ));
236242 }
237243
238244 protected void compareDf (Dataset <Row > df1 , Dataset <Row > df2 ) {
0 commit comments