public class FeatureGroupEngine extends Object
| Constructor and Description |
|---|
| FeatureGroupEngine() |
| Modifier and Type | Method and Description |
|---|---|
void |
insert(FeatureGroup featureGroup,
org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> featureData,
Storage storage,
HudiOperationType operation,
org.apache.spark.sql.SaveMode saveMode,
List<String> partitionKeys,
String hudiPrecombineKey,
Map<String,String> writeOptions) |
org.apache.spark.sql.streaming.StreamingQuery |
insertStream(FeatureGroup featureGroup,
org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> featureData,
String queryName,
String outputMode,
boolean awaitTermination,
Long timeout,
String checkpointLocation,
List<String> partitionKeys,
String hudiPrecombineKey,
Map<String,String> writeOptions)
Deprecated.
|
FeatureGroup |
save(FeatureGroup featureGroup,
org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset,
List<String> partitionKeys,
String hudiPrecombineKey,
Map<String,String> writeOptions)
Create the metadata and write the data to the online/offline feature store.
|
void |
saveDataframe(FeatureGroup featureGroup,
org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset,
Storage storage,
HudiOperationType operation,
Map<String,String> offlineWriteOptions,
Map<String,String> onlineWriteOptions,
Integer validationId) |
FeatureGroup |
saveFeatureGroupMetaData(FeatureGroup featureGroup,
List<String> partitionKeys,
String hudiPrecombineKey,
org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> featureData,
boolean saveEmpty) |
public FeatureGroup save(FeatureGroup featureGroup, org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset, List<String> partitionKeys, String hudiPrecombineKey, Map<String,String> writeOptions) throws FeatureStoreException, IOException, ParseException
Parameters:
featureGroup - Feature Group metadata object.
dataset - Spark DataFrame or RDD.
partitionKeys - A list of feature names to be used as partition keys when writing the feature data to the offline storage, defaults to empty list.
hudiPrecombineKey - A feature name to be used as a precombine key for the `TimeTravelFormat.HUDI` feature group. If the feature group has `TimeTravelFormat.HUDI` and the hudi precombine key was not specified, then the first primary key of the feature group will be used as the hudi precombine key.
writeOptions - Additional write options as key-value pairs, defaults to empty Map.
Throws:
FeatureStoreException - FeatureStoreException
IOException - IOException
ParseException - ParseException
public void insert(FeatureGroup featureGroup, org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> featureData, Storage storage, HudiOperationType operation, org.apache.spark.sql.SaveMode saveMode, List<String> partitionKeys, String hudiPrecombineKey, Map<String,String> writeOptions) throws FeatureStoreException, IOException, ParseException
@Deprecated public org.apache.spark.sql.streaming.StreamingQuery insertStream(FeatureGroup featureGroup, org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> featureData, String queryName, String outputMode, boolean awaitTermination, Long timeout, String checkpointLocation, List<String> partitionKeys, String hudiPrecombineKey, Map<String,String> writeOptions) throws FeatureStoreException, IOException, org.apache.spark.sql.streaming.StreamingQueryException, TimeoutException, ParseException
Throws:
FeatureStoreException
IOException
org.apache.spark.sql.streaming.StreamingQueryException
TimeoutException
ParseException
public void saveDataframe(FeatureGroup featureGroup, org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> dataset, Storage storage, HudiOperationType operation, Map<String,String> offlineWriteOptions, Map<String,String> onlineWriteOptions, Integer validationId) throws IOException, FeatureStoreException, ParseException
public FeatureGroup saveFeatureGroupMetaData(FeatureGroup featureGroup, List<String> partitionKeys, String hudiPrecombineKey, org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> featureData, boolean saveEmpty) throws FeatureStoreException, IOException, ParseException
Copyright © 2023. All rights reserved.