feast-dev · Felix-neko · May 31, 2025 · May 31, 2025 · Jun 1, 2025 · franciscojavierarceo
@@ -21,6 +21,7 @@ def bootstrap():
     driver_stats_df.to_parquet(
         path=str(data_path / "driver_hourly_stats.parquet"),
         allow_truncated_timestamps=True,
+        coerce_timestamps="us",
     )
 
     customer_entities = [201, 202, 203]
@@ -30,6 +31,7 @@ def bootstrap():
     customer_profile_df.to_parquet(
         path=str(data_path / "customer_daily_profile.parquet"),
         allow_truncated_timestamps=True,
+        coerce_timestamps="us",
     )
 
 

@@ -16,14 +16,8 @@
 
 
 # Entity definitions
-driver = Entity(
-    name="driver",
-    description="driver id",
-)
-customer = Entity(
-    name="customer",
-    description="customer id",
-)
+driver = Entity(name="driver", description="driver id", join_keys=["driver_id"])
+customer = Entity(name="customer", description="customer id", join_keys=["customer_id"])
 
 # Sources
 driver_hourly_stats = SparkSource(

@@ -27,27 +27,6 @@ def run_demo():
     print("\n--- Online features retrieved (instead) through a feature service---")
     fetch_online_features(store, use_feature_service=True)
 
-    print("\n--- Simulate a stream event ingestion of the hourly stats df ---")
-    event_df = pd.DataFrame.from_dict(
-        {
-            "driver_id": [1001],
-            "event_timestamp": [
-                datetime(2021, 5, 13, 10, 59, 42),
-            ],
-            "created": [
-                datetime(2021, 5, 13, 10, 59, 42),
-            ],
-            "conv_rate": [1.0],
-            "acc_rate": [1.0],
-            "avg_daily_trips": [1000],
-        }
-    )
-    print(event_df)
-    store.push("driver_stats_push_source", event_df, to=PushMode.ONLINE)
-
-    print("\n--- Online features again with updated values from a stream push---")
-    fetch_online_features(store, use_feature_service=True)
-
     print("\n--- Run feast teardown ---")
     subprocess.run(["feast", "teardown"])
 
@@ -82,8 +61,6 @@ def fetch_historical_features_entity_df(store: FeatureStore, for_batch_scoring:
             "driver_hourly_stats:conv_rate",
             "driver_hourly_stats:acc_rate",
             "driver_hourly_stats:avg_daily_trips",
-            "transformed_conv_rate:conv_rate_plus_val1",
-            "transformed_conv_rate:conv_rate_plus_val2",
         ],
     ).to_df()
     print(training_df.head())
@@ -94,23 +71,23 @@ def fetch_online_features(store, use_feature_service: bool):
         # {join_key: entity_value}
         {
             "driver_id": 1001,
+            "customer_id": 201,
             "val_to_add": 1000,
             "val_to_add_2": 2000,
         },
         {
             "driver_id": 1002,
+            "customer_id": 202,
             "val_to_add": 1001,
             "val_to_add_2": 2002,
         },
     ]
     if use_feature_service:
-        features_to_fetch = store.get_feature_service("driver_activity_v1")
+        features_to_fetch = store.get_feature_service("driver_activity")
     else:
         features_to_fetch = [
             "driver_hourly_stats:acc_rate",
             "driver_hourly_stats:avg_daily_trips",
-            "transformed_conv_rate:conv_rate_plus_val1",
-            "transformed_conv_rate:conv_rate_plus_val2",
         ]
     returned_features = store.get_online_features(
         features=features_to_fetch,