feast-dev
diff --git a/‎README.md‎
Lines changed: 1 addition & 1 deletion b/‎README.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎docs/tutorials/azure/data/data_generator.py‎
Lines changed: 5 additions & 8 deletions b/‎docs/tutorials/azure/data/data_generator.py‎
Lines changed: 5 additions & 8 deletions
diff --git a/‎docs/tutorials/azure/notebooks/src/score.py‎
Lines changed: 1 addition & 1 deletion b/‎docs/tutorials/azure/notebooks/src/score.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎examples/java-demo/feature_repo/driver_repo.py‎
Lines changed: 4 additions & 2 deletions b/‎examples/java-demo/feature_repo/driver_repo.py‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎examples/java-demo/feature_repo/test.py‎
Lines changed: 5 additions & 1 deletion b/‎examples/java-demo/feature_repo/test.py‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎examples/java-demo/feature_repo/test_python_fetch.py‎
Lines changed: 1 addition & 1 deletion b/‎examples/java-demo/feature_repo/test_python_fetch.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎examples/kind-quickstart/src/utils.py‎
Lines changed: 15 additions & 9 deletions b/‎examples/kind-quickstart/src/utils.py‎
Lines changed: 15 additions & 9 deletions
diff --git a/‎examples/online_store/milvus_tutorial/milvus_example.py‎
Lines changed: 67 additions & 29 deletions b/‎examples/online_store/milvus_tutorial/milvus_example.py‎
Lines changed: 67 additions & 29 deletions
@@ -33,7 +33,7 @@ Feast allows ML platform teams to:
 
 * **Make features consistently available for training and serving** by managing an _offline store_ (to process historical data for scale-out batch scoring or model training), a low-latency _online store_ (to power real-time prediction)_,_ and a battle-tested _feature server_ (to serve pre-computed features online).
 * **Avoid data leakage** by generating point-in-time correct feature sets so data scientists can focus on feature engineering rather than debugging error-prone dataset joining logic. This ensures that future feature values do not leak to models during training.
-* **Decouple ML from data infrastructure** by providing a single data access layer that abstracts feature storage from feature retrieval, ensuring models remain portable as you move from training models to serving models, from batch models to real-time models, and from one data infra system to another.
+* **Decouple ML from data infrastructure** by providing a single data access layer that abstracts feature storage from feature retrieval, ensuring models remain portable as you move from training models to serving models, from batch models to realtime models, and from one data infra system to another.
 
 Please see our [documentation](https://docs.feast.dev/) for more information about the project.
 
 
@@ -7,8 +7,7 @@
 from pytz import FixedOffset, timezone, utc
 from random import randint
 from enum import Enum
-from sqlalchemy import create_engine, DateTime
-from datetime import datetime
+from sqlalchemy import DateTime
 
 DEFAULT_ENTITY_DF_EVENT_TIMESTAMP_COL = "event_timestamp"
 
@@ -65,7 +64,8 @@ def create_orders_df(
             )
         ]
         df.sort_values(
-            by=["e_ts", "order_id", "driver_id", "customer_id"], inplace=True,
+            by=["e_ts", "order_id", "driver_id", "customer_id"],
+            inplace=True,
         )
     else:
         df[DEFAULT_ENTITY_DF_EVENT_TIMESTAMP_COL] = [
@@ -208,9 +208,7 @@ def create_customer_daily_profile_df(customers, start_date, end_date) -> pd.Data
 
 def generate_entities(date, n_customers, n_drivers, order_count):
     end_date = date
-    before_start_date = end_date - timedelta(days=365)
     start_date = end_date - timedelta(days=7)
-    after_end_date = end_date + timedelta(days=365)
     customer_entities = [20000 + c_id for c_id in range(n_customers)]
     driver_entities = [50000 + d_id for d_id in range(n_drivers)]
     orders_df = create_orders_df(
@@ -225,7 +223,7 @@ def generate_entities(date, n_customers, n_drivers, order_count):
 
 
 def save_df_to_csv(df, table_name, dtype):
-    df.to_csv(table_name+".csv", index=False)
+    df.to_csv(table_name + ".csv", index=False)
 
 
 if __name__ == "__main__":
@@ -247,7 +245,6 @@ def save_df_to_csv(df, table_name, dtype):
 
     print(drivers_df.head())
 
-
     orders_table = "orders"
     driver_hourly_table = "driver_hourly"
     customer_profile_table = "customer_profile"
@@ -257,4 +254,4 @@ def save_df_to_csv(df, table_name, dtype):
     print("uploading drivers")
     save_df_to_csv(drivers_df, driver_hourly_table, dtype={"datetime": DateTime()})
     print("uploading customers")
-    save_df_to_csv(customer_df, customer_profile_table, dtype={"datetime": DateTime()})
+    save_df_to_csv(customer_df, customer_profile_table, dtype={"datetime": DateTime()})
@@ -11,7 +11,7 @@
 from feast.infra.offline_stores.contrib.mssql_offline_store.mssql import (
     MsSqlServerOfflineStoreConfig,
 )
-from feast.infra.online_stores.redis import RedisOnlineStoreConfig, RedisOnlineStore
+from feast.infra.online_stores.redis import RedisOnlineStoreConfig
 
 
 def init():
 
@@ -14,7 +14,10 @@
     timestamp_field="event_timestamp",
     created_timestamp_column="created",
 )
-driver = Entity(name="driver_id", description="driver id",)
+driver = Entity(
+    name="driver_id",
+    description="driver id",
+)
 driver_hourly_stats_view = FeatureView(
     name="driver_hourly_stats",
     entities=[driver],
@@ -58,4 +61,3 @@ def transformed_conv_rate(inputs: pd.DataFrame) -> pd.DataFrame:
     df["conv_rate_plus_val1"] = inputs["conv_rate"] + inputs["val_to_add"]
     df["conv_rate_plus_val2"] = inputs["conv_rate"] + inputs["val_to_add_2"]
     return df
-
 
@@ -20,9 +20,13 @@ def fetch_java():
 
     print(
         stub.GetOnlineFeatures(
-            GetOnlineFeaturesRequest(features=feature_refs, entities=entity_rows,)
+            GetOnlineFeaturesRequest(
+                features=feature_refs,
+                entities=entity_rows,
+            )
         )
     )
 
+
 if __name__ == "__main__":
     fetch_java()
@@ -15,7 +15,7 @@ def run_demo():
             },
             {
                 "driver_id": 1002,
-            }
+            },
         ],
     ).to_dict()
     for key, value in sorted(features.items()):
 
@@ -1,12 +1,18 @@
 import subprocess
 
-def port_forward(service, external_port, local_port=80) :
-  """
-  Run a background process to forward port 80 of the given `service` service to the given `external_port` port.
 
-  Returns: the process instance
-  """
-  command = ["kubectl", "port-forward", f"service/{service}", f"{external_port}:{local_port}"]
-  process = subprocess.Popen(command)
-  print(f"Port-forwarding {service} with process ID: {process.pid}")
-  return process
+def port_forward(service, external_port, local_port=80):
+    """
+    Run a background process to forward port 80 of the given `service` service to the given `external_port` port.
+
+    Returns: the process instance
+    """
+    command = [
+        "kubectl",
+        "port-forward",
+        f"service/{service}",
+        f"{external_port}:{local_port}",
+    ]
+    process = subprocess.Popen(command)
+    print(f"Port-forwarding {service} with process ID: {process.pid}")
+    return process
@@ -32,39 +32,71 @@ def generate_sample_data():
 
     # Sample product data
     products = [
-        {"id": 1, "name": "Smartphone",
-         "description": "A high-end smartphone with advanced camera features and long battery life."},
-        {"id": 2, "name": "Laptop",
-         "description": "Powerful laptop with fast processor and high-resolution display for professional use."},
-        {"id": 3, "name": "Headphones",
-         "description": "Wireless noise-cancelling headphones with premium sound quality."},
-        {"id": 4, "name": "Smartwatch",
-         "description": "Fitness tracking smartwatch with heart rate monitoring and sleep analysis."},
-        {"id": 5, "name": "Tablet",
-         "description": "Lightweight tablet with vibrant display perfect for reading and browsing."},
-        {"id": 6, "name": "Camera",
-         "description": "Professional digital camera with high-resolution sensor and interchangeable lenses."},
-        {"id": 7, "name": "Speaker",
-         "description": "Bluetooth speaker with rich bass and long battery life for outdoor use."},
-        {"id": 8, "name": "Gaming Console",
-         "description": "Next-generation gaming console with 4K graphics and fast loading times."},
-        {"id": 9, "name": "E-reader",
-         "description": "E-ink display reader with backlight for comfortable reading in any lighting condition."},
-        {"id": 10, "name": "Smart TV",
-         "description": "4K smart television with built-in streaming apps and voice control."}
+        {
+            "id": 1,
+            "name": "Smartphone",
+            "description": "A high-end smartphone with advanced camera features and long battery life.",
+        },
+        {
+            "id": 2,
+            "name": "Laptop",
+            "description": "Powerful laptop with fast processor and high-resolution display for professional use.",
+        },
+        {
+            "id": 3,
+            "name": "Headphones",
+            "description": "Wireless noise-cancelling headphones with premium sound quality.",
+        },
+        {
+            "id": 4,
+            "name": "Smartwatch",
+            "description": "Fitness tracking smartwatch with heart rate monitoring and sleep analysis.",
+        },
+        {
+            "id": 5,
+            "name": "Tablet",
+            "description": "Lightweight tablet with vibrant display perfect for reading and browsing.",
+        },
+        {
+            "id": 6,
+            "name": "Camera",
+            "description": "Professional digital camera with high-resolution sensor and interchangeable lenses.",
+        },
+        {
+            "id": 7,
+            "name": "Speaker",
+            "description": "Bluetooth speaker with rich bass and long battery life for outdoor use.",
+        },
+        {
+            "id": 8,
+            "name": "Gaming Console",
+            "description": "Next-generation gaming console with 4K graphics and fast loading times.",
+        },
+        {
+            "id": 9,
+            "name": "E-reader",
+            "description": "E-ink display reader with backlight for comfortable reading in any lighting condition.",
+        },
+        {
+            "id": 10,
+            "name": "Smart TV",
+            "description": "4K smart television with built-in streaming apps and voice control.",
+        },
     ]
 
     # Create DataFrame
     df = pd.DataFrame(products)
 
     # Generate embeddings using sentence-transformers
-    model = SentenceTransformer('all-MiniLM-L6-v2')  # Small, fast model with 384-dim embeddings
-    embeddings = model.encode(df['description'].tolist())
+    model = SentenceTransformer(
+        "all-MiniLM-L6-v2"
+    )  # Small, fast model with 384-dim embeddings
+    embeddings = model.encode(df["description"].tolist())
 
     # Add embeddings and timestamp to DataFrame
-    df['embedding'] = embeddings.tolist()
-    df['event_timestamp'] = datetime.now() - timedelta(days=1)
-    df['created_timestamp'] = datetime.now() - timedelta(days=1)
+    df["embedding"] = embeddings.tolist()
+    df["event_timestamp"] = datetime.now() - timedelta(days=1)
+    df["created_timestamp"] = datetime.now() - timedelta(days=1)
 
     # Save to parquet file
     parquet_path = "data/sample_data.parquet"
@@ -135,16 +167,20 @@ def perform_similarity_search(store, query_text: str, top_k: int = 3):
     print(f"\nPerforming similarity search for: '{query_text}'")
 
     # Generate embedding for query text
-    model = SentenceTransformer('all-MiniLM-L6-v2')
+    model = SentenceTransformer("all-MiniLM-L6-v2")
     query_embedding = model.encode(query_text).tolist()
 
     # Perform similarity search using vector embeddings with version 2 API
     try:
         results = store.retrieve_online_documents_v2(
-            features=["product_embeddings:embedding", "product_embeddings:name", "product_embeddings:description"],
+            features=[
+                "product_embeddings:embedding",
+                "product_embeddings:name",
+                "product_embeddings:description",
+            ],
             query=query_embedding,
             top_k=top_k,
-            distance_metric="L2"
+            distance_metric="L2",
         ).to_df()
 
         # Print results
@@ -184,7 +220,9 @@ def main():
     perform_similarity_search(store, "portable computing device for work", top_k=3)
 
     print("\n=== Tutorial Complete ===")
-    print("You've successfully set up Milvus with Feast and performed vector similarity searches!")
+    print(
+        "You've successfully set up Milvus with Feast and performed vector similarity searches!"
+    )
 
 
 if __name__ == "__main__":
Original file line number	Diff line number	Diff line change
`@@ -11,7 +11,7 @@`
`11`	`11`	`from feast.infra.offline_stores.contrib.mssql_offline_store.mssql import (`
`12`	`12`	`MsSqlServerOfflineStoreConfig,`
`13`	`13`	`)`
`14`		`-from feast.infra.online_stores.redis import RedisOnlineStoreConfig, RedisOnlineStore`
	`14`	`+from feast.infra.online_stores.redis import RedisOnlineStoreConfig`
`15`	`15`
`16`	`16`
`17`	`17`	`def init():`
Original file line number	Diff line number	Diff line change
`@@ -20,9 +20,13 @@ def fetch_java():`
`20`	`20`
`21`	`21`	`print(`
`22`	`22`	`stub.GetOnlineFeatures(`
`23`		`- GetOnlineFeaturesRequest(features=feature_refs, entities=entity_rows,)`
	`23`	`+ GetOnlineFeaturesRequest(`
	`24`	`+ features=feature_refs,`
	`25`	`+ entities=entity_rows,`
	`26`	`+ )`
`24`	`27`	`)`
`25`	`28`	`)`
`26`	`29`
	`30`	`+`
`27`	`31`	`if __name__ == "__main__":`
`28`	`32`	`fetch_java()`
Original file line number	Diff line number	Diff line change
`@@ -15,7 +15,7 @@ def run_demo():`
`15`	`15`	`},`
`16`	`16`	`{`
`17`	`17`	`"driver_id": 1002,`
`18`		`- }`
	`18`	`+ },`
`19`	`19`	`],`
`20`	`20`	`).to_dict()`
`21`	`21`	`for key, value in sorted(features.items()):`