From 562da0613017fffdfa5893bb903cd6b11ff67294 Mon Sep 17 00:00:00 2001 From: Aditya Nambiar Date: Wed, 9 Oct 2024 13:22:32 -0700 Subject: [PATCH] query_offline: Remove format parameter from query_offline --- docs/examples/api-reference/client.py | 10 ++++---- docs/examples/getting-started/quickstart.py | 1 - .../api-reference/client/query-offline.md | 12 +++------- fennel/CHANGELOG.md | 4 ++++ fennel/client/client.py | 23 +++---------------- fennel/testing/mock_client.py | 5 ---- pyproject.toml | 2 +- 7 files changed, 16 insertions(+), 41 deletions(-) diff --git a/docs/examples/api-reference/client.py b/docs/examples/api-reference/client.py index be5a55fcd..9eec9b13c 100644 --- a/docs/examples/api-reference/client.py +++ b/docs/examples/api-reference/client.py @@ -11,6 +11,7 @@ from fennel.lib import includes, meta, inputs, outputs from fennel.testing import mock from fennel.expr.expr import col, lit, when +from fennel.client import Client webhook = Webhook(name="fennel_webhook") @@ -120,7 +121,6 @@ def test_dag_resolution(self, client): response = client.query_offline( outputs=[UserFeatures], inputs=[UserFeatures.userid], - format="pandas", input_dataframe=pd.DataFrame( {"UserFeatures.userid": [18232, 18234], "timestamp": [now, now]} ), @@ -136,7 +136,7 @@ def test_dag_resolution(self, client): ) # /docsnip - with self.assertRaises(NotImplementedError) as e: + with self.assertRaises(ValueError) as e: # docsnip query_offline_s3 from fennel.connectors import S3 @@ -153,12 +153,12 @@ def test_dag_resolution(self, client): response = client.query_offline( outputs=[UserFeatures], inputs=[UserFeatures.userid], - format="csv", timestamp_column="timestamp", input_s3=s3_input_connection, output_s3=s3_output_connection, ) # /docsnip - assert "Only pandas format is supported in MockClient" in str( - e.exception + assert ( + "input must contain a key 'input_dataframe' with the input dataframe" + in str(e.exception) ) diff --git a/docs/examples/getting-started/quickstart.py b/docs/examples/getting-started/quickstart.py index ef313b396..0dc58c05a 100644 --- a/docs/examples/getting-started/quickstart.py +++ b/docs/examples/getting-started/quickstart.py @@ -173,7 +173,6 @@ def myextractor(cls, ts: pd.Series, uids: pd.Series, sellers: pd.Series): UserSellerFeatures.seller_id, ], timestamp_column="timestamps", - format="pandas", input_dataframe=pd.DataFrame( [[1, 1, now], [1, 2, now], [1, 1, now - day], [1, 2, now - day]], columns=[ diff --git a/docs/pages/api-reference/client/query-offline.md b/docs/pages/api-reference/client/query-offline.md index faa61eff9..60129f4a2 100644 --- a/docs/pages/api-reference/client/query-offline.md +++ b/docs/pages/api-reference/client/query-offline.md @@ -21,16 +21,12 @@ either as Feature objects, or Featureset objects (in which case all features und that featureset are queried) or strings representing fully qualified feature names. - -The format of the input data - - - + A pandas dataframe object that contains the values of all features in the inputs list. Each row of the dataframe can be thought of as one entity for which features need to be queried. -Only relevant when `format` is "pandas". +This parameter is mutually exclusive with `input_s3`. @@ -39,8 +35,6 @@ In such cases, input data can be written to S3 and the location of the file is sent as `input_s3` via `S3.bucket()` function of [S3](/api-reference/connectors/s3) connector. -This parameter makes sense only when `format` isn't "pandas". - When using this option, please ensure that Fennel's data connector IAM role has the ability to execute read & list operations on this bucket - talk to Fennel support if you need help. @@ -115,7 +109,7 @@ in order to resolve the path from the input features to the output features. ===

 
 Union[pd.DataFrame, pd.Series]:
-        if format != "pandas":
-            raise NotImplementedError(
-                "Only pandas format is supported in MockClient"
-            )
         if input_dataframe is None:
             raise ValueError(
                 "input must contain a key 'input_dataframe' with the input dataframe"
diff --git a/pyproject.toml b/pyproject.toml
index 606c21761..93b0450e2 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "fennel-ai"
-version = "1.5.35"
+version = "1.5.36"
 description = "The modern realtime feature engineering platform"
 authors = ["Fennel AI "]
 packages = [{ include = "fennel" }]