-
Notifications
You must be signed in to change notification settings - Fork 1k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
fix: Redshift push ignores schema (#3671)
* Add fully-qualified-table-name Redshift prop
  Signed-off-by: Robin Neufeld <[email protected]>
* pre-commit
  Signed-off-by: Robin Neufeld <[email protected]>
* Docstring
  Signed-off-by: Robin Neufeld <[email protected]>
* Test fully_qualified_table_name
  Signed-off-by: Robin Neufeld <[email protected]>
* Simplify logic
  Signed-off-by: Robin Neufeld <[email protected]>
* pre-commit
  Signed-off-by: Robin Neufeld <[email protected]>
* pre-commit
  Signed-off-by: Robin Neufeld <[email protected]>
* Test offline_write_batch
  Signed-off-by: Robin Neufeld <[email protected]>
* Bump to trigger CI
  Signed-off-by: Robin Neufeld <[email protected]>
* another bump for ci
  Signed-off-by: Robin Neufeld <[email protected]>
---------
Signed-off-by: Robin Neufeld <[email protected]>
- Loading branch information
Showing 4 changed files with 147 additions and 2 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
67 changes: 67 additions & 0 deletions
67
sdk/python/tests/unit/infra/offline_stores/test_redshift.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,67 @@ | ||
from unittest.mock import MagicMock, patch | ||
|
||
import pandas as pd | ||
import pyarrow as pa | ||
|
||
from feast import FeatureView | ||
from feast.infra.offline_stores import offline_utils | ||
from feast.infra.offline_stores.redshift import ( | ||
RedshiftOfflineStore, | ||
RedshiftOfflineStoreConfig, | ||
) | ||
from feast.infra.offline_stores.redshift_source import RedshiftSource | ||
from feast.infra.utils import aws_utils | ||
from feast.repo_config import RepoConfig | ||
|
||
|
||
@patch.object(aws_utils, "upload_arrow_table_to_redshift")
def test_offline_write_batch(
    mock_upload_arrow_table_to_redshift: MagicMock,
    simple_dataset_1: pd.DataFrame,
):
    """Check that ``offline_write_batch`` targets the schema-qualified table.

    ``aws_utils.upload_arrow_table_to_redshift`` is replaced by a mock, and the
    test inspects the ``table_name`` keyword argument it was called with.

    Args:
        mock_upload_arrow_table_to_redshift: Mock injected by ``patch.object``
            in place of the Redshift upload helper.
        simple_dataset_1: DataFrame fixture converted to the Arrow table that
            is written.
    """
    repo_config = RepoConfig(
        registry="registry",
        project="project",
        provider="local",
        offline_store=RedshiftOfflineStoreConfig(
            type="redshift",
            region="us-west-2",
            cluster_id="cluster_id",
            database="database",
            user="user",
            iam_role="abcdef",
            s3_staging_location="s3://bucket/path",
        ),
    )

    # The source names both a schema and a table; the assertion below expects
    # the two joined as "schema_name.table_name".
    batch_source = RedshiftSource(
        name="test_source",
        timestamp_field="ts",
        table="table_name",
        schema="schema_name",
    )
    feature_view = FeatureView(
        name="test_view",
        source=batch_source,
    )

    pa_dataset = pa.Table.from_pandas(simple_dataset_1)

    # Stub the schema lookup so the function can run: it reports the dataset's
    # own schema and column names as a (schema, column_names) pair.
    with patch.object(
        offline_utils,
        "get_pyarrow_schema_from_batch_source",
        return_value=(pa_dataset.schema, pa_dataset.column_names),
    ):
        RedshiftOfflineStore.offline_write_batch(
            repo_config, feature_view, pa_dataset, progress=None
        )

    # check that we have included the fully qualified table name
    mock_upload_arrow_table_to_redshift.assert_called_once()

    upload_kwargs = mock_upload_arrow_table_to_redshift.call_args.kwargs
    assert upload_kwargs["table_name"] == "schema_name.table_name"
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -190,3 +190,46 @@ def test_column_conflict(): | |
timestamp_field="event_timestamp", | ||
created_timestamp_column="event_timestamp", | ||
) | ||
|
||
|
||
@pytest.mark.parametrize(
    "source_kwargs,expected_name",
    [
        # database, schema and table all given: expected as three dotted parts
        (
            dict(
                database="test_database",
                schema="test_schema",
                table="test_table",
            ),
            "test_database.test_schema.test_table",
        ),
        # no schema given: "public" is expected in the schema position
        (
            dict(database="test_database", table="test_table"),
            "test_database.public.test_table",
        ),
        # table only: expected name carries no database part
        (dict(table="test_table"), "public.test_table"),
        # table already holds "schema.table": only the database is prepended
        (dict(database="test_database", table="b.c"), "test_database.b.c"),
        # table already holds three parts: expected unchanged
        (dict(database="test_database", table="a.b.c"), "a.b.c"),
        # query-based source: an empty name is expected
        (
            dict(
                database="test_database",
                schema="test_schema",
                query="select * from abc",
            ),
            "",
        ),
    ],
)
def test_redshift_fully_qualified_table_name(source_kwargs, expected_name):
    """Check ``fully_qualified_table_name`` for each parametrized source.

    Args:
        source_kwargs: Database/schema/table/query keyword arguments passed to
            ``RedshiftSource`` on top of the shared ones.
        expected_name: Value expected from
            ``redshift_options.fully_qualified_table_name``.
    """
    # Arguments shared by every case; only the location kwargs vary.
    shared_kwargs = {
        "name": "test_source",
        "timestamp_field": "event_timestamp",
        "created_timestamp_column": "created_timestamp",
        "field_mapping": {"foo": "bar"},
        "description": "test description",
        "tags": {"test": "test"},
        "owner": "[email protected]",
    }
    source = RedshiftSource(**shared_kwargs, **source_kwargs)

    actual_name = source.redshift_options.fully_qualified_table_name
    assert actual_name == expected_name