-
Notifications
You must be signed in to change notification settings - Fork 10
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
use a new FeastDataStream class for feast functionality (#49)
* use a new FeastDataStream class for feast functionality * add pyi file for feast_data_stream
- Loading branch information
Showing
8 changed files
with
143 additions
and
58 deletions.
There are no files selected for viewing
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,7 +1,14 @@ | ||
from .context import Context | ||
from .datastream import DataStream | ||
from .data_stream import DataStream | ||
|
||
__all__ = [ | ||
"Context", | ||
"DataStream", | ||
] | ||
|
||
try: | ||
from .feast_data_stream import FeastDataStream | ||
|
||
__all__.append("FeastDataStream") | ||
except ImportError: | ||
pass |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,89 @@ | ||
import inspect | ||
from typing import Any, TypeVar, Union, cast, get_type_hints | ||
|
||
import pyarrow as pa | ||
from denormalized._internal import PyDataStream | ||
from denormalized.datafusion import Expr | ||
from feast import FeatureStore, Field | ||
from feast.data_source import PushMode | ||
from feast.type_map import pa_to_feast_value_type | ||
from feast.types import from_value_type | ||
|
||
from .data_stream import DataStream | ||
|
||
T = TypeVar("T") | ||
|
||
|
||
class FeastDataStreamMeta(type): | ||
"""Metaclass that modifies DataStream return types to FeastDataStream.""" | ||
|
||
def __new__(cls, name: str, bases: tuple, attrs: dict) -> Any: | ||
# Get all methods from DataStream that return DataStream | ||
datastream_methods = inspect.getmembers( | ||
DataStream, | ||
predicate=lambda x: ( | ||
inspect.isfunction(x) and get_type_hints(x).get("return") == DataStream | ||
), | ||
) | ||
|
||
# For each method that returns DataStream, create a wrapper that returns FeastDataStream | ||
for method_name, method in datastream_methods: | ||
if method_name not in attrs: # Only wrap if not already defined | ||
|
||
def create_wrapper(method_name): | ||
def wrapper(self, *args, **kwargs): | ||
result = getattr( | ||
super(cast(type, self.__class__), self), method_name | ||
)(*args, **kwargs) | ||
return self.__class__(result) | ||
|
||
# Copy original method's signature but change return type | ||
hints = get_type_hints(getattr(DataStream, method_name)) | ||
hints["return"] = ( | ||
"FeastDataStream" # Use string to handle forward reference | ||
) | ||
wrapper.__annotations__ = hints | ||
return wrapper | ||
|
||
attrs[method_name] = create_wrapper(method_name) | ||
|
||
return super().__new__(cls, name, bases, attrs) | ||
|
||
|
||
class FeastDataStream(DataStream, metaclass=FeastDataStreamMeta): | ||
"""A DataStream subclass with additional Feast-specific functionality.""" | ||
|
||
def __init__(self, stream: Union[PyDataStream, DataStream]) -> None: | ||
"""Initialize a FeastDataStream from either a PyDataStream or DataStream. | ||
Args: | ||
stream: Either a PyDataStream object or a DataStream object | ||
""" | ||
if isinstance(stream, DataStream): | ||
super().__init__(stream.ds) | ||
else: | ||
super().__init__(stream) | ||
|
||
def get_feast_schema(self) -> list[Field]: | ||
"""Get the Feast schema for this DataStream.""" | ||
return [ | ||
Field( | ||
name=s.name, dtype=from_value_type(pa_to_feast_value_type(str(s.type))) | ||
) | ||
for s in self.schema() | ||
] | ||
|
||
def write_feast_feature( | ||
self, feature_store: FeatureStore, source_name: str | ||
) -> None: | ||
"""Write the DataStream to a Feast feature store.""" | ||
|
||
def _sink_to_feast(rb: pa.RecordBatch): | ||
df = rb.to_pandas() | ||
|
||
try: | ||
feature_store.push(source_name, df, to=PushMode.ONLINE) | ||
except Exception as e: | ||
print(e) | ||
|
||
self.ds.sink_python(_sink_to_feast) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,42 @@ | ||
# feast_data_stream.pyi | ||
from typing import List, Optional, Type, Union | ||
|
||
from denormalized._internal import PyDataStream | ||
from denormalized.datafusion import Expr | ||
from feast import FeatureStore, Field | ||
|
||
from .data_stream import DataStream | ||
|
||
class FeastDataStreamMeta(type): | ||
def __new__(cls, name: str, bases: tuple, attrs: dict) -> Type[FeastDataStream]: ... | ||
|
||
class FeastDataStream(DataStream, metaclass=FeastDataStreamMeta): | ||
def __init__(self, stream: Union[PyDataStream, DataStream]) -> None: ... | ||
def select(self, expr_list: List[Expr]) -> FeastDataStream: ... | ||
def filter(self, predicate: Expr) -> FeastDataStream: ... | ||
def with_column(self, name: str, predicate: Expr) -> FeastDataStream: ... | ||
def join_on( | ||
self, right: DataStream, join_type: str, on_exprs: List[Expr] | ||
) -> FeastDataStream: ... | ||
def join( | ||
self, | ||
right: DataStream, | ||
join_type: str, | ||
left_cols: List[str], | ||
right_cols: List[str], | ||
filter: Optional[Expr] = None, | ||
) -> FeastDataStream: ... | ||
def window( | ||
self, | ||
group_exprs: List[Expr], | ||
aggr_exprs: List[Expr], | ||
window_length_millis: int, | ||
slide_millis: Optional[int] = None, | ||
) -> FeastDataStream: ... | ||
def print_schema(self) -> FeastDataStream: ... | ||
def print_plan(self) -> FeastDataStream: ... | ||
def print_physical_plan(self) -> FeastDataStream: ... | ||
def get_feast_schema(self) -> List[Field]: ... | ||
def write_feast_feature( | ||
self, feature_store: FeatureStore, source_name: str | ||
) -> None: ... |
This file was deleted.
Oops, something went wrong.