From 1cc10d63723da51bd0e932e7222e185e266d1882 Mon Sep 17 00:00:00 2001 From: gwaramadze <1044831+gwaramadze@users.noreply.github.com> Date: Mon, 13 Jan 2025 08:02:16 +0000 Subject: [PATCH] Update documentation --- docs/api-reference/dataframe.md | 26 ++++++------ docs/api-reference/quixstreams.md | 68 ++++++++++++++++++------------- docs/api-reference/sources.md | 20 +++++++-- 3 files changed, 69 insertions(+), 45 deletions(-) diff --git a/docs/api-reference/dataframe.md b/docs/api-reference/dataframe.md index ce7a51de5..1c80813c1 100644 --- a/docs/api-reference/dataframe.md +++ b/docs/api-reference/dataframe.md @@ -1008,7 +1008,7 @@ operations, but branches can still be generated from its originating SDF. class StreamingSeries(BaseStreaming) ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L70) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L60) `StreamingSeries` are typically generated by `StreamingDataframes` when getting elements from, or performing certain operations on, a `StreamingDataframe`, @@ -1075,7 +1075,7 @@ def from_apply_callback(cls, func: ApplyWithMetadataCallback, sdf_id: int) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L132) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L126) Create a StreamingSeries from a function. @@ -1104,7 +1104,7 @@ instance of `StreamingSeries` def apply(func: ApplyCallback) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L155) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L149) Add a callable to the execution list for this series. @@ -1156,7 +1156,7 @@ a new `StreamingSeries` with the new callable added def compose_returning() -> ReturningExecutor ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L189) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L183) Compose a list of functions from this StreamingSeries and its parents into one @@ -1187,7 +1187,7 @@ def compose( None]] = None) -> VoidExecutor ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L204) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L198) Compose all functions of this StreamingSeries into one big closure. @@ -1245,7 +1245,7 @@ def test(value: Any, ctx: Optional[MessageContext] = None) -> Any ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L248) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L242) A shorthand to test `StreamingSeries` with provided value @@ -1277,7 +1277,7 @@ result of `StreamingSeries` def isin(other: Container) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L304) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L313) Check if series value is in "other". @@ -1322,7 +1322,7 @@ new StreamingSeries def contains(other: Union[Self, object]) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L331) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L344) Check if series value contains "other" @@ -1367,7 +1367,7 @@ new StreamingSeries def is_(other: Union[Self, object]) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L356) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L369) Check if series value refers to the same object as `other` @@ -1409,7 +1409,7 @@ new StreamingSeries def isnot(other: Union[Self, object]) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L379) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L392) Check if series value does not refer to the same object as `other` @@ -1452,7 +1452,7 @@ new StreamingSeries def isnull() -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L403) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L416) Check if series value is None. @@ -1489,7 +1489,7 @@ new StreamingSeries def notnull() -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L426) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L439) Check if series value is not None. @@ -1526,7 +1526,7 @@ new StreamingSeries def abs() -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L449) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L462) Get absolute value of the series value. diff --git a/docs/api-reference/quixstreams.md b/docs/api-reference/quixstreams.md index 9b21e0309..d25cf868d 100644 --- a/docs/api-reference/quixstreams.md +++ b/docs/api-reference/quixstreams.md @@ -1641,7 +1641,7 @@ operations, but branches can still be generated from its originating SDF. class StreamingSeries(BaseStreaming) ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L70) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L60) `StreamingSeries` are typically generated by `StreamingDataframes` when getting elements from, or performing certain operations on, a `StreamingDataframe`, @@ -1700,7 +1700,7 @@ def from_apply_callback(cls, func: ApplyWithMetadataCallback, sdf_id: int) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L132) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L126) Create a StreamingSeries from a function. @@ -1723,7 +1723,7 @@ instance of `StreamingSeries` def apply(func: ApplyCallback) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L155) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L149) Add a callable to the execution list for this series. @@ -1767,7 +1767,7 @@ a new `StreamingSeries` with the new callable added def compose_returning() -> ReturningExecutor ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L189) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L183) Compose a list of functions from this StreamingSeries and its parents into one @@ -1794,7 +1794,7 @@ def compose( None]] = None) -> VoidExecutor ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L204) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L198) Compose all functions of this StreamingSeries into one big closure. @@ -1844,7 +1844,7 @@ def test(value: Any, ctx: Optional[MessageContext] = None) -> Any ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L248) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L242) A shorthand to test `StreamingSeries` with provided value @@ -1870,7 +1870,7 @@ result of `StreamingSeries` def isin(other: Container) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L304) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L313) Check if series value is in "other". @@ -1907,7 +1907,7 @@ new StreamingSeries def contains(other: Union[Self, object]) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L331) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L344) Check if series value contains "other" @@ -1944,7 +1944,7 @@ new StreamingSeries def is_(other: Union[Self, object]) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L356) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L369) Check if series value refers to the same object as `other` @@ -1978,7 +1978,7 @@ new StreamingSeries def isnot(other: Union[Self, object]) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L379) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L392) Check if series value does not refer to the same object as `other` @@ -2013,7 +2013,7 @@ new StreamingSeries def isnull() -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L403) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L416) Check if series value is None. @@ -2044,7 +2044,7 @@ new StreamingSeries def notnull() -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L426) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L439) Check if series value is not None. @@ -2075,7 +2075,7 @@ new StreamingSeries def abs() -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L449) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/series.py#L462) Get absolute value of the series value. @@ -2370,7 +2370,7 @@ class FixedTimeWindow() def final() -> "StreamingDataFrame" ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/windows/time_based.py#L129) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/windows/time_based.py#L127) Apply the window aggregation and return results only when the windows are closed. @@ -2401,7 +2401,7 @@ can remain unprocessed until the message the same key is received. def current() -> "StreamingDataFrame" ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/windows/time_based.py#L167) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/windows/time_based.py#L165) Apply the window transformation to the StreamingDataFrame to return results for each updated window. @@ -2429,7 +2429,7 @@ regardless of whether the window is closed or not. ```python def get_window_ranges(timestamp_ms: int, duration_ms: int, - step_ms: Optional[int] = None) -> Deque[Tuple[int, int]] + step_ms: Optional[int] = None) -> Deque[tuple[int, int]] ``` [[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/dataframe/windows/base.py#L17) @@ -2666,7 +2666,7 @@ def add_apply(func: Union[ metadata: bool = False) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L186) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L190) Add an "apply" function to the Stream. @@ -2697,7 +2697,7 @@ def add_update(func: Union[UpdateCallback, UpdateWithMetadataCallback], metadata: bool = False) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L227) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L231) Add an "update" function to the Stream, that will mutate the input value. @@ -2725,7 +2725,7 @@ def add_transform(func: Union[TransformCallback, TransformExpandedCallback], expand: bool = False) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L261) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L265) Add a "transform" function to the Stream, that will mutate the input value. @@ -2754,7 +2754,7 @@ a new Stream derived from the current one def diff(other: Self) -> Self ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L285) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L289) Takes the difference between Streams `self` and `other` based on their last @@ -2787,7 +2787,7 @@ a new independent `Stream` instance whose root begins at the diff def root_path(allow_splits=True) -> List[Self] ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L350) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L354) Return a list of all parent Streams including the node itself. @@ -2807,7 +2807,7 @@ a list of `Stream` objects def full_tree() -> List[Self] ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L371) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L375) Starts at tree root and finds every Stream in the tree (including splits). @@ -2829,7 +2829,7 @@ def compose( None]] = None) -> VoidExecutor ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L378) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L382) Generate an "executor" closure by mapping all relatives of this `Stream` and @@ -2861,7 +2861,7 @@ the stream has transform functions in the tree. Default - True. def compose_returning() -> ReturningExecutor ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L435) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/core/stream/stream.py#L439) Compose a list of functions from this `Stream` and its parents into one big closure that always returns the transformed record. @@ -11184,6 +11184,18 @@ The iterable should output dicts with the following data/naming structure: ## quixstreams.sources.community.file.file + + +### FileFetcher + +```python +class FileFetcher() +``` + +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L22) + +Serves individual files while downloading another in the background. + ### FileSource @@ -11192,7 +11204,7 @@ The iterable should output dicts with the following data/naming structure: class FileSource(Source) ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L19) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L70) Ingest a set of files from a desired origin into Kafka by iterating through the provided folder and processing all nested files within it. @@ -11262,10 +11274,10 @@ def __init__(directory: Union[str, Path], compression: Optional[CompressionName] = None, replay_speed: float = 1.0, name: Optional[str] = None, - shutdown_timeout: float = 10) + shutdown_timeout: float = 30) ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L79) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L130) **Arguments**: @@ -11292,7 +11304,7 @@ to gracefully shutdown def default_topic() -> Topic ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L152) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L204) Uses the file structure to generate the desired partition count for the diff --git a/docs/api-reference/sources.md b/docs/api-reference/sources.md index 7f76c5d9f..148cd30a1 100644 --- a/docs/api-reference/sources.md +++ b/docs/api-reference/sources.md @@ -822,6 +822,18 @@ For other parameters See `quixstreams.sources.kafka.KafkaReplicatorSource` ## quixstreams.sources.community.file.file + + +### FileFetcher + +```python +class FileFetcher() +``` + +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L22) + +Serves individual files while downloading another in the background. + ### FileSource @@ -830,7 +842,7 @@ For other parameters See `quixstreams.sources.kafka.KafkaReplicatorSource` class FileSource(Source) ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L19) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L70) Ingest a set of files from a desired origin into Kafka by iterating through the provided folder and processing all nested files within it. @@ -902,10 +914,10 @@ def __init__(directory: Union[str, Path], compression: Optional[CompressionName] = None, replay_speed: float = 1.0, name: Optional[str] = None, - shutdown_timeout: float = 10) + shutdown_timeout: float = 30) ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L79) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L130)
@@ -936,7 +948,7 @@ to gracefully shutdown def default_topic() -> Topic ``` -[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L152) +[[VIEW SOURCE]](https://github.com/quixio/quix-streams/blob/main/quixstreams/sources/community/file/file.py#L204) Uses the file structure to generate the desired partition count for the