Brittany Kozura
04/06/2023, 6:29 PM
@asset
def transformed_data() -> pd.DataFrame:
    """Fetch a frame with ``get_data_from_s3`` and return it after ``do_some_stuff``.

    ``val_in_config`` is not defined in this snippet; it stands in for a
    value that is meant to be supplied through configuration.
    """
    raw = get_data_from_s3(partition_name=val_in_config)
    return do_some_stuff(raw)
# Job named "data_transform" that selects the `transformed_data` asset.
# The config mapping is passed empty here.
data_transform_job = define_asset_job(
    name="data_transform",
    selection="transformed_data",
    config={},
)
How would I complete this approach? (get_data_from_s3 will get all data if partition_name is None.)
sandy
04/07/2023, 6:51 PM
from dagster import Field
@asset(config_schema={"partition_name": Field(str, is_required=False)})
def transformed_data(context) -> pd.DataFrame:
    """Fetch data for an optionally configured partition and transform it.

    The ``partition_name`` config field is declared as not required, so it
    is looked up with ``.get`` rather than by direct indexing.
    """
    # NOTE(review): presumably yields None when "partition_name" is absent
    # from the run config — confirm against Dagster's op_config behavior.
    raw = get_data_from_s3(partition_name=context.op_config.get("partition_name"))
    return do_some_stuff(raw)