import kumoai as kumo
from kumoai.graph import Column
from kumoapi.typing import Stype, Dtype
# Fill in the URL of your Kumo deployment and your Kumo API key before running
# this script; both are left blank here.
API_URL = ""
API_KEY = ""
kumo.init(
    url=API_URL,
    api_key=API_KEY,
)
# Settings for the quickstart data source. Only "connector_root_dir" and
# "connector_id" are read when the connector is constructed just below.
quickstart_config = {
    "connector_root_dir": "s3://kumo-public-datasets/quickstart",
    "data_source_type": "S3",
    "connector_id": "quickstart",
}
quickstart_connector = kumo.S3Connector(
    root_dir=quickstart_config["connector_root_dir"],
    _connector_id=quickstart_config["connector_id"],
)
# Description of the "transactions" table: where it comes from, its column
# schema, and which columns act as primary key / time / end-time columns.
transactions_config = {
    "connector_id": "quickstart",
    "table_name": "transactions",
    "file_type": "PARQUET",
    "table_name_alias": "transactions1",
    # One Column per (name, stype, dtype) triple, in declaration order; no
    # column specifies an explicit timestamp format.
    "cols": [
        Column(
            name=col_name,
            stype=col_stype,
            dtype=col_dtype,
            timestamp_format=None,
        )
        for col_name, col_stype, col_dtype in (
            ("t_dat", Stype.timestamp, Dtype.date),
            ("customer_id", Stype.ID, Dtype.string),
            ("article_id", Stype.ID, Dtype.int64),
            ("price", Stype.numerical, Dtype.float64),
            ("sales_channel_id", Stype.ID, Dtype.int64),
        )
    ],
    "pkey": None,  # no primary key is set for this table
    "time_col": "t_dat",
    "end_time_col": None,
}
# Create the Kumo table for transactions: the source table is looked up on the
# quickstart connector by name, and the schema and key/time column settings
# are taken from transactions_config.
transactions = kumo.Table(
    source_table=quickstart_connector.table(transactions_config["table_name"]),
    columns=transactions_config["cols"],
    primary_key=transactions_config["pkey"],
    time_column=transactions_config["time_col"],
    end_time_column=transactions_config["end_time_col"],
)