The objective of this page is to provide a detailed description of the global variables used in Dataiku's workflow.
Versioning variables
These two variables define the version of the runs in Dataiku folders:
- the versioning_version_name is the name of the run version and must be updated for each new run
- the extract_month_date refers to the first forecast month in the extracted forecast data, and is updated automatically during a scenario step (https://dss.solvay.com/projects/SPOT_CS_PO_918/scenarios/2DATAPREPARATION/steps).
"versioning_version_name": "Q3.3_all_families_run", "extract_month_date": "2023-09-01",
GBU variables
These are the measures and identifiers specific to the GBU; they must be updated for each new GBU.
"GBU_measures": {
"historical_revenue": "historical_sales",
"historical_volume": "historical_volume",
"historical_price": "historical_unit_price"
},
"GBU_identifiers": {
"id_key": "cpc",
"product_key": "material_code",
"customer_key": "shipto_code",
"soldto_key": "soldto_code",
"soldto_group_key": "soldto_group",
"shipto_key": "shipto_code",
"family_key": "gbu_product_family",
"sales_key": "forecasted_sales",
"volumes_key": "forecasted_volume",
"prices_key": "computed_unit_price"
},
GBU families
The names of the product families integrated for the current GBU; this list must be updated each time a new product family is added.
"families_in_scope": [ "Sulfosuccinate_Sulfosuccinamate", "Specialty_Monomers", "Phosphate_Esters", "Guars" ],
Product composition data
"product_composition": {
"component_values": [
"COMPONENT",
"IMPURITY",
"SOLVENT",
"ADDITIVE",
"Z_CONST"
],
"product_identifier": "EHS_Product",
"component_type_identifier": "Component_Type",
"measure_identifier": "Average",
"unit_identifier": "Unit"
},
Pre-processing variables
"preprocessing_filters": {
"product_group": [
"SSPH"
],
"material_name": [
"AEROSOL OT-100 SURF 25KG FBD WHSKIN",
"AEROSOL OT-100 SURF 11KG W/LBL BOX"
],
"end_use": [
"Hpc-Api"
]
},
"imputers": {
"most_frequent": [
"manual_region_SS",
"manual_region_SM",
"product_group"
],
"constant": {
"n_competitors": 1,
"historical_unit_price_coalesce_ratio_on_12": 1,
"historical_sales_coalesce_ratio_on_12": 1,
"historical_unit_price_ratio_3_on_12_month": 1
},
"mean": [
"COMPONENT_ratio",
"IMPURITY_ratio",
"SOLVENT_ratio",
"n_components"
]
},
"categorical_encoder": "TargetMean",
"ordinal_encoder": "Ordinal",
"evolution_features_params": {
"evolution_columns": [
"historical_sales",
"historical_volume",
"historical_unit_price"
],
"numerator_list": [
1,
3,
6
],
"denominator_list": [
12
]
},