from dataclasses import dataclass, field
from datetime import datetime


@dataclass
class TCalcDatasetConfig:
    """Default settings bundle for the TCalc dataset.

    Every field has a default, so ``TCalcDatasetConfig()`` yields a fully
    populated configuration. Mutable defaults (lists and dicts) are built
    through ``default_factory``, so each instance owns its own copies and
    mutating one instance never leaks into another.
    """

    # Reference date for the dataset.
    # NOTE(review): presumably the lower bound / origin for time features --
    # confirm against the code that consumes this config.
    start_date: datetime = datetime(year=2023, month=1, day=1)

    # strftime/strptime patterns for date-only and full timestamp values.
    date_format: str = "%Y-%m-%d"
    datetime_format: str = "%Y-%m-%d %H:%M:%S"

    # Column names listed as inputs.
    # NOTE(review): presumably the raw columns read from the source data.
    input_columns: list[str] = field(
        default_factory=lambda: [
            "created_at",
            "pick_at",
            "from_lat",
            "from_lon",
            "to_lat",
            "to_lon",
            "weight",
            "volume",
        ]
    )

    # One entry per feature, each carrying a "name", a "bias" and a "std".
    # NOTE(review): looks like per-feature normalization parameters (shift and
    # scale) -- confirm. Several names ("distance", "time_passed",
    # "car_type_id", "urgency") do not appear in ``input_columns``, so they
    # are presumably derived or supplied elsewhere.
    preprocessing: list[dict] = field(
        default_factory=lambda: [
            {"name": "from_lat", "bias": 40, "std": 4},
            {"name": "from_lon", "bias": 40, "std": 4},
            {"name": "to_lat", "bias": 40, "std": 4},
            {"name": "to_lon", "bias": 40, "std": 4},
            {"name": "distance", "bias": 700, "std": 950},
            {"name": "weight", "bias": 12000, "std": 8000},
            {"name": "volume", "bias": 55, "std": 31},
            {"name": "time_passed", "bias": 6, "std": 3},
            {"name": "car_type_id", "bias": 1, "std": 1},
            {"name": "urgency", "bias": 0, "std": 1},
        ]
    )

    # Maps a distribution name to a three-element vector with a single 1.
    distributions: dict[str, list[int]] = field(
        default_factory=lambda: {
            "dot": [1, 0, 0],
            "trades": [0, 1, 0],
            "tariff": [0, 0, 1],
        }
    )

    # Name of the distribution in use; the default is a key of
    # ``distributions``.
    # NOTE(review): presumably used to index ``distributions`` -- confirm.
    use_distr: str = "dot"

    # Two-element numeric pairs keyed by "lat" and "lon".
    # NOTE(review): presumably [min, max] bounds for valid coordinates --
    # confirm ordering and inclusivity with the consumer.
    coordinates_thr: dict[str, list[float]] = field(
        default_factory=lambda: {
            "lat": [39.6, 72.89],
            "lon": [19.32, 158.34],
        }
    )