# Worker configuration: identity, storage root, and concurrency limit.
worker_id = "worker-prod-01"
base_path = "/data/ml-experiments"
max_workers = 4

# Redis connection
redis_addr = "localhost:6379"
# NOTE(review): credential is stored in plaintext in this file. If the
# consumer supports it, prefer injecting it from the environment or a
# secret store, and keep this file out of version control.
redis_password = "JZVd2Y6IDaLNaYLBOFgQ7ae4Ox5t37NTIyPMQlLJD4k="
redis_db = 0

# SSH connection (for remote operations)
host = "localhost"
user = "ml-user"
port = 22
# TOML performs no `~` expansion; the consuming application must expand
# this path itself. TODO confirm it does.
ssh_key = "~/.ssh/id_rsa"

# Podman configuration
podman_image = "ml-training:latest"
gpu_access = true
container_workspace = "/workspace"
container_results = "/results"
train_script = "train.py"

# Dataset management
auto_fetch_data = true
data_dir = "/data/datasets"
data_manager_path = "/usr/local/bin/data_manager"
# Duration values in this file are strings ("24h", "30s", "100ms", ...);
# TOML has no native duration type, so the consumer parses them.
# NOTE(review): the format looks like Go-style durations - confirm.
dataset_cache_ttl = "24h"

# Task management
task_lease_duration = "1h"
heartbeat_interval = "30s"
graceful_timeout = "5m"
poll_interval = "100ms"
metrics_flush_interval = "10s"

# Metrics exporter
[metrics]
enabled = true
# No host part is given; presumably this binds on all interfaces at
# port 9090 - verify against the consumer.
listen_addr = ":9090"