# SPDX-License-Identifier: Apache-2.0
#
# Dataset configuration for the traffic CSV. The mapping under `config` is
# handed to the callable named by `_target_`.
_target_: data.datasets.create_datasets
config:
  source_path: /workspace/datasets/traffic/traffic.csv
  dest_path: /workspace/datasets/traffic/

  # Split boundaries, each a two-element list.
  # NOTE(review): presumably [start, end] positions on the time axis; confirm
  # units and end-inclusivity against the loader.
  train_range:
    - 0
    - 3624
  # Starts 168 steps before train_range ends (3624 - 3456 = 168, the same
  # value as encoder_length) -- presumably so the first validation example
  # has a full encoder window; confirm.
  valid_range:
    - 3456
    - 3984
  # Starts 168 steps before valid_range ends (3984 - 3816 = 168).
  test_range:
    - 3816
    - 4200

  dataset_stride: 1
  scale_per_id: False

  # Window sizes. example_length - encoder_length = 192 - 168 = 24, which
  # presumably is the forecast horizon -- confirm with the model config.
  encoder_length: 168
  input_length: 168
  example_length: 192
  MultiID: False

  # Column descriptions. Entries with a `scaler` name the class to
  # instantiate through its own `_target_`.
  features:
    - name: 'id'
      feature_type: 'ID'
      feature_embed_type: 'CATEGORICAL'
      # Same value as time_series_count below.
      cardinality: 964
    - name: 'hours_from_start'
      feature_type: 'TIME'
      feature_embed_type: 'CONTINUOUS'
    - name: 'values'
      feature_type: 'TARGET'
      feature_embed_type: 'CONTINUOUS'
      scaler:
        _target_: sklearn.preprocessing.StandardScaler
    - name: 'time_on_day'
      feature_type: 'KNOWN'
      feature_embed_type: 'CONTINUOUS'
      scaler:
        _target_: sklearn.preprocessing.StandardScaler
    - name: 'day_of_week'
      feature_type: 'KNOWN'
      feature_embed_type: 'CATEGORICAL'
      # NOTE(review): 8 rather than 7 -- presumably reserves one extra
      # index; confirm against the preprocessing code.
      cardinality: 8
    # NOTE(review): 'hours_from_start' is listed a second time here as a
    # KNOWN input (it is also the TIME feature above); this looks
    # intentional but should be confirmed.
    - name: 'hours_from_start'
      feature_type: 'KNOWN'
      feature_embed_type: 'CONTINUOUS'
      scaler:
        _target_: sklearn.preprocessing.StandardScaler
    - name: 'categorical_id'
      feature_type: 'STATIC'
      feature_embed_type: 'CATEGORICAL'
      cardinality: 964

  train_samples: 450000
  valid_samples: 50000
  binarized: True
  time_series_count: 964