# SPDX-License-Identifier: Apache-2.0
#
# electricity.yaml -- dataset configuration for the electricity data set.
#
# `_target_` names the callable (data.datasets.create_datasets) and `config`
# holds the settings below; presumably consumed through a Hydra-style
# instantiate call -- confirm against the loader.
#
# NOTE(review): the nesting in this file was reconstructed from a flattened
# listing. In particular, train_samples / valid_samples / binarized /
# time_series_count are placed under `config`; confirm against the consumer.
---
_target_: data.datasets.create_datasets
config:
  graph: false
  source_path: /workspace/datasets/electricity/electricity.csv
  dest_path: /workspace/datasets/electricity/

  # Each range is a two-element list (presumably start/end time indices --
  # confirm inclusivity with the consumer).
  # valid_range starts 168 steps before train_range ends (31560 - 31392) and
  # test_range starts 168 steps before valid_range ends (32136 - 31968);
  # 168 equals encoder_length below, so the overlap presumably supplies
  # encoder history for the first validation/test examples -- confirm.
  train_range:
    - 0
    - 31560
  valid_range:
    - 31392
    - 32136
  test_range:
    - 31968
    - 35000

  dataset_stride: 1
  scale_per_id: true
  encoder_length: 168
  input_length: 168
  # 192 = 168 + 24, i.e. 24 steps beyond encoder_length (presumably the
  # forecast horizon -- confirm).
  example_length: 192
  MultiID: false

  # Feature list. A column name may appear more than once with a different
  # feature_type: 'hours_from_start' is listed as TIME and as KNOWN,
  # 'categorical_id' as ID and as STATIC.
  features:
    - name: 'categorical_id'
      feature_type: 'ID'
      feature_embed_type: 'CATEGORICAL'
      # NOTE(review): 371 here vs. time_series_count: 369 below -- confirm
      # the difference is intentional.
      cardinality: 371
    - name: 'hours_from_start'
      feature_type: 'TIME'
      feature_embed_type: 'CONTINUOUS'
    - name: 'power_usage_weight'
      feature_type: 'WEIGHT'
      feature_embed_type: 'CONTINUOUS'
    - name: 'power_usage'
      feature_type: 'TARGET'
      feature_embed_type: 'CONTINUOUS'
      scaler:
        _target_: sklearn.preprocessing.StandardScaler
    - name: 'hour'
      feature_type: 'KNOWN'
      feature_embed_type: 'CATEGORICAL'
      # NOTE(review): 25 is one more than the 24 hours of a day; presumably
      # leaves room for an extra index -- confirm.
      cardinality: 25
    - name: 'day_of_week'
      feature_type: 'KNOWN'
      feature_embed_type: 'CATEGORICAL'
      # NOTE(review): 8 is one more than the 7 days of a week -- confirm.
      cardinality: 8
    - name: 'hours_from_start'
      feature_type: 'KNOWN'
      feature_embed_type: 'CONTINUOUS'
      scaler:
        _target_: sklearn.preprocessing.StandardScaler
    - name: 'categorical_id'
      feature_type: 'STATIC'
      feature_embed_type: 'CATEGORICAL'
      cardinality: 371

  train_samples: 450000
  valid_samples: 50000
  binarized: true
  time_series_count: 369