Browse Source

add NAB dataset

Former-commit-id: 0db3367376 [formerly eaae1889ac] [formerly 7bc91cb700 [formerly dafd927231]] [formerly c5dd8fd0e9 [formerly a91a1562c3] [formerly db97273a42 [formerly f63568349f]]] [formerly 55e71b6698 [formerly 65aa49367c] [formerly 6b73a2f59e [formerly 5f29959f25]] [formerly 65c646b334 [formerly d24a604dd1] [formerly 84fdf5b654 [formerly e9dba9005d]]]] [formerly c746c1012f [formerly 5e82b8268f] [formerly 5976e7aff9 [formerly d2b5614e7b]] [formerly a81496588a [formerly d9d4c6ddbf] [formerly 0828a0086c [formerly 91270be431]]] [formerly 1df60ec98b [formerly 59e9243bc5] [formerly f0c6636a0f [formerly b6114c95be]] [formerly 219cd77ccd [formerly 72e00ed5d7] [formerly 1994baceaf [formerly 498cdf71bf]]]]] [formerly f17419f091 [formerly 2904ab86ac] [formerly 8aae1bed9b [formerly a93b237f5b]] [formerly 41d0fc0d23 [formerly 611f0de9ff] [formerly 5606008f0d [formerly f268a174d5]]] [formerly 96592825d0 [formerly 2fc9338ae3] [formerly fb34b63743 [formerly d691b3f182]] [formerly b4d533928f [formerly 402f2a94d7] [formerly 3a76e095e5 [formerly c5166f8816]]]] [formerly 7e1251edf6 [formerly cb03a9a3f0] [formerly 8d62be6e08 [formerly 868118adb2]] [formerly 7df726ee99 [formerly 4a08b5bb8b] [formerly 3b2109c8a3 [formerly 32a0c35fcf]]] [formerly f502641f2e [formerly ba700a94c5] [formerly d421d682ae [formerly e9314c61a3]] [formerly d1bfb9f2c7 [formerly 2331157922] [formerly 23d8a07079 [formerly 4aeffca422]]]]]]
Former-commit-id: e905f2d10d [formerly 142b6ae58d] [formerly 33ec2ad3fe [formerly 2552960fc1]] [formerly 22a0bb40e9 [formerly 9776f26e72] [formerly 38c2cdc832 [formerly 50b66f8fdf]]] [formerly 842854a31a [formerly ca096a9360] [formerly aa34005d2a [formerly 9dcac2a86e]] [formerly 71dc464bd0 [formerly 38dd92c83e] [formerly 14adc68236 [formerly f3c67ca4bc]]]] [formerly c745eb7894 [formerly ab3ccbcf51] [formerly 8f453e065e [formerly d971c991a6]] [formerly 5e54cf6b56 [formerly c3faa9f4d4] [formerly 657d6e7173 [formerly 0581451b49]]] [formerly 42ff7b7766 [formerly f717f79cb9] [formerly 51d14fa0fe [formerly 3c7b130ba0]] [formerly af4cbc3b12 [formerly b954b5da24] [formerly 23d8a07079]]]]
Former-commit-id: 101df5f3d2 [formerly 8733bbdd40] [formerly b77e6fc4a1 [formerly d3d416aafe]] [formerly 1549ec183f [formerly 2988678215] [formerly 834d3b67e6 [formerly 0f7a2cc5f8]]] [formerly 43c85cb173 [formerly febbeb4c5e] [formerly c11f086b61 [formerly abd8363fa9]] [formerly ef875f7d6a [formerly a0a4a2c5b4] [formerly 014d56184c [formerly 8259af562c]]]]
Former-commit-id: f2c7752f1e [formerly 062b17453c] [formerly ef91b9f2c1 [formerly 923748d6af]] [formerly 0deb3fd193 [formerly fd3340c709] [formerly b6c750b3ef [formerly 1f5f12e8b3]]]
Former-commit-id: 8839829d9a [formerly b502165fae] [formerly 3df9ef108f [formerly e9ddcc6575]]
Former-commit-id: c965df4a37 [formerly aa04bbcc9e]
Former-commit-id: 2a723377ea
master
lhenry15 4 years ago
parent
commit
0f88581004
61 changed files with 155921 additions and 148656 deletions
  1. +1
    -1
      datasets/NAB/add_label.py
  2. +4033
    -4033
      datasets/NAB/artificialNoAnomaly/labeled_art_daily_no_noise.csv
  3. +4033
    -4033
      datasets/NAB/artificialNoAnomaly/labeled_art_daily_perfect_square_wave.csv
  4. +4033
    -4033
      datasets/NAB/artificialNoAnomaly/labeled_art_daily_small_noise.csv
  5. +4033
    -4033
      datasets/NAB/artificialNoAnomaly/labeled_art_flatline.csv
  6. +4033
    -4033
      datasets/NAB/artificialNoAnomaly/labeled_art_noisy.csv
  7. +4033
    -4033
      datasets/NAB/artificialWithAnomaly/labeled_art_daily_flatmiddle.csv
  8. +4033
    -4033
      datasets/NAB/artificialWithAnomaly/labeled_art_daily_jumpsdown.csv
  9. +4033
    -4033
      datasets/NAB/artificialWithAnomaly/labeled_art_daily_jumpsup.csv
  10. +4033
    -4033
      datasets/NAB/artificialWithAnomaly/labeled_art_daily_nojump.csv
  11. +4033
    -4033
      datasets/NAB/artificialWithAnomaly/labeled_art_increase_spike_density.csv
  12. +4033
    -4033
      datasets/NAB/artificialWithAnomaly/labeled_art_load_balancer_spikes.csv
  13. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_24ae8d.csv
  14. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_53ea38.csv
  15. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_5f5533.csv
  16. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_77c1ca.csv
  17. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_825cc2.csv
  18. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_ac20cd.csv
  19. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_c6585a.csv
  20. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_fe7f93.csv
  21. +4731
    -4731
      datasets/NAB/realAWSCloudwatch/labeled_ec2_disk_write_bytes_1ef3de.csv
  22. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_disk_write_bytes_c0d644.csv
  23. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_ec2_network_in_257a54.csv
  24. +4731
    -4731
      datasets/NAB/realAWSCloudwatch/labeled_ec2_network_in_5abac7.csv
  25. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_elb_request_count_8c0756.csv
  26. +4622
    -4622
      datasets/NAB/realAWSCloudwatch/labeled_grok_asg_anomaly.csv
  27. +1244
    -1244
      datasets/NAB/realAWSCloudwatch/labeled_iio_us-east-1_i-a2eb1cd9_NetworkIn.csv
  28. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_rds_cpu_utilization_cc0c53.csv
  29. +4033
    -4033
      datasets/NAB/realAWSCloudwatch/labeled_rds_cpu_utilization_e47b3b.csv
  30. +1625
    -1625
      datasets/NAB/realAdExchange/labeled_exchange-2_cpc_results.csv
  31. +1625
    -1625
      datasets/NAB/realAdExchange/labeled_exchange-2_cpm_results.csv
  32. +1539
    -1539
      datasets/NAB/realAdExchange/labeled_exchange-3_cpc_results.csv
  33. +1539
    -1539
      datasets/NAB/realAdExchange/labeled_exchange-3_cpm_results.csv
  34. +1644
    -1644
      datasets/NAB/realAdExchange/labeled_exchange-4_cpc_results.csv
  35. +1644
    -1644
      datasets/NAB/realAdExchange/labeled_exchange-4_cpm_results.csv
  36. +7268
    -0
      datasets/NAB/realKnownCause/labeled_ambient_temperature_system_failure.csv
  37. +0
    -1
      datasets/NAB/realKnownCause/labeled_ambient_temperature_system_failure.csv.REMOVED.git-id
  38. +1
    -1
      datasets/NAB/realKnownCause/labeled_cpu_utilization_asg_misconfiguration.csv.REMOVED.git-id
  39. +4033
    -4033
      datasets/NAB/realKnownCause/labeled_ec2_request_latency_system_failure.csv
  40. +1
    -1
      datasets/NAB/realKnownCause/labeled_machine_temperature_system_failure.csv.REMOVED.git-id
  41. +1
    -1
      datasets/NAB/realKnownCause/labeled_nyc_taxi.csv.REMOVED.git-id
  42. +1883
    -1883
      datasets/NAB/realKnownCause/labeled_rogue_agent_key_hold.csv
  43. +5316
    -5316
      datasets/NAB/realKnownCause/labeled_rogue_agent_key_updown.csv
  44. +2501
    -2501
      datasets/NAB/realTraffic/labeled_TravelTime_387.csv
  45. +2163
    -2163
      datasets/NAB/realTraffic/labeled_TravelTime_451.csv
  46. +2381
    -2381
      datasets/NAB/realTraffic/labeled_occupancy_6005.csv
  47. +2501
    -2501
      datasets/NAB/realTraffic/labeled_occupancy_t4013.csv
  48. +2501
    -2501
      datasets/NAB/realTraffic/labeled_speed_6005.csv
  49. +1128
    -1128
      datasets/NAB/realTraffic/labeled_speed_7578.csv
  50. +2496
    -2496
      datasets/NAB/realTraffic/labeled_speed_t4013.csv
  51. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_AAPL.csv.REMOVED.git-id
  52. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_AMZN.csv.REMOVED.git-id
  53. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_CRM.csv.REMOVED.git-id
  54. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_CVS.csv.REMOVED.git-id
  55. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_FB.csv.REMOVED.git-id
  56. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_GOOG.csv.REMOVED.git-id
  57. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_IBM.csv.REMOVED.git-id
  58. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_KO.csv.REMOVED.git-id
  59. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_PFE.csv.REMOVED.git-id
  60. +1
    -1
      datasets/NAB/realTweets/labeled_Twitter_volume_UPS.csv.REMOVED.git-id
  61. +0
    -2
      examples/run_automl.py

+ 1
- 1
datasets/NAB/add_label.py View File

@@ -16,5 +16,5 @@ for key in label_info.keys():
else:
label.append('0')
df['label'] = label
-df.to_csv(fpath+"/labeled_"+fname)
+df.to_csv(fpath+"/labeled_"+fname, index=False)


+ 4033
- 4033
datasets/NAB/artificialNoAnomaly/labeled_art_daily_no_noise.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialNoAnomaly/labeled_art_daily_perfect_square_wave.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialNoAnomaly/labeled_art_daily_small_noise.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialNoAnomaly/labeled_art_flatline.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialNoAnomaly/labeled_art_noisy.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialWithAnomaly/labeled_art_daily_flatmiddle.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialWithAnomaly/labeled_art_daily_jumpsdown.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialWithAnomaly/labeled_art_daily_jumpsup.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialWithAnomaly/labeled_art_daily_nojump.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialWithAnomaly/labeled_art_increase_spike_density.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/artificialWithAnomaly/labeled_art_load_balancer_spikes.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_24ae8d.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_53ea38.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_5f5533.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_77c1ca.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_825cc2.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_ac20cd.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_c6585a.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_cpu_utilization_fe7f93.csv
File diff suppressed because it is too large
View File


+ 4731
- 4731
datasets/NAB/realAWSCloudwatch/labeled_ec2_disk_write_bytes_1ef3de.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_disk_write_bytes_c0d644.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_ec2_network_in_257a54.csv
File diff suppressed because it is too large
View File


+ 4731
- 4731
datasets/NAB/realAWSCloudwatch/labeled_ec2_network_in_5abac7.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_elb_request_count_8c0756.csv
File diff suppressed because it is too large
View File


+ 4622
- 4622
datasets/NAB/realAWSCloudwatch/labeled_grok_asg_anomaly.csv
File diff suppressed because it is too large
View File


+ 1244
- 1244
datasets/NAB/realAWSCloudwatch/labeled_iio_us-east-1_i-a2eb1cd9_NetworkIn.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_rds_cpu_utilization_cc0c53.csv
File diff suppressed because it is too large
View File


+ 4033
- 4033
datasets/NAB/realAWSCloudwatch/labeled_rds_cpu_utilization_e47b3b.csv
File diff suppressed because it is too large
View File


+ 1625
- 1625
datasets/NAB/realAdExchange/labeled_exchange-2_cpc_results.csv
File diff suppressed because it is too large
View File


+ 1625
- 1625
datasets/NAB/realAdExchange/labeled_exchange-2_cpm_results.csv
File diff suppressed because it is too large
View File


+ 1539
- 1539
datasets/NAB/realAdExchange/labeled_exchange-3_cpc_results.csv
File diff suppressed because it is too large
View File


+ 1539
- 1539
datasets/NAB/realAdExchange/labeled_exchange-3_cpm_results.csv
File diff suppressed because it is too large
View File


+ 1644
- 1644
datasets/NAB/realAdExchange/labeled_exchange-4_cpc_results.csv
File diff suppressed because it is too large
View File


+ 1644
- 1644
datasets/NAB/realAdExchange/labeled_exchange-4_cpm_results.csv
File diff suppressed because it is too large
View File


+ 7268
- 0
datasets/NAB/realKnownCause/labeled_ambient_temperature_system_failure.csv
File diff suppressed because it is too large
View File


+ 0
- 1
datasets/NAB/realKnownCause/labeled_ambient_temperature_system_failure.csv.REMOVED.git-id View File

@@ -1 +0,0 @@
49b3ed29808987b19c9a17d47838d7fd21a64290

+ 1
- 1
datasets/NAB/realKnownCause/labeled_cpu_utilization_asg_misconfiguration.csv.REMOVED.git-id View File

@@ -1 +1 @@
35256ed33e1a2c8b0c4abfbf924bb6f009c932a3
6b0bc2aa98d9bd1769aded1842269293ecdbf46c

+ 4033
- 4033
datasets/NAB/realKnownCause/labeled_ec2_request_latency_system_failure.csv
File diff suppressed because it is too large
View File


+ 1
- 1
datasets/NAB/realKnownCause/labeled_machine_temperature_system_failure.csv.REMOVED.git-id View File

@@ -1 +1 @@
26eb88e5a373bbda063203bf28b818eaba168f29
4e6e62763fb4d8a5c8ca35981b7af97c9ce88fbc

+ 1
- 1
datasets/NAB/realKnownCause/labeled_nyc_taxi.csv.REMOVED.git-id View File

@@ -1 +1 @@
eeb114c5c4471f4089ac206800eaa2330119dc04
8d535c4e4624c3e769c603db381cde74ffd1541b

+ 1883
- 1883
datasets/NAB/realKnownCause/labeled_rogue_agent_key_hold.csv
File diff suppressed because it is too large
View File


+ 5316
- 5316
datasets/NAB/realKnownCause/labeled_rogue_agent_key_updown.csv
File diff suppressed because it is too large
View File


+ 2501
- 2501
datasets/NAB/realTraffic/labeled_TravelTime_387.csv
File diff suppressed because it is too large
View File


+ 2163
- 2163
datasets/NAB/realTraffic/labeled_TravelTime_451.csv
File diff suppressed because it is too large
View File


+ 2381
- 2381
datasets/NAB/realTraffic/labeled_occupancy_6005.csv
File diff suppressed because it is too large
View File


+ 2501
- 2501
datasets/NAB/realTraffic/labeled_occupancy_t4013.csv
File diff suppressed because it is too large
View File


+ 2501
- 2501
datasets/NAB/realTraffic/labeled_speed_6005.csv
File diff suppressed because it is too large
View File


+ 1128
- 1128
datasets/NAB/realTraffic/labeled_speed_7578.csv
File diff suppressed because it is too large
View File


+ 2496
- 2496
datasets/NAB/realTraffic/labeled_speed_t4013.csv
File diff suppressed because it is too large
View File


+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_AAPL.csv.REMOVED.git-id View File

@@ -1 +1 @@
2d91a1145560d6f2ba78653857e4c365b849af48
0edff7c15786fd853fe6ad350c614242f5b2871b

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_AMZN.csv.REMOVED.git-id View File

@@ -1 +1 @@
6bd82e25bc77b7c2d239e35fe3292418b7f7f2f6
8cb8dcfaa5c9c855e7c6d4f059838e20284d6dbc

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_CRM.csv.REMOVED.git-id View File

@@ -1 +1 @@
10197fd0d3ae336cc3af7b73c2b8172925878a81
f813962b33568d076285707a60cbfec7b0daa864

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_CVS.csv.REMOVED.git-id View File

@@ -1 +1 @@
a2bbcaeffe42bb34694e005021c137a501f42fa4
5a221a242b60a8ff302a6bf174ab05b7661a1dfd

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_FB.csv.REMOVED.git-id View File

@@ -1 +1 @@
207e1632a8e355fb2622f090d19aa0bbc8b46f3d
da6e1f36aeba57d81340b3e468a64eca017561f0

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_GOOG.csv.REMOVED.git-id View File

@@ -1 +1 @@
b1ceb02a500f874bb83fff57c0343800b5f8d598
a2b7ee363323c1583a38fc604425281d0a32e90a

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_IBM.csv.REMOVED.git-id View File

@@ -1 +1 @@
ba0a753fc1e7b9031debc24bbe2ba4f8659a9992
4c504cb93885a3d759c308d39833af0cb72586b8

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_KO.csv.REMOVED.git-id View File

@@ -1 +1 @@
1641472acea894a40c5ec95ad7cc329719d6cfc7
3e208a1d5a72f93d3105599578918e51f07a31f1

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_PFE.csv.REMOVED.git-id View File

@@ -1 +1 @@
46cf6c9d1c2b44f537641a6401824da570ad8986
3147689c7a7ae3b0b05a5ee2de699f754e8973e9

+ 1
- 1
datasets/NAB/realTweets/labeled_Twitter_volume_UPS.csv.REMOVED.git-id View File

@@ -1 +1 @@
e0ea87c58b01bd07d9763dc49288a9ce17e20a0a
3e4904fb5fa4e4c0b86fc67f1700b94786f376f5

+ 0
- 2
examples/run_automl.py View File

@@ -18,8 +18,6 @@ metric = 'F1_MACRO' # F1 on both label 0 and 1

# Read data and generate dataset and problem
df = pd.read_csv(table_path)
-print(df[4])
-exit()
dataset, problem_description = generate_dataset_problem(df, target_index=target_index, metric=metric)

# Start backend


Loading…
Cancel
Save