Skip to content

Commit

Permalink
Added option to download SMD dataset. Processing not done yet.
Browse files (browse the repository at this point in the history)
  • Loading branch information
Jad-yehya committed May 16, 2024
1 parent 3d4022c commit 208e4e5
Showing 1 changed file with 8 additions and 1 deletion.
9 changes: 8 additions & 1 deletion exploratory/data_preprocess.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -153,6 +153,9 @@ def get_data(dataset_name):
args = sys.argv[1:]
if args[0] == "download":
commands = [
"git clone https://github.com/NetManAIOps/OmniAnomaly.git",
"mv OmniAnomaly/ServerMachineDataset .",
"rm -rf OmniAnomaly",
"wget https://s3-us-west-2.amazonaws.com/telemanom/data.zip",
"unzip data.zip",
"rm data.zip",
Expand All @@ -162,7 +165,11 @@ def get_data(dataset_name):
for command in commands:
subprocess.run(command, shell=True)

# Adds the option to process all datasets at once
commands = sys.argv[1:]
if "ALL" in commands:
commands = datasets

load = []
if len(commands) > 0:
for d in commands:
Expand All @@ -173,6 +180,6 @@ def get_data(dataset_name):
print(
"""
Usage: python data_preprocess.py <datasets>
where <datasets> should be one of ['SMD', 'SMAP', 'MSL']
where <datasets> should be one of ['SMD', 'SMAP', 'MSL', 'ALL']
"""
)

0 comments on commit 208e4e5

Please sign in to comment.