From 5862660b1a34e23fd4e3697ec6e8fcdc55422ea2 Mon Sep 17 00:00:00 2001 From: lhenry15 Date: Tue, 15 Sep 2020 01:47:53 -0500 Subject: [PATCH] add run_pipeline example Former-commit-id: 288393715aef1167ae66eda9bc620ed467a1aa77 [formerly fd66dd92f82fc5c9be80fce431a27ecd13d03e5e] [formerly f969a91e290587101ce5da11654a23e00ff61f40 [formerly 328bc7f4293f49c1aa8f1acccba4e867f4bc2731]] [formerly 055971c1ba48739b4e92fa18cdcded05ca6ad18e [formerly 2dc54dce68d56f9c196242ec902086824b4f4c01] [formerly 614269ccfe01d90267cd0d625b9fe21c70ad6eb7 [formerly f37d0044dda5ef041f87be83b59a3c82e6378e7c]]] [formerly c524aa15ac71cac6b2d4bd8fa493afaf1b5d9fd8 [formerly 0c85249c00bea271fa0b5da005eabdb645aaccdd] [formerly c883bf8cf18d1cc08b92747c2d459a5f9c99e4e6 [formerly 045a32725aa2430c12a92c0215718184bdcb0ba7]] [formerly fca41f37d2fdef81dd234a64e325b5e84f53c2a7 [formerly fbe1445b3f98c67dbe916b6c650d7d7b2b8172a3] [formerly ee00fd612b78683d7a9d17d2a163a58d6fd48ccd [formerly 8cb4e5a42378b70c383d24d4ed870b192bc8a4c8]]]] [formerly 827b81298b1eae286c643327d3b0f4aae2e0d78c [formerly fea21bff95e634a5de9b0e2901589228202efec0] [formerly 46870a25ff273d3e0aa005d003c8dd512dc4b060 [formerly 5f0a227ae9589fdc80848f32f18787141587c392]] [formerly 51f667d8e7a7043a6d7992b80ff1008da36b27df [formerly c93cb06e2051e4cae7a8a553d297b81e47dbf1e6] [formerly 86c1b5c69b44b5e5d290e9d6edf4f94a4145bb89 [formerly 1dd4ebf49ed9abe23537025d747a511032dca5a4]]] [formerly f6e35b7fcd5f22963f31f4312c2e02ba53216c29 [formerly 037dd8a3379b9e88a27f7f8f4cb583c64fe8474e] [formerly 69ce24d9a98a5b5a909eb49ee76662a9c82a0ce5 [formerly 1fcf5b8fd4bcc47184e866bd0dd585782e61c32e]] [formerly 35e9100330448e626be7d0f2dc9865e0239fb47d [formerly 28cb84ba65d5e80787c72cad7741dec19055c842] [formerly 901542acd1935cf686a8e0def9bae33103d20690 [formerly a9e8a39377deb4a218aadfc8343b6f28d651cf16]]]]] [formerly 8ece4325ab17c330b4a1d323cfc9c3620e7019fd [formerly ba66105df3c103e2dc4d16f1c5ead76f06878a96] [formerly 86d52f8e52e0cedf8c3903dd11d2ec74231d6706 [formerly 540386c495fb2e63e559dda9ef2e673bdc4b9df7]] [formerly 8ea7d87d774701bdd6f6cddc5b30d25f1011aeb6 [formerly 5399029369ad53cd998f3ec4707cba3e9744a977] [formerly f862e7add97e26d12a5e0c4dd3c2f8e15a974aff [formerly e946cfd883b354fae31fe9fd1c9d711b45b3e0f5]]] [formerly 986ef588e1fa349ec40978317fdc5d72778e9697 [formerly 98f1111c6db092e1e9a50c7c84459fdfd857b500] [formerly ed53a50f20c674a4724d8fefbe0f1f21519371e9 [formerly a0c848e95e57d8f9d32969fa59a4d61cb8fe20c4]] [formerly 6da3707228a56074edea7cb30b8e5182f33fb4f5 [formerly 8dcd999b94f4aed64e22a51dcc73c92609753ecd] [formerly dfb80dd48bef777b866d55cba0493319b58268de [formerly d93676b1051b8ee7e6b107eb707ad064247c936d]]]] [formerly b3a8e4729f4fda4a57f91cd3b988ec36fc934ed2 [formerly 7a16fe05434cd5915d078e36d081c164ccb32259] [formerly 0fd9ccb9125af86bbad35384d9e2f9bd0543d8a2 [formerly 90cf76ed5f5b99b4f9a5f3ca1a42e04a0f1421fd]] [formerly 98ccdd8f1818a60f5e02782fa403cc79b3244bc8 [formerly 9d09d642ee44836d5a25aa3d9ef4cb95ec2806f7] [formerly 4091dda241442a999f92f882f1ce7d51d8b4cf72 [formerly 507f2b27c407d48290f67ff39359dfbb00ee077a]]] [formerly f628b52f38541978a4b0f17e6f7bfd189718e825 [formerly a85c59dc5d789e2f6bcd63e81f340862ad85bde3] [formerly f55864ca0c97976a46de7c707e6ebf344fa5d8f2 [formerly 816768d4b63c1fc45e6dd40ef77d41b5d4889ff0]] [formerly 4b611c8ca97ab592395bf9922654baf4c13b65c5 [formerly 63aefd8cee6e71db2799d76b350128eb770bfbc6] [formerly 1e48dbf314fc3673f6d6051cf6bbbf91a23fd884 [formerly 1c4b9c0a1cd540bb25a58f0890984acc0f8e51d1]]]]]] Former-commit-id: 4214ab428b90b77b7e966fe9afdfc453aa6ad954 [formerly ec8c656b5c4e3b63c60a6bd3878bb5dee8b83796] [formerly d05bf6ca413e44c736624a1bc6d33d363cc9650f [formerly c12b38a108b4fbc234fee2f29905b153a36d3928]] [formerly 426ffc8ab1d21df35ba62d88c871a6ddce69b7e5 [formerly 8dfab4a38bf9a3c66d0dbaededa051c345f0a79f] [formerly d3a97e3fa19726f1c70d72d69b75d8765e8d46e9 [formerly f2e7e2cb51f41b04ec5c736ba151fc312829b56c]]] [formerly 060461b7be48b6626c095cea7f096706844d4928 [formerly 5a001ba0f4c314f07b22e821c114270d86cf1d9e] [formerly 385181b3c7ba999d2565d583f808719ed3e9d3af [formerly 90e9cdf946538202f8914112a4fcc9f55d500406]] [formerly 2572c6d9b8c2dab7eb327a4eec1a430593b8269e [formerly 3eb5ace3e38ee383dfdaee09584a23f7636e6f0c] [formerly 0d0bfb4fcb470a39d37a9de97f5d1baaf968eb61 [formerly 42eb4bd14417f9cdc0a37771f467b67ae9742f24]]]] [formerly d872261dccb4cc84be3bbd3a69966b3de9629918 [formerly 2c92cf236be49e5889e8d2a3c35ba425c88895df] [formerly 9f47a08afac3c203d19656f593d5f98cdd426c7e [formerly e123cd95e11747a01ccc223e2c5bb31406f2ab9b]] [formerly 8fcc9c9dd1d09f05d2d7fe465b940babb2a75a82 [formerly c6e0419dbcd17e7060fe61a14240008058fb1b78] [formerly 95c5650729aa26b0de955036d127b912dac07516 [formerly 1d3dc1a7e486f43626c9cd267de3a55d9c128332]]] [formerly 0210e142de053c7c8f83bba173eedab5c428003d [formerly c33cb25185f26ca0820b89979c9a1296385b18a7] [formerly 6f1280668eb1c0ade3f18a8c91917f78ae08d4f7 [formerly 2686c34dcd75c89d9db522e56ea9c37b72c32780]] [formerly 28401889eb471a58d5093a390450ce1df3e6d717 [formerly 2f7569552aede53ebb5db3aee4e4288fdc3b8c1a] [formerly 1e48dbf314fc3673f6d6051cf6bbbf91a23fd884]]]] Former-commit-id: 149e5f1a0b86c11b07beb0c1ae17db18843018b5 [formerly 9fd497b6aebebad61df908d791d3d8140df9f9a9] [formerly 13e0388bfe630ce876a39c4fc6f04f48169c7428 [formerly 21155c585794e447700b17887658e65f42739c77]] [formerly 194f3976cdd2640b4c534c200fdf95d014d83109 [formerly dd7d329721ebb15f18dd5176528c7548412d5bb3] [formerly 741a66597f7eb8d48f2a5cb7f224fc08b1c3a06b [formerly f4244702e8ca53ffe94ef47e41a881eb86f3ee62]]] [formerly 57ad7550ad238fdef0b0139889471d4dab1b91e6 [formerly dc2076235d273ad860024132ed92f4ad4c79e122] [formerly 2cd5644f994de8536f2759af3b40fc6ffbdd2acd [formerly 900eaa1a535ce83d9737453d037bb12b6853f649]] [formerly 6608ad174bbfde51429c52d930330495ea3345ea [formerly dfbf60f2b5dbdfb44fa05fc611f2f46c32f22556] [formerly edbfe1bff6aa96d321cbc4d44cd988c8d5cc519a [formerly 734463e4b73029051c3a7ada84efed712c7a6a81]]]] Former-commit-id: 7fefbdfa7b145b49d45e386bc257398cef4464c7 [formerly 0f7c45a1be76e4207f011a2d1d79d51bdcd17766] [formerly c3b6bdf21e07310d425de93d815a0aa62803cca3 [formerly b818b775d2302cb4c5a6a9d24b87e4ef3415669f]] [formerly 4d04227c136c19d8ae474565d3bfbe4f0468f691 [formerly 4439eefeaafa3761c43384a2a7a88e4b3ce37217] [formerly d919921c2ca562211679c0da33de6d120f6584fd [formerly c7f35290534b6a1b9c634ed587c2746532adb505]]] Former-commit-id: ae31ceb1a095c62e7b73fc668b17ebdceec576d3 [formerly aed7c1c48863787237ef7383a28a6f2bb82a8940] [formerly 0a0eb413b8de772fbb44b1dac7c4e774d0d53cee [formerly d87ee60333cc84668984cf9d5344ec2815c57c78]] Former-commit-id: 36dee1f46ed5e0a15006144bd23a20859c019bf9 [formerly 2db524c9087be99f6e3cd2cce6c29e1bb7db85e7] Former-commit-id: 46ed14eae239dcf1e66e69e91468bdee1ac3d03d --- examples/run_certain_pipeline.py | 30 ---------------------------- examples/run_pipeline.py | 42 ++++++++++++++++++++++++++++++++++++++++ 2 files changed, 42 insertions(+), 30 deletions(-) delete mode 100644 examples/run_certain_pipeline.py create mode 100644 examples/run_pipeline.py diff --git a/examples/run_certain_pipeline.py b/examples/run_certain_pipeline.py deleted file mode 100644 index 4f02ea5..0000000 --- a/examples/run_certain_pipeline.py +++ /dev/null @@ -1,30 +0,0 @@ - -import os - -results_dir = './' -pipeline_run_yml_dir = './' - -pipeline_yml_name = './pipeline.yml' # './pipeline_yml/pipeline_10.yml' -pipline_yml_index = pipeline_yml_name[11:-4] - -python_command = 'python3 -m d3m runtime fit-produce -p ' + pipeline_yml_name \ - + ' -r ./datasets/anomaly/yahoo_sub_5/TRAIN/problem_TRAIN/problemDoc.json' \ - + ' -i ./datasets/anomaly/yahoo_sub_5/TRAIN/dataset_TRAIN/datasetDoc.json' \ - + ' -t ./datasets/anomaly/yahoo_sub_5/TEST/dataset_TEST/datasetDoc.json -o ' \ - + results_dir + 'result.csv' \ - + ' -O ' \ - + pipeline_run_yml_dir + 'pipeline_run' + '.yml' - -print(python_command) -os.system(python_command) -# 'python3 -m d3m runtime fit-produce -p pipeline.yml -# -r ../datasets/anomaly/kpi/TRAIN/problem_TRAIN/problemDoc.json -# -i ../datasets/anomaly/kpi/TRAIN/dataset_TRAIN/datasetDoc.json -# -t ../datasets/anomaly/kpi/TEST/dataset_TEST/datasetDoc.json -# -o results.csv -O pipeline_run.yml' - -# python3 -m d3m runtime fit-produce -p pipeline.yml -# -r ../datasets/anomaly/yahoo_sub_5/TRAIN/problem_TRAIN/problemDoc.json -# -i ../datasets/anomaly/yahoo_sub_5/TRAIN/dataset_TRAIN/datasetDoc.json -# -t ../datasets/anomaly/yahoo_sub_5/TEST/dataset_TEST/datasetDoc.json -# -o result.csv -O pipeline_run.yml \ No newline at end of file diff --git a/examples/run_pipeline.py b/examples/run_pipeline.py new file mode 100644 index 0000000..ae9d8ec --- /dev/null +++ b/examples/run_pipeline.py @@ -0,0 +1,42 @@ +import pandas as pd +import sys +import argparse + +from searcher import schemas as schemas_utils +from searcher.utils import generate_dataset_problem, evaluate_pipeline +from axolotl.utils import pipeline as pipeline_utils +import os + +this_path = os.path.dirname(os.path.abspath(__file__)) +#table_path = 'datasets/NAB/realTweets/labeled_Twitter_volume_IBM.csv' # The path of the dataset + +parser = argparse.ArgumentParser(description='Arguments for running predefined pipelin.') +parser.add_argument('--table_path', type=str, default=os.path.join(this_path, '../datasets/yahoo_sub_5.csv'), + help='Input the path of the input data table') +parser.add_argument('--target_index', type=int, default=6, + help='Index of the ground truth (for evaluation)') +parser.add_argument('--metric',type=str, default='F1_MACRO', + help='Evaluation Metric (F1, F1_MACRO)') +parser.add_argument('--pipeline_path', default=os.path.join(this_path, '../tods/searcher/resources/default_pipeline.json'), + help='Input the path of the pre-built pipeline description') + +args = parser.parse_args() + +table_path = args.table_path +target_index = args.target_index # what column is the target +pipeline_path = args.pipeline_path +metric = args.metric # F1 on both label 0 and 1 + +time_limit = 30 # How many seconds you wanna search + +# Read data and generate dataset and problem +df = pd.read_csv(table_path) +dataset, problem_description = generate_dataset_problem(df, target_index=target_index, metric=metric) + +# Load the default pipeline +pipeline = pipeline_utils.load_pipeline(pipeline_path) + +# Run the pipeline +pipeline_result = evaluate_pipeline(problem_description, dataset, pipeline) +print(pipeline_result) +