You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

DeepLog_test.py 1.8 kB

4 years ago
4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354
  1. import numpy as np
  2. from tods.sk_interface.detection_algorithm.DeepLog_skinterface import DeepLogSKI
  3. #from tods.tods_skinterface.primitiveSKI.detection_algorithm.DeepLog_skinterface import DeepLogSKI
  4. from sklearn.metrics import precision_recall_curve
  5. from sklearn.metrics import accuracy_score
  6. from sklearn.metrics import confusion_matrix
  7. from sklearn.metrics import classification_report
  8. import matplotlib.pyplot as plt
  9. from sklearn import metrics
  10. #prepare the data
  11. data = np.loadtxt("./500_UCR_Anomaly_robotDOG1_10000_19280_19360.txt")
  12. X_train = np.expand_dims(data[:10000], axis=1)
  13. X_test = np.expand_dims(data[10000:], axis=1)
  14. transformer = DeepLogSKI()
  15. transformer.fit(X_train)
  16. prediction_labels_train = transformer.predict(X_train)
  17. prediction_labels = transformer.predict(X_test)
  18. prediction_score = transformer.predict_score(X_test)
  19. print("Primitive: ", transformer.primitive)
  20. print("Prediction Labels\n", prediction_labels)
  21. print("Prediction Score\n", prediction_score)
  22. # y_true = prediction_labels_train[:1000]
  23. # y_pred = prediction_labels[:1000]
  24. y_true = prediction_labels_train
  25. y_pred = prediction_labels
  26. print('Accuracy Score: ', accuracy_score(y_true, y_pred))
  27. confusion_matrix(y_true, y_pred)
  28. print(classification_report(y_true, y_pred))
  29. precision, recall, thresholds = precision_recall_curve(y_true, y_pred)
  30. f1_scores = 2*recall*precision/(recall+precision)
  31. print('Best threshold: ', thresholds[np.argmax(f1_scores)])
  32. print('Best F1-Score: ', np.max(f1_scores))
  33. fpr, tpr, threshold = metrics.roc_curve(y_true, y_pred)
  34. roc_auc = metrics.auc(fpr, tpr)
  35. plt.title('ROC')
  36. plt.plot(fpr, tpr, 'b', label = 'AUC = %0.2f' % roc_auc)
  37. plt.legend(loc = 'lower right')
  38. plt.ylabel('True Positive Rate')
  39. plt.xlabel('False Positive Rate')
  40. plt.show()

全栈的自动化机器学习系统，主要针对多变量时间序列数据的异常检测。TODS 提供了详尽的用于构建基于机器学习的异常检测系统的模块，它们包括：数据处理（data processing）、时间序列处理（time series processing）、特征分析（feature analysis）、检测算法（detection algorithms）和强化模块（reinforcement module）。这些模块所提供的功能包括常见的数据预处理、时间序列数据的平滑或变换、从时域或频域中抽取特征、多种多样的检测算