You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

DeepLog_test.py 1.7 kB

4 years ago
1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253
  1. import numpy as np
  2. from tods.tods_skinterface.primitiveSKI.detection_algorithm.DeepLog_skinterface import DeepLogSKI
  3. from sklearn.metrics import precision_recall_curve
  4. from sklearn.metrics import accuracy_score
  5. from sklearn.metrics import confusion_matrix
  6. from sklearn.metrics import classification_report
  7. import matplotlib.pyplot as plt
  8. from sklearn import metrics
  9. #prepare the data
  10. data = np.loadtxt("./500_UCR_Anomaly_robotDOG1_10000_19280_19360.txt")
  11. X_train = np.expand_dims(data[:10000], axis=1)
  12. X_test = np.expand_dims(data[10000:], axis=1)
  13. transformer = DeepLogSKI()
  14. transformer.fit(X_train)
  15. prediction_labels_train = transformer.predict(X_train)
  16. prediction_labels = transformer.predict(X_test)
  17. prediction_score = transformer.predict_score(X_test)
  18. print("Primitive: ", transformer.primitive)
  19. print("Prediction Labels\n", prediction_labels)
  20. print("Prediction Score\n", prediction_score)
  21. # y_true = prediction_labels_train[:1000]
  22. # y_pred = prediction_labels[:1000]
  23. y_true = prediction_labels_train
  24. y_pred = prediction_labels
  25. print('Accuracy Score: ', accuracy_score(y_true, y_pred))
  26. confusion_matrix(y_true, y_pred)
  27. print(classification_report(y_true, y_pred))
  28. precision, recall, thresholds = precision_recall_curve(y_true, y_pred)
  29. f1_scores = 2*recall*precision/(recall+precision)
  30. print('Best threshold: ', thresholds[np.argmax(f1_scores)])
  31. print('Best F1-Score: ', np.max(f1_scores))
  32. fpr, tpr, threshold = metrics.roc_curve(y_true, y_pred)
  33. roc_auc = metrics.auc(fpr, tpr)
  34. plt.title('ROC')
  35. plt.plot(fpr, tpr, 'b', label = 'AUC = %0.2f' % roc_auc)
  36. plt.legend(loc = 'lower right')
  37. plt.ylabel('True Positive Rate')
  38. plt.xlabel('False Positive Rate')
  39. plt.show()

TODS是全栈的自动化机器学习系统,主要针对多变量时间序列数据的异常检测。TODS提供了详尽的用于构建基于机器学习的异常检测系统的模块,它们包括:数据处理(data processing),时间序列处理(time series processing),特征分析(feature analysis),检测算法(detection algorithms),和强化模块(reinforcement module)。这些模块所提供的功能包括常见的数据预处理、时间序列数据的平滑或变换,从时域或频域中抽取特征、多种多样的检测算