forked from ClustProject/KUDataOutlier
-
Notifications
You must be signed in to change notification settings - Fork 1
/
kde.py
43 lines (30 loc) · 1.44 KB
/
kde.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
import os
import argparse
from utils import *
from sklearn.neighbors import KernelDensity
# Kernel Density Estimation
def kde(X_train, X_test):
# KDE 기반 분포 추정
kde_model = KernelDensity(kernel='gaussian', bandwidth=0.2)
kde_model.fit(X_train.values)
kde_test = - 1.0 * kde_model.score_samples(X_test.values)
kde_test = pd.DataFrame(kde_test, index=X_test.index, columns=['score'])
return kde_test
def main(train_data_path, test_data_path, save_root_path):
os.makedirs(save_root_path, exist_ok=True)
X_train = pd.read_csv(train_data_path, index_col=0)
X_train.index = pd.to_datetime(X_train.index)
X_test = pd.read_csv(test_data_path, index_col=0)
X_test.index = pd.to_datetime(X_test.index)
test_scores = kde(X_train, X_test)
test_scores.to_csv(os.path.join(save_root_path, 'anomaly_score.csv'))
draw_plot(test_scores, save_path=os.path.join(save_root_path, 'anomaly_score_plot.jpg'))
if __name__ == '__main__':
parser = argparse.ArgumentParser()
parser.add_argument('--train-data-path', type=str, default='./data/nasa_bearing_train.csv')
parser.add_argument('--test-data-path', type=str, default='./data/nasa_bearing_test.csv')
parser.add_argument('--save-root-path', type=str, default='./result/kde')
args, _ = parser.parse_known_args()
main(train_data_path=args.train_data_path,
test_data_path=args.test_data_path,
save_root_path=args.save_root_path)