stroo/main.py

22 lines
494 B
Python

#data loading
import numpy as np
f=np.load("useragents.npz")
from stroo import train_model
#understands pure strings
#definitely not the best possible model
#so if this is at least >0.55 (on more complicated data) we should be able to do something with it
#also migth be included into an isolation forest
model=train_model(f["train"],n=3)
#calculate auc. Has disparity between normal, abnormal: np.mean(testy)~=0.065
print(model.eval(f["testx"],f["testy"]))
#in my tests reaches >0.99