22 lines
494 B
Python
22 lines
494 B
Python
|
|
|
|
#data loading
|
|
import numpy as np
|
|
f=np.load("useragents.npz")
|
|
|
|
|
|
from stroo import train_model
|
|
|
|
#understands pure strings
|
|
#definitely not the best possible model
|
|
#so if this is at least >0.55 (on more complicated data) we should be able to do something with it
|
|
#also migth be included into an isolation forest
|
|
model=train_model(f["train"],n=3)
|
|
|
|
#calculate auc. Has disparity between normal, abnormal: np.mean(testy)~=0.065
|
|
print(model.eval(f["testx"],f["testy"]))
|
|
#in my tests reaches >0.99
|
|
|
|
|
|
|