#data loading import numpy as np f=np.load("useragents.npz") from stroo import train_model #understands pure strings #definitely not the best possible model #so if this is at least >0.55 (on more complicated data) we should be able to do something with it #also migth be included into an isolation forest model=train_model(f["train"],n=3) #calculate auc. Has disparity between normal, abnormal: np.mean(testy)~=0.065 print(model.eval(f["testx"],f["testy"])) #in my tests reaches >0.99