@inproceedings{scholars11006, doi = {10.1109/BigData47090.2019.9006420}, year = {2019}, note = {cited By 3; Conference of 2019 IEEE International Conference on Big Data, Big Data 2019 ; Conference Date: 9 December 2019 Through 12 December 2019; Conference Code:157991}, pages = {5888--5896}, title = {An Apriori-based Data Analysis on Suspicious Network Event Recognition}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, journal = {Proceedings - 2019 IEEE International Conference on Big Data, Big Data 2019}, author = {Jian, Z. and Sakai, H. and Watada, J. and Roy, A. and Hassan, M. H. B.}, isbn = {9781728108582}, keywords = {Learning algorithms; Statistical tests, Apriori algorithms; Cross validation; Event recognition; Logical properties; Machine learning models; Missing values; Rule-based models; Training data sets, Big data}, url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85081355750&doi=10.1109\%2fBigData47090.2019.9006420&partnerID=40&md5=e5cf69fd42d66343581335cd3dfff099}, abstract = {Apriori-based rule generators, which are powered by the DIS-Apriori algorithm and the NIS-Apriori algorithm, are applied to analyze the data sets available in the IEEE BigData 2019 Cup: Suspicious Network Event Recognition. Then, each missing value in the test data set is decided by using the obtained rules. The advantage of our rule-based model is that the obtained rules are very easy to understand in comparison with other 'black-box' machine learning models. Furthermore, two algorithms preserve the logical property 'completeness,' so they generate rules without excess and deficiency. In evaluation, the AUC measure seems unfavorable to our model, so we employed 3-fold cross-validation for the training data set, and we obtained a 94 mean score. This result ensures the validity of our model. We report several meaningful results in this experiment, as well as the estimation of missing values. {\^A}{\copyright} 2019 IEEE.} }