diff --git a/README.rst b/README.rst index 563a082cb..4191b844b 100644 --- a/README.rst +++ b/README.rst @@ -166,32 +166,32 @@ The different algorithms are presented in the sphinx-gallery_. References: ----------- -.. [1] : I. Tomek, “Two modifications of CNN,” In Systems, Man, and Cybernetics, IEEE Transactions on, vol. 6, pp 769-772, 2010. +.. [1] : I. Tomek, “Two modifications of CNN,” IEEE Transactions on Systems, Man, and Cybernetics, vol. 6, pp. 769-772, 1976. [`bib `_] -.. [2] : I. Mani, I. Zhang. “kNN approach to unbalanced data distributions: a case study involving information extraction,” In Proceedings of workshop on learning from imbalanced datasets, 2003. +.. [2] : I. Mani, J. Zhang. “kNN approach to unbalanced data distributions: A case study involving information extraction,” In Proceedings of the Workshop on Learning from Imbalanced Data Sets, pp. 1-7, 2003. [`pdf `_] [`bib `_] -.. [3] : P. Hart, “The condensed nearest neighbor rule,” In Information Theory, IEEE Transactions on, vol. 14(3), pp. 515-516, 1968. +.. [3] : P. E. Hart, “The condensed nearest neighbor rule,” IEEE Transactions on Information Theory, vol. 14(3), pp. 515-516, 1968. [`pdf `_] [`bib `_] -.. [4] : M. Kubat, S. Matwin, “Addressing the curse of imbalanced training sets: one-sided selection,” In ICML, vol. 97, pp. 179-186, 1997. +.. [4] : M. Kubat, S. Matwin, “Addressing the curse of imbalanced training sets: One-sided selection,” In Proceedings of the 14th International Conference on Machine Learning, vol. 97, pp. 179-186, 1997. [`pdf `_] [`bib `_] -.. [5] : J. Laurikkala, “Improving identification of difficult small classes by balancing class distribution,” Springer Berlin Heidelberg, 2001. +.. [5] : J. Laurikkala, “Improving identification of difficult small classes by balancing class distribution,” Proceedings of the 8th Conference on Artificial Intelligence in Medicine in Europe, pp. 63-66, 2001. [`pdf `_] [`bib `_] -.. [6] : D. 
Wilson, “Asymptotic Properties of Nearest Neighbor Rules Using Edited Data,” In IEEE Transactions on Systems, Man, and Cybernetrics, vol. 2 (3), pp. 408-421, 1972. +.. [6] : D. L. Wilson, “Asymptotic properties of nearest neighbor rules using edited data,” IEEE Transactions on Systems, Man, and Cybernetics, vol. 2(3), pp. 408-421, 1972. [`pdf `_] [`bib `_] -.. [7] : D. Smith, Michael R., Tony Martinez, and Christophe Giraud-Carrier. “An instance level analysis of data complexity.” Machine learning 95.2 (2014): 225-256. +.. [7] : M. R. Smith, T. Martinez, C. Giraud-Carrier, “An instance level analysis of data complexity,” Machine Learning, vol. 95(2), pp. 225-256, 2014. [`pdf `_] [`bib `_] -.. [8] : N. V. Chawla, K. W. Bowyer, L. O.Hall, W. P. Kegelmeyer, “SMOTE: synthetic minority over-sampling technique,” Journal of artificial intelligence research, 321-357, 2002. +.. [8] : N. V. Chawla, K. W. Bowyer, L. O. Hall, W. P. Kegelmeyer, “SMOTE: Synthetic minority over-sampling technique,” Journal of Artificial Intelligence Research, vol. 16, pp. 321-357, 2002. [`pdf `_] [`bib `_] -.. [9] : H. Han, W. Wen-Yuan, M. Bing-Huan, “Borderline-SMOTE: a new over-sampling method in imbalanced data sets learning,” Advances in intelligent computing, 878-887, 2005. +.. [9] : H. Han, W.-Y. Wang, B.-H. Mao, “Borderline-SMOTE: A new over-sampling method in imbalanced data sets learning,” In Proceedings of the 1st International Conference on Intelligent Computing, pp. 878-887, 2005. [`pdf `_] [`bib `_] -.. [10] : H. M. Nguyen, E. W. Cooper, K. Kamei, “Borderline over-sampling for imbalanced data classification,” International Journal of Knowledge Engineering and Soft Data Paradigms, 3(1), pp.4-21, 2001. +.. [10] : H. M. Nguyen, E. W. Cooper, K. Kamei, “Borderline over-sampling for imbalanced data classification,” In Proceedings of the 5th International Workshop on Computational Intelligence and Applications, pp. 24-29, 2009. [`pdf `_] [`bib `_] -.. [11] : G. Batista, R. C. Prati, M. C. 
Monard. “A study of the behavior of several methods for balancing machine learning training data,” ACM Sigkdd Explorations Newsletter 6 (1), 20-29, 2004. +.. [11] : G. E. A. P. A. Batista, R. C. Prati, M. C. Monard, “A study of the behavior of several methods for balancing machine learning training data,” ACM SIGKDD Explorations Newsletter, vol. 6(1), pp. 20-29, 2004. [`pdf `_] [`bib `_] -.. [12] : G. Batista, B. Bazzan, M. Monard, [“Balancing Training Data for Automated Annotation of Keywords: a Case Study,” In WOB, 10-18, 2003. +.. [12] : G. E. A. P. A. Batista, A. L. C. Bazzan, M. C. Monard, “Balancing training data for automated annotation of keywords: A case study,” In Proceedings of the 2nd Brazilian Workshop on Bioinformatics, pp. 10-18, 2003. [`pdf `_] [`bib `_] -.. [13] : X. Y. Liu, J. Wu and Z. H. Zhou, “Exploratory Undersampling for Class-Imbalance Learning,” in IEEE Transactions on Systems, Man, and Cybernetics, Part B (Cybernetics), vol. 39, no. 2, pp. 539-550, April 2009. +.. [13] : X.-Y. Liu, J. Wu, Z.-H. Zhou, “Exploratory undersampling for class-imbalance learning,” IEEE Transactions on Systems, Man, and Cybernetics, Part B (Cybernetics), vol. 39(2), pp. 539-550, 2009. [`pdf `_] [`bib `_] -.. [14] : I. Tomek, “An Experiment with the Edited Nearest-Neighbor Rule,” IEEE Transactions on Systems, Man, and Cybernetics, vol. 6(6), pp. 448-452, June 1976. +.. [14] : I. Tomek, “An experiment with the edited nearest-neighbor rule,” IEEE Transactions on Systems, Man, and Cybernetics, vol. 6(6), pp. 448-452, 1976. [`bib `_] -.. [15] : He, Haibo, Yang Bai, Edwardo A. Garcia, and Shutao Li. “ADASYN: Adaptive synthetic sampling approach for imbalanced learning,” In IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence), pp. 1322-1328, 2008. +.. [15] : H. He, Y. Bai, E. A. Garcia, S. 
Li, “ADASYN: Adaptive synthetic sampling approach for imbalanced learning,” In Proceedings of the 5th IEEE International Joint Conference on Neural Networks, pp. 1322-1328, 2008. [`pdf `_] [`bib `_] diff --git a/references.bib b/references.bib new file mode 100644 index 000000000..54c45019c --- /dev/null +++ b/references.bib @@ -0,0 +1,178 @@ +% BibTeX entries for the 15 works cited in the References section of README.rst, sorted by citation key. +@InProceedings{ batista2003, + title = {Balancing training data for automated annotation of + keywords: A case study}, + author = {Batista, Gustavo E. A. P. A. and Bazzan, Ana L. C. and + Monard, Maria Carolina}, + booktitle = {Proceedings of the 2nd Brazilian Workshop on + Bioinformatics}, + pages = {10--18}, + year = {2003}, + month = dec, + address = {Rio de Janeiro, Brazil} +} + +@Article{ batista2004, + title = {A study of the behavior of several methods for balancing + machine learning training data}, + author = {Batista, Gustavo E. A. P. A. and Prati, Ronaldo C. and + Monard, Maria Carolina}, + journal = {ACM SIGKDD Explorations Newsletter}, + volume = {6}, + number = {1}, + pages = {20--29}, + year = {2004}, + publisher = {ACM} +} + +@Article{ chawla2002, + title = {{SMOTE}: Synthetic minority over-sampling technique}, + author = {Chawla, Nitesh V. and Bowyer, Kevin W. and Hall, Lawrence + O. and Kegelmeyer, W. 
Philip}, + journal = {Journal of Artificial Intelligence Research}, + volume = {16}, + pages = {321--357}, + year = {2002} +} + +@InProceedings{ han2005, + title = {{Borderline-SMOTE}: A new over-sampling method in imbalanced + data sets learning}, + author = {Han, Hui and Wang, Wen-Yuan and Mao, Bing-Huan}, + journal = {Advances in intelligent computing}, + pages = {878--887}, + year = {2005}, + booktitle = {Proceedings of the 1st International Conference on + Intelligent Computing}, + month = aug, + address = {Hefei, China} +} + +@Article{ hart1968, + title = {The condensed nearest neighbor rule}, + author = {Hart, Peter E.}, + journal = {IEEE Transactions on Information Theory}, + volume = {14}, + number = {3}, + pages = {515--516}, + year = {1968}, + publisher = {IEEE} +} + +@InProceedings{ he2008, + title = {{ADASYN}: Adaptive synthetic sampling approach for + imbalanced learning}, + author = {He, Haibo and Bai, Yang and Garcia, Edwardo A. and Li, + Shutao}, + booktitle = {Proceedings of the 5th IEEE International Joint Conference + on Neural Networks}, + pages = {1322--1328}, + year = {2008}, + organization = {IEEE}, + month = jun, + address = {Hong Kong, China} +} + +@InProceedings{ kubat1997, + title = {Addressing the curse of imbalanced training sets: + One-sided selection}, + author = {Kubat, Miroslav and Matwin, Stan}, + booktitle = {Proceedings of the 14th International Conference on + Machine Learning}, + volume = {97}, + pages = {179--186}, + year = {1997}, + address = {Nashville, Tennessee, USA}, + month = jul +} + +@InProceedings{ laurikkala2001, + title = {Improving identification of difficult small classes by + balancing class distribution}, + author = {Laurikkala, Jorma}, + booktitle = {Proceedings of the 8th Conference on Artificial + Intelligence in Medicine in Europe}, + pages = {63--66}, + address = {Cascais, Portugal}, + month = jul, + year = {2001}, + publisher = {Springer} +} + +@Article{ liu2009, + title = {Exploratory undersampling 
for class-imbalance learning}, + author = {Liu, Xu-Ying and Wu, Jianxin and Zhou, Zhi-Hua}, + journal = {IEEE Transactions on Systems, Man, and Cybernetics, Part B (Cybernetics)}, + volume = {39}, + number = {2}, + pages = {539--550}, + year = {2009}, + publisher = {IEEE} +} + +@InProceedings{ mani2003, + title = {{kNN} approach to unbalanced data distributions: A case + study involving information extraction}, + author = {Mani, Inderjeet and Zhang, Jianping}, + booktitle = {Proceedings of the Workshop on Learning from Imbalanced + Data Sets}, + volume = {126}, + year = {2003}, + month = aug, + pages = {1--7}, + address = {Washington, DC, USA} +} + +@InProceedings{ nguyen2009, + title = {Borderline over-sampling for imbalanced data + classification}, + author = {Nguyen, Hien M. and Cooper, Eric W. and Kamei, Katsuari}, + booktitle = {Proceedings of the 5th International Workshop on + Computational Intelligence and Applications}, + pages = {24--29}, + year = {2009} +} + +@Article{ smith2014, + title = {An instance level analysis of data complexity}, + author = {Smith, Michael R. and Martinez, Tony and Giraud-Carrier, + Christophe}, + journal = {Machine Learning}, + volume = {95}, + number = {2}, + pages = {225--256}, + year = {2014}, + publisher = {Springer} +} + +@Article{ tomek1976a, + title = {Two modifications of {CNN}}, + author = {Tomek, Ivan}, + journal = {IEEE Transactions on 
Systems, Man, and Cybernetics}, + volume = {6}, + number = {11}, + pages = {769--772}, + year = {1976} +} + +@Article{ tomek1976b, + title = {An experiment with the edited nearest-neighbor rule}, + author = {Tomek, Ivan}, + journal = {IEEE Transactions on Systems, Man, and Cybernetics}, + volume = {6}, + number = {6}, + pages = {448--452}, + year = {1976} +} + +@Article{ wilson1972, + title = {Asymptotic properties of nearest neighbor rules using + edited data}, + author = {Wilson, Dennis L.}, + journal = {IEEE Transactions on Systems, Man, and Cybernetics}, + volume = {2}, + number = {3}, + pages = {408--421}, + year = {1972}, + publisher = {IEEE} +}