@inproceedings{fd339338579643d9aeb5c407bd26dc8a,
title = "Binary classification for teacher donor's project",
abstract = "Classification always plays an important role in statistical machine learning, which contains both binary classification problems and multi-label classification problems. This article focuses on binary classification models including natural language processing for text objects to help teachers to improve their chances of being funded based on real data sets collected by DonorsChoose.org. Comparing about two natural language processing methods for projects proposals proposed by teachers, we also implement various statistical algorithms on our data sets, aiming to enhance the classification accuracy which can be measured by model accuracy and the area under the curve(AUC). In conclusion, the text objects are important for computer to conduct supervised learning and the length of the proposal and the price column are the crucial features. In addition, the best model will be the LightBGM with AUC 0.77 and accuracy 86\%.",
keywords = "binary classification, natural language processing, statistical machine learning models, Python",
author = "Yunwei Zhang and Zibin Zhang",
year = "2018",
doi = "10.2991/iceess-18.2018.40",
language = "English",
isbn = "9789462525948",
series = "Advances in Social Science Education and Humanities Research",
publisher = "Atlantis Press",
pages = "157--160",
editor = "Jerry Liu and Huijuan Xue and Xiaonan Xiao",
booktitle = "Proceedings of the 2018 International Conference on Education, Economics and Social Science (ICEESS 2018)",
address = "Netherlands",
note = "International Conference on Education, Economics and Social Science (ICEESS) ; Conference date: 30-10-2018 Through 31-10-2018",
}