% Otero et al. (2016), Information Sciences 373: predicting course pass rates
% from software metrics. The DOI is stored bare (no resolver prefix) and the
% page range uses the BibTeX en-dash form; the style supplies presentation.
@article{OTERO201642,
  author   = {Otero, Jos{\'e} and Junco, Luis and Su{\'a}rez, Rosario and Palacios, Ana and Couso, In{\'e}s and S{\'a}nchez, Luciano},
  title    = {Finding informative code metrics under uncertainty for predicting the pass rate of online courses},
  journal  = {Information Sciences},
  volume   = {373},
  pages    = {42--56},
  year     = {2016},
  issn     = {0020-0255},
  doi      = {10.1016/j.ins.2016.08.090},
  url      = {http://www.sciencedirect.com/science/article/pii/S0020025516306715},
  keywords = {Automatic grading, feature selection, Genetic Fuzzy Systems, Low Quality Data, vague data},
  abstract = {A method is proposed for predicting the pass rate of a Computer Science course. Input data comprises different software metrics that are evaluated on a set of programs, comprising students{\textquoteright} answers to a list of computing challenges proposed by the course instructor. Different kinds of uncertainty are accepted, including missing answers and multiple responses to the same challenge. The most informative metrics are selected according to an extension to vague data of the observed Fisher information. The proposed method was tested on experimental data collected during two years at Oviedo University. Yearly changes in the pass rate of two groups were accurately predicted on the basis of 7 software metrics. 73 volunteer students and 1500 source files were involved in the experimentation.},
}