% pubman genre = article
% Journal article in "Language" 101(2), 2025. The comment lines are kept on
% their own lines, outside the entry, so that parsers treating "%" as a
% line comment do not swallow the entry itself.
@article{item_3656705,
  author    = {Fedden, Sebastian and Guzm{\'a}n Naranjo, Mat{\'\i}as and Corbett, Greville G.},
  title     = {Typology meets statistical modeling: The {German} gender system},
  journal   = {Language},
  volume    = {101},
  number    = {2},
  pages     = {251--290},
  year      = {2025},
  month     = jun,
  publisher = {Linguistic Society of America},
  address   = {Washington, DC},
  issn      = {0097-8507},
  doi       = {10.1353/lan.2025.a962898},
  language  = {english},
  abstract  = {The German gender system is known for its complexity, and there is a persistent misconception that it is largely arbitrary, and hence a challenge for the typology of gender systems. In response, we construct a database of more than 30,000 German nouns and show that a boosting tree model achieves a predictive success of 96\%. Even more surprising, the model performs at 87\% when trained on just the 100 most frequent nouns. We thus demonstrate that the complex German system fits into a typologically well-known scheme, being a combination of semantic and formal assignment principles. In addition to our success with the specific problem, we show the value of statistical modeling for typologists and reflect on what exactly we can learn from these techniques.},
  copyright = {{\copyright} 2025, Linguistic Society of America. All rights reserved.},
}