@article{4616, author = {Chen Wang}, title = {Modeling Clustering Approaches to Recommender Systems in Language Datasets}, journal = {Journal of Data Processing}, year = {2025}, volume = {15}, number = {4}, doi = {https://doi.org/10.6025/jdp/2025/15/4/175-182}, url = {https://www.dline.info/jdp/fulltext/v15n4/jdpv15n4_3.pdf}, abstract = {This paper proposes a novel approach to improving personalized recommendations in English resource libraries. Addressing challenges such as information overload, lack of personalization, cold start problems, and algorithmic complexity, the study leverages the K-means clustering algorithman unsupervised machine learning technique to group users and resources based on similarity. By transforming multidimensional resource attributes (e.g., topic, proficiency level, target audience) into onedimensional data via dimensionality reduction, the system improves storage, search, and recommendation efficiency. The model integrates user English proficiency data, processes it via dynamic multimodal modeling and principal component analysis, and clusters users for tailored suggestions. Experimental results demonstrate that the K-means based system outperforms traditional collaborative filtering in recommendation accuracy, although recall rates vary with list size. User activity data reveal consistent personalized recommendation usage (~40% daily peak) and search spikes at 15:00 and 21:00, likely reflecting student and working user learning patterns. The study concludes that the proposed method effectively enhances resource management and user satisfaction, ofering a scalable and efficient solution for digital English libraries. Future work includes refining algorithms to improve accuracy and user experience further.}, }