% Journal article entry (key 3029), Journal of Information Technology Review 11(3), 2020.
% NOTE(review): "El Bazzi" is treated as a compound surname -- confirm with the paper.
% NOTE(review): the page range is taken from the DOI suffix (83-93) -- confirm against the PDF.
% The abstract is kept exactly as recorded in the original entry.
@article{3029,
  author   = {El Bazzi, Mohamed Salim and Ennaji, Abdelatif and Mammass, Driss},
  title    = {Automatic Indexation of Large Text and Datasets},
  journal  = {Journal of Information Technology Review},
  year     = {2020},
  volume   = {11},
  number   = {3},
  pages    = {83--93},
  doi      = {10.6025/jitr/2020/11/3/83-93},
  url      = {http://www.dline.info/jitr/fulltext/v11n3/jitrv11n3_1.pdf},
  abstract = {When the text corpus is huge, it is somewhat difficult to effectively manage the collection with good indexing. When the text has complex datasets, the classification and indexing is a challenging issue. We in this exercise, has proposed an efficiently automatic indexing system for large datasets. We have also tested its effectiveness in large collection of real texts. To make evaluation, we have applied KNN and SVM classifiers. The proposed solution easily outperforms the traditional indexing pattern based on TFIDF system. Even the evaluation was carried out in the environment of Arabic language, it is applied to any language.},
}