% Journal article: Journal of Digital Information Management, vol. 8, no. 6 (2010).
% No DOI is recorded for this entry, so the doi field is omitted rather than left
% empty (empty fields trigger validator warnings); the paper's PDF link is in url.
% The abstract text had split "fi" ligatures from PDF extraction; they are repaired.
@article{337,
  author   = {Sallay, Hassen},
  title    = {On {Arabic} Texts Compression and Searching},
  journal  = {Journal of Digital Information Management},
  year     = {2010},
  volume   = {8},
  number   = {6},
  url      = {http://www.dline.info/fpaper/jdim/v8i6/2.pdf},
  abstract = {With the dramatic increasing of electronic Arabic content, the text compression techniques will play a major role in several domains and applications such as search engines, data archiving, searching and retrieval from huge databases. Mainly the combination of compression and indexing techniques allows the interesting possibility to work directly on the compressed textual files or databases, which results saving time and resources. The existing compression techniques and tools are generic and do not consider the specific characteristics of the Arabic language such as its derivative nature. Mainly compression techniques should be based on the morphology characteristics of the Arabic language, its grammatical characteristics, the texts subject, and their statistical characteristics. The paper surveys the state of the art of the Arabic texts compression techniques and tools and identifies some research tracks that should be explored in future. It presents also some dedicated Arabic text compression algorithms which save more physical space and speed up the data retrieval text files by searching in their compressed form.},
}