% Conference paper from IoTaIS 2020 (the note field gives the conference
% dates as 27-28 January 2021).
% The citation key is a machine-generated identifier and is kept unchanged
% so that existing citations keep resolving.
% The abstract is kept verbatim as exported.
% Proper nouns in the title are brace-protected so that sentence-casing
% styles do not lowercase them.
% The full proceedings title lives in booktitle; it was previously stored
% in a series field while booktitle held only a shortened prefix.
% NOTE(review): address holds a country rather than a publisher city;
% confirm the intended value before relying on it in printed output.
@inproceedings{cb0385ea177b49b8b88ecacefbf98468,
title = "Adapting {Google Translate} using Dictionary and Word Embedding for {Arabic}-{Indonesian} Cross-lingual Information Retrieval",
abstract = "The translation has an essential role in Cross-lingual Information Retrieval. Translation using a dictionary is reliable even though it has a limited vocabulary. Translation using google translate, in some cases, using different words used in document target words. The translation process causes word translation to be less accurate to get relevant documents. In this paper, we proposed a new translation approach by adapting google translate using a dictionary and word embedding in Arabic-Indonesian Cross-lingual Information Retrieval. The dictionary is the primary resource used for translation improved by Levenshtein distance and FastText for finding the correct word translation. Google translate is used to complete translation when the word does not exist in the dictionary resource. The proposed method archive a BLEU score of 0.47. This score is higher than the other comparison resource score. The proposed method successfully improves the translated query to retrieve more relevant documents in cross-lingual information retrieval based on this implementation.",
keywords = "Cross-lingual information retrieval, Dictionary, FastText, Google Translate, Levenshtein distance",
author = "Maryamah, Maryamah and Arifin, Agus Zainal and Sarno, Riyanarto and Hasan, Ahmad Makki",
note = "Publisher Copyright: {\textcopyright} 2021 IEEE.; 2020 IEEE International Conference on Internet of Things and Intelligence Systems, IoTaIS 2020 ; Conference date: 27-01-2021 Through 28-01-2021",
year = "2021",
month = jan,
day = "27",
doi = "10.1109/IoTaIS50849.2021.9359708",
language = "English",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "205--209",
booktitle = "{IoTaIS} 2020 - Proceedings: 2020 {IEEE} International Conference on Internet of Things and Intelligence Systems",
address = "United States",
}