@inproceedings{3d997120f78f4546a8fdc6740937d263,
title = "Drugs Clustering Based on Their Compositions Using Word2Vec and K-means Clustering",
abstract = "With the rapid growth in medicine, it is essential to determine a method of cluster drug composition data to make it easy for industries to define medicine composition. K-means clustering is one way to cluster the composition of drugs. In this paper, we use the Word2Vec model and convert the composition of the drug into a vector. We cluster it using K-means, also visualize the data results of the clustering. In Word2Vec, we use two methods, namely CBOW and SG. Meanwhile, in K-means, we determine the number of centroids using the Elbow Criterion and Silhouette Coefficient method. Datasets consist of more than 250 product names of drug from Farmaku and K24. The experiment results show that the Silhouette Coefficient value using the CBOW and SG methods are 0.901 and 0.877. Both CBOW and SG method generating the best value of the number of clusters is three.",
keywords = "cbow, drugs clustering, elbow criterion, k-means clustering, silhouette coefficient, skip-gram, word2vec",
author = "Rahmat Hidayat and Rakhmawati, {Nur Aini}",
note = "Publisher Copyright: {\textcopyright} 2022 American Institute of Physics Inc.. All rights reserved.; 2nd International Conference on Information Technology, Advanced Mechanical and Electrical Engineering, ICITAMEE 2021 ; Conference date: 25-08-2021 Through 26-08-2021",
year = "2022",
month = nov,
day = "30",
doi = "10.1063/5.0104981",
language = "English",
series = "AIP Conference Proceedings",
publisher = "American Institute of Physics Inc.",
editor = "Yessi Jusman and Fajrin, {Hanifah Rahmi}",
booktitle = "2021 2nd International Conference on Information Technology, Advanced Mechanical and Electrical Engineering, ICITAMEE 2021",
}