@inproceedings{d23c1df6f9da4ce198263e4a9fcad037,
title = "Fast Sentence Classification using Word Co-occurrence Graphs",
abstract = "We consider a supervised classification problem of categorizing e-commerce products based on just the words in the title. If done in real-time, the categorization can greatly benefit sellers by enabling them to offer immediate feedback. We present a deterministic algorithm by constructing weighted word co-occurrence graphs from the listing/item titles. We empirically evaluate this algorithm on two publicly available product listing datasets, Etsy and Amazon. Our method's accuracy is comparable to that of a supervised classifier constructed using the fastText library. The inference time of our model is up to 2.9× faster than the fastText classifier and has small training times. The training and inference of our model scales well for big datasets performing large-scale classification on millions of listings. We perform a detailed analysis and provide insights into our method and the product categorization task.",
author = "Ashirbad Mishra and Shad Kirmani and Kamesh Madduri",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 2024 IEEE International Conference on Big Data, BigData 2024 ; Conference date: 15-12-2024 Through 18-12-2024",
year = "2024",
doi = "10.1109/BigData62323.2024.10825869",
language = "English (US)",
series = "Proceedings - 2024 IEEE International Conference on Big Data, BigData 2024",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "620--629",
editor = "Wei Ding and Chang-Tien Lu and Fusheng Wang and Liping Di and Kesheng Wu and Jun Huan and Raghu Nambiar and Jundong Li and Filip Ilievski and Ricardo Baeza-Yates and Xiaohua Hu",
booktitle = "Proceedings - 2024 IEEE International Conference on Big Data, BigData 2024",
address = "United States",
}