{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T18:37:20Z","timestamp":1772908640588,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":30,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,5,30]],"date-time":"2024-05-30T00:00:00Z","timestamp":1717027200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,5,30]]},"DOI":"10.1145\/3650200.3656629","type":"proceedings-article","created":{"date-parts":[[2024,6,3]],"date-time":"2024-06-03T14:11:54Z","timestamp":1717423914000},"page":"286-297","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["An Efficient and Scalable Approach to Build Co-occurrence Matrix for DNN's Embedding Layer"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-8764-9081","authenticated-orcid":false,"given":"Quentin","family":"Petit","sequence":"first","affiliation":[{"name":"ED STIC, Universit\u00e9 Paris-Saclay, France and Paris Distributed and Parallel Technologies Lab, Huawei Technologies France, France and Maison de la Simulation, France"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4160-7170","authenticated-orcid":false,"given":"Chong","family":"Li","sequence":"additional","affiliation":[{"name":"Paris Distributed and Parallel Technologies Lab, Huawei Technologies France, France"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4228-0069","authenticated-orcid":false,"given":"Nahid","family":"Emad","sequence":"additional","affiliation":[{"name":"Universit\u00e9 Paris-Saclay, France and Maison de la Simulation, France"}]}],"member":"320","published-online":{"date-parts":[[2024,6,3]]},"reference":[{"key":"e_1_3_2_1_1_1","first-page":"993","article-title":"Latent dirichlet allocation","author":"Blei M","year":"2003","unstructured":"David\u00a0M Blei, Andrew\u00a0Y Ng, and Michael\u00a0I Jordan. 2003. Latent dirichlet allocation. Journal of machine Learning research 3, Jan (2003), 993\u20131022.","journal-title":"Journal of machine Learning research 3"},{"key":"e_1_3_2_1_2_1","volume-title":"Redmond WA","author":"Breese S","year":"1998","unstructured":"Jack\u00a0S Breese, David Heckerman, and Carl\u00a0M Kadie. 1998. Anonymous web data from www. microsoft. com. Microsoft Research, Redmond WA (1998), 98052\u20136399."},{"key":"e_1_3_2_1_3_1","volume-title":"Bulk synchronous parallel computing\u2014a paradigm for transportable software. Tools and Environments for Parallel and Distributed Systems","author":"Cheatham Thomas","year":"1996","unstructured":"Thomas Cheatham, Amr Fahmy, Dan Stefanescu, and Leslie Valiant. 1996. Bulk synchronous parallel computing\u2014a paradigm for transportable software. Tools and Environments for Parallel and Distributed Systems (1996), 61\u201376."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01212"},{"key":"e_1_3_2_1_5_1","volume-title":"Deep learning and practice with mindspore","author":"Chen Lei","unstructured":"Lei Chen. 2021. Deep learning and practice with mindspore. Springer Nature."},{"key":"e_1_3_2_1_6_1","volume-title":"An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929","author":"Dosovitskiy Alexey","year":"2020","unstructured":"Alexey Dosovitskiy, Lucas Beyer, Alexander Kolesnikov, Dirk Weissenborn, Xiaohua Zhai, Thomas Unterthiner, Mostafa Dehghani, Matthias Minderer, Georg Heigold, Sylvain Gelly, 2020. An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)."},{"key":"e_1_3_2_1_7_1","series-title":"SIAM journal on matrix analysis and applications 13, 1","volume-title":"Sparse matrices in MATLAB: Design and implementation","author":"Gilbert R","year":"1992","unstructured":"John\u00a0R Gilbert, Cleve Moler, and Robert Schreiber. 1992. Sparse matrices in MATLAB: Design and implementation. SIAM journal on matrix analysis and applications 13, 1 (1992), 333\u2013356."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939754"},{"key":"e_1_3_2_1_9_1","volume-title":"Entity embeddings of categorical variables. arXiv preprint arXiv:1604.06737","author":"Guo Cheng","year":"2016","unstructured":"Cheng Guo and Felix Berkhahn. 2016. Entity embeddings of categorical variables. arXiv preprint arXiv:1604.06737 (2016)."},{"key":"e_1_3_2_1_10_1","volume-title":"Word and phrase translation with word2vec. arXiv preprint arXiv:1705.03127","author":"Jansen Stefan","year":"2017","unstructured":"Stefan Jansen. 2017. Word and phrase translation with word2vec. arXiv preprint arXiv:1705.03127 (2017)."},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of NAACL-HLT. 4171\u20134186","author":"Ming-Wei\u00a0Chang Jacob Devlin","year":"2019","unstructured":"Jacob Devlin Ming-Wei\u00a0Chang Kenton and Lee\u00a0Kristina Toutanova. 2019. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In Proceedings of NAACL-HLT. 4171\u20134186."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.5555\/1165013.1165016"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-662-44851-9_17"},{"key":"e_1_3_2_1_14_1","volume-title":"An introduction to information retrieval","author":"Manning D","unstructured":"Christopher\u00a0D Manning. 2009. An introduction to information retrieval. Cambridge university press."},{"key":"e_1_3_2_1_15_1","first-page":"3","article-title":"Bibliographic coupling system based on references. Nauchno-Tekhnicheskaya Informatsiya Seriya","volume":"2","author":"Marshakova V","year":"1973","unstructured":"Irena\u00a0V Marshakova. 1973. Bibliographic coupling system based on references. Nauchno-Tekhnicheskaya Informatsiya Seriya, Ser 2, 6 (1973), 3\u20138.","journal-title":"Ser"},{"key":"e_1_3_2_1_16_1","volume-title":"Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781","author":"Mikolov Tomas","year":"2013","unstructured":"Tomas Mikolov, Kai Chen, Greg Corrado, and Jeffrey Dean. 2013. Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781 (2013)."},{"key":"e_1_3_2_1_17_1","volume-title":"Distributed representations of words and phrases and their compositionality. Advances in neural information processing systems 26","author":"Mikolov Tomas","year":"2013","unstructured":"Tomas Mikolov, Ilya Sutskever, Kai Chen, Greg\u00a0S Corrado, and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. Advances in neural information processing systems 26 (2013)."},{"key":"e_1_3_2_1_18_1","volume-title":"Branch prediction techniques and optimizations","author":"Parihar Raj","year":"2015","unstructured":"Raj Parihar. 2015. Branch prediction techniques and optimizations. University of Rochester, NY, USA (2015)."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623732"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1202"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1202"},{"key":"e_1_3_2_1_23_1","volume-title":"Distributed and Parallel Sparse Computing for Very Large Graph Neural Networks. In 2022 IEEE International Conference on Big Data (Big Data). IEEE, 6796\u20136798","author":"Petit R","year":"2022","unstructured":"Quentin\u00a0R Petit, Chong Li, and Nahid Emad. 2022. Distributed and Parallel Sparse Computing for Very Large Graph Neural Networks. In 2022 IEEE International Conference on Big Data (Big Data). IEEE, 6796\u20136798."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-55895-0_433"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1093\/genetics\/155.2.945"},{"key":"e_1_3_2_1_26_1","unstructured":"Alec Radford Karthik Narasimhan Tim Salimans Ilya Sutskever 2018. Improving language understanding by generative pre-training. (2018)."},{"key":"e_1_3_2_1_27_1","volume-title":"SPARSKIT: A basic tool kit for sparse matrix computations.","author":"Saad Youcef","year":"1990","unstructured":"Youcef Saad. 1990. SPARSKIT: A basic tool kit for sparse matrix computations. (1990)."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3077136.3080713"},{"key":"e_1_3_2_1_29_1","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan\u00a0N Gomez \u0141ukasz Kaiser and Illia Polosukhin. 2017. Attention is all you need. In Advances in neural information processing systems. 5998\u20136008."},{"key":"e_1_3_2_1_30_1","volume-title":"Graph transformer networks. Advances in neural information processing systems 32","author":"Yun Seongjun","year":"2019","unstructured":"Seongjun Yun, Minbyul Jeong, Raehyun Kim, Jaewoo Kang, and Hyunwoo\u00a0J Kim. 2019. Graph transformer networks. Advances in neural information processing systems 32 (2019)."}],"event":{"name":"ICS '24: 2024 International Conference on Supercomputing","location":"Kyoto Japan","acronym":"ICS '24","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 38th ACM International Conference on Supercomputing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3650200.3656629","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3650200.3656629","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T15:23:42Z","timestamp":1755876222000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3650200.3656629"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,30]]},"references-count":30,"alternative-id":["10.1145\/3650200.3656629","10.1145\/3650200"],"URL":"https:\/\/doi.org\/10.1145\/3650200.3656629","relation":{},"subject":[],"published":{"date-parts":[[2024,5,30]]},"assertion":[{"value":"2024-06-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}