{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:30:04Z","timestamp":1775003404229,"version":"3.50.1"},"reference-count":98,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,17]],"date-time":"2024-12-17T00:00:00Z","timestamp":1734393600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,17]],"date-time":"2024-12-17T00:00:00Z","timestamp":1734393600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,17]]},"DOI":"10.1109\/icca62237.2024.10927845","type":"proceedings-article","created":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T02:16:27Z","timestamp":1743041787000},"page":"1-10","source":"Crossref","is-referenced-by-count":3,"title":["Data Partitioning and Storage Strategies for Artificial Intelligence and Machine Learning Applications: A Review of Techniques"],"prefix":"10.1109","author":[{"given":"Kingsley C.","family":"Nwosu","sequence":"first","affiliation":[{"name":"Norfolk State University,Department of Computer Science,Norfolk,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ibrahim","family":"Kamara","sequence":"additional","affiliation":[{"name":"Norfolk State University,Department of Computer Science,Norfolk,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Musbah","family":"Abdulgader","sequence":"additional","affiliation":[{"name":"Norfolk State University,Department of Computer Science,Norfolk,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yen-Hung","family":"Hu","sequence":"additional","affiliation":[{"name":"Norfolk State University,Department of Computer Science,Norfolk,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1166\/asl.2017.10229"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3047307"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-45876-X_28"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/icime.2010.5477529"},{"key":"ref5","article-title":"Sampling-based range partition methods for big data analytics","author":"Vojnovic","year":"2012","journal-title":"Technical report, Microsoft Research"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/SC.1998.10025"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/iceta51985.2020.9379231"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2015.7364047"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/iciccs53718.2022.9788257"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1631\/FITEE.1601883"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/tkde.2019.2946162"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/bigdse.2015.9"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/imcet59736.2023.10368261"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.5334\/dsj-2015-002"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3148238"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1117\/12.2585723"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2018.11.066"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/s10614-021-10126-5"},{"key":"ref19","article-title":"Randomized Machine Learning Approaches: Recent Developments and Challenges","author":"Gallicchio","year":"2017","journal-title":"ESANN"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7908-2604-3_16"},{"key":"ref21","volume-title":"Deep Learning","author":"Goodfellow","year":"2016"},{"key":"ref22","article-title":"A machine learning approach to databases indexes","author":"Beutel","year":"2017","journal-title":"ML Systems Workshop, NIPS"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.14778\/3659437.3659441"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-020-01674-8"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3318464.3389703"},{"key":"ref26","volume-title":"Database System Concepts","author":"Silberschatz","year":"2010"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4899-7637-6"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2009.263"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1201\/b16527"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1016\/S0305-0548(01)00031-4"},{"key":"ref31","volume-title":"Batch Processes","author":"Korovessi","year":"2006"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/BigData47090.2019.9006337"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2017.03.009"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TCSS.2016.2516039"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-15887-3_30"},{"key":"ref36","author":"Cano","year":"2015","journal-title":"ASML: automatic streaming machine learning"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3588982.3603608"},{"key":"ref38","volume-title":"Storing Hierarchical Data in SQL: Mastering Graph Structures","author":"Rahnama","year":"2011"},{"key":"ref39","volume-title":"Storing Hierarchical Data in SQL: Mastering Graph Structures","author":"Fox","year":"2023"},{"key":"ref40","article-title":"TIBCO","volume-title":"What is Hierarchical Data?","year":"2024"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1093\/bib\/bbac216"},{"key":"ref42","first-page":"3417","article-title":"Sublinear algorithms for hierarchical clustering","volume":"35","author":"Agarwal","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2854283"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICNSC.2019.8743164"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-26253-2_13"},{"key":"ref46","volume-title":"Database Internals: A Deep Dive into How Distributed Data Systems Work","author":"Petrov"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1002\/9780470602379"},{"issue":"2","key":"ref48","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3377454","article-title":"A survey on distributed machine learning","volume":"53","author":"Verbraeken","year":"2020","journal-title":"ACM Computing Surveys (CSUR)"},{"key":"ref49","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s13748-012-0035-5","article-title":"A survey of methods for distributed machine learning","volume":"2","author":"Peteiro-Barral","year":"2013","journal-title":"Progress in Artificial Intelligence"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2021.3086014"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2022.3140660"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-57500-6"},{"key":"ref53","volume-title":"Understanding Data Encryption: A Practical Guide to Secure Computing","author":"Smith","year":"2020"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1145\/258533.258660"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611975031.39"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS57527.2023.00048"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1145\/3488838.3488862"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1145\/3488838.3488862"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-020-03076-4"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1007\/s11227-017-2027-5"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1145\/3489517.3530553"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-48308-5_56"},{"key":"ref63","first-page":"13","article-title":"Advanced partitioning techniques for massively distributed computation","author":"Zhou","journal-title":"Proceedings of the 2012 ACM SIGMOD International Conference on Management of Data"},{"key":"ref64","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1145\/3127479.3131613","article-title":"A robust partitioning scheme for ad-hoc query workloads","author":"Shanbhag","year":"2017","journal-title":"Proceedings of the 2017 Symposium on Cloud Computing"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3365810"},{"key":"ref66","first-page":"121","article-title":"A graph based technique of process partitioning","author":"Xue","year":"2018","journal-title":"Journal of Web Engineering"},{"key":"ref67","first-page":"31","article-title":"Graph mining based on a data partitioning approach","author":"Nguyen","journal-title":"Proceedings of the Nineteenth Conference on Australasian Database"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1007\/bfb0025878"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2018.00096"},{"key":"ref70","article-title":"Improving Hadoop Performance with Data Locality","author":"Shvachko","year":"2010","journal-title":"Proceedings of the IEEE International Symposium on Parallel and Distributed Processing"},{"key":"ref71","first-page":"1","article-title":"The Impact of Data Locality on MapReduce Performance: An In-depth Study","volume-title":"Proceedings of the VLDB Endowment","volume":"3","author":"Ibrahim","year":"2010"},{"issue":"2","key":"ref72","first-page":"165","article-title":"Data Locality in Distributed Systems","volume":"19","author":"Frachtenberg","journal-title":"IEEE Transactions on Parallel and Distributed Systems"},{"issue":"2","key":"ref73","first-page":"126","article-title":"Optimizing Data Locality for Efficient Big Data Processing","volume":"3","author":"Zhang","year":"2015","journal-title":"IEEE Transactions on Cloud Computing"},{"issue":"1","key":"ref74","first-page":"173","article-title":"Data Locality-Aware Load Balancing for Distributed Systems","volume":"39","author":"Gandhi","year":"2011","journal-title":"ACM SIGMETRICS Performance Evaluation Review"},{"issue":"4","key":"ref75","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1145\/121973.121975","article-title":"What is scalability?","volume":"18","author":"Hill","year":"1990","journal-title":"ACM SIGARCH Computer Architecture News"},{"key":"ref76","doi-asserted-by":"crossref","first-page":"195","DOI":"10.1145\/350391.350432","article-title":"Characteristics of scalability and their impact on performance","author":"Bondi","year":"2000","journal-title":"Proceedings of the 2nd International Workshop on Software and Performance"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/71.862209"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/SPLC.1993.365568"},{"key":"ref79","doi-asserted-by":"crossref","first-page":"195","DOI":"10.1145\/350391.350432","article-title":"Characteristics of scalability and their impact on performance","author":"Bondi","year":"2000","journal-title":"Proceedings of the 2nd International Workshop on Software and Performance"},{"issue":"7","key":"ref80","first-page":"2124","article-title":"Survey On Scalability In Cloud Environment","volume":"5","author":"Ab Rashid Dar","year":"2016","journal-title":"International Journal of Advanced Research in Computer Engineering & Technology (IJARCET)"},{"issue":"4","key":"ref81","doi-asserted-by":"crossref","first-page":"425","DOI":"10.1016\/0360-8352(90)90001-3","article-title":"Evaluation of interprocessor communication overhead in distributed computer systems","volume":"18","author":"Bhatia","year":"1990","journal-title":"Computers & Industrial Engineering"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/ALLERTON.2016.7852338"},{"key":"ref83","first-page":"1790","article-title":"Minimizing of the communication overhead in distributed control computer of power system using correct partition and DMA","author":"Zdenek","year":"2006","journal-title":"Proceedings of IASME\/WSEAS International Conference Energy and Environment 2006"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/ICPP.2010.30"},{"issue":"1","key":"ref85","first-page":"5641831","article-title":"A hierarchical load balancing strategy considering communication delay overhead for large distributed computing systems","volume":"2016","author":"Yang","year":"2016","journal-title":"Mathematical Problems in Engineering"},{"key":"ref86","volume-title":"Distributed Systems: Principles and Paradigms","author":"Tanenbaum","year":"2002"},{"key":"ref87","volume-title":"Designing Data-Intensive Applications","author":"Kleppmann","year":"2017"},{"issue":"1","key":"ref88","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1145\/146941.146943","article-title":"The design and implementation of a log-structured file system","volume":"10","author":"Rosenblum","year":"1992","journal-title":"ACM Trans. Comput. Syst"},{"key":"ref89","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/978-981-15-6401-7_11-1","article-title":"Fault Tolerant Architectures","volume-title":"Handbook of Computer Architecture","author":"Sahoo","year":"2023"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/OJCS.2020.3006807"},{"key":"ref91","first-page":"290","article-title":"On the structure of the system of minimum edge cuts of a graph","author":"Dinitz","year":"1976","journal-title":"Issledovaniya po Diskretnoi Optimizatsii"},{"key":"ref92","first-page":"229","article-title":"Faster algorithms for finding small edge cuts in planar graphs","author":"Rao","journal-title":"Proceedings of the twenty-fourth annual ACM symposium on Theory of computing"},{"key":"ref93","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/0012-365X(92)90690-H","article-title":"Max-cut in circulant graphs","volume":"108","author":"Poljak","year":"1992","journal-title":"Discrete Mathematics"},{"key":"ref94","article-title":"Computing vertex-edge cut-pairs and 2-edge cuts in practice","author":"Georgiadis","year":"2021","journal-title":"19th International Symposium on Experimental Algorithms (SEA 2021). Schloss Dagstuhl-Leibniz-Zentrum fur Informatik"},{"issue":"1","key":"ref95","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1002\/jgt.21746","article-title":"On maximum edge cuts of connected digraphs","volume":"76","author":"Chen","year":"2014","journal-title":"Journal of Graph Theory"},{"key":"ref96","volume-title":"Database Systems: The Complete Book","author":"Garcia-Molina","year":"2008"},{"key":"ref97","first-page":"3","article-title":"The Wisconsin Benchmark: Past, Present, and Future","author":"DeWitt","year":"1993","journal-title":"Proceedings of the 2nd International Conference on Parallel and Distributed Information Systems"},{"key":"ref98","first-page":"296","article-title":"Parallel multilevel algorithms for multi-constraint graph partitioning","volume-title":"in European Conference on Parallel Processing","author":"Schloegel","year":"2000"}],"event":{"name":"2024 International Conference on Computer and Applications (ICCA)","location":"Cairo, Egypt","start":{"date-parts":[[2024,12,17]]},"end":{"date-parts":[[2024,12,19]]}},"container-title":["2024 International Conference on Computer and Applications (ICCA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10927736\/10927741\/10927845.pdf?arnumber=10927845","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T07:45:25Z","timestamp":1743061525000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10927845\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,17]]},"references-count":98,"URL":"https:\/\/doi.org\/10.1109\/icca62237.2024.10927845","relation":{},"subject":[],"published":{"date-parts":[[2024,12,17]]}}}