{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,30]],"date-time":"2025-07-30T16:56:48Z","timestamp":1753894608956,"version":"3.41.2"},"reference-count":41,"publisher":"Ubiquity Press, Ltd.","license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,8,24]]},"DOI":"10.5334\/dsj-2020-035","type":"journal-article","created":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T10:32:41Z","timestamp":1598265161000},"source":"Crossref","is-referenced-by-count":3,"title":["SparkNN: A Distributed In-Memory Data Partitioning for KNN Queries on Big Spatial Data"],"prefix":"10.5334","volume":"19","author":[{"given":"Zaher","family":"Al Aghbari","sequence":"first","affiliation":[]},{"given":"Tasneem","family":"Ismail","sequence":"additional","affiliation":[]},{"given":"Ibrahim","family":"Kamel","sequence":"additional","affiliation":[]}],"member":"3285","reference":[{"issue":"11","key":"key20200824063237_B1","doi-asserted-by":"crossref","first-page":"1009","DOI":"10.14778\/2536222.2536227","article-title":"Hadoop gis: A high performance spatial data warehousing system over mapreduce","volume":"6","year":"2013","journal-title":"Proceedings of the VLDB Endowment"},{"issue":"1","key":"key20200824063237_B2","first-page":"1","article-title":"Geosimmr: A mapreduce algorithm for detecting communities based on distance and interest in social networks","volume":"18","year":"2019","journal-title":"Data Science Journal"},{"issue":"1","key":"key20200824063237_B3","doi-asserted-by":"crossref","first-page":"69","DOI":"10.3233\/IDA-2011-0511","article-title":"On clustering large number of data streams","volume":"16","year":"2012","journal-title":"Intelligent Data Analysis"},{"issue":"1","key":"key20200824063237_B4","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1080\/17445760.2012.729584","article-title":"Energy-efficient distributed wireless sensor network scheme for cluster detection","volume":"28","year":"2013","journal-title":"International Journal of Parallel, Emergent and Distributed Systems"},{"first-page":"1","article-title":"In-memory Spatial-Aware Framework for Processing Proximity-Alike Queries in Big Spatial Data","year":"2018","key":"key20200824063237_B5"},{"key":"key20200824063237_B6","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.aeue.2018.09.005","article-title":"Distributed trajectory design for data gathering using mobile sink in wireless sensor networks","volume":"96","year":"2018","journal-title":"AEU-International Journal of Electronics and Communications"},{"key":"key20200824063237_B7","doi-asserted-by":"crossref","first-page":"398","DOI":"10.1016\/j.future.2019.02.035","article-title":"Urban data management system: Towards big data analytics for internet of things based smart urban environment using customized hadoop","volume":"96","year":"2019","journal-title":"Future Generation Computer Systems"},{"first-page":"61","article-title":"Supporting range queries on web data using k-nearest neighbor search","year":"2007","key":"key20200824063237_B8"},{"issue":"1","key":"key20200824063237_B9","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1145\/1327452.1327492","article-title":"MapReduce: simplified data processing on large clusters","volume":"51","year":"2008","journal-title":"Communications of the ACM"},{"issue":"4","key":"key20200824063237_B10","first-page":"131","article-title":"Offline automatic segmentation based recognition of handwritten Arabic words","volume":"4","year":"2011","journal-title":"International Journal of Signal Processing, Image Processing and Pattern Recognition"},{"first-page":"1352","article-title":"Spatialhadoop: A mapreduce framework for spatial data","year":"2015","key":"key20200824063237_B11"},{"first-page":"477","article-title":"A framework for co-location patterns mining in big spatial data","year":"2017","key":"key20200824063237_B12"},{"key":"key20200824063237_B13","unstructured":"Geolite 2 free downloadable databases maxmind developer site. https:\/\/dev.maxmind.com\/geoip\/geoip2\/geolite2\/. Accessed: 2019-05-22."},{"volume-title":"HBase: the definitive guide: random access to your planetsize data","year":"2011","key":"key20200824063237_B14"},{"issue":"2","key":"key20200824063237_B15","first-page":"56","article-title":"SECONDO: A Platform for Moving Objects Database Research and for Publishing and Integrating Research Implementations","volume":"33","year":"2010","journal-title":"IEEE Data Eng. Bull"},{"journal-title":"Datenbanksysteme f\u00fcr Business, Technologie und Web (BTW 2017)","article-title":"The STARK framework for spatio-temporal data analytics on spark","year":"2017","key":"key20200824063237_B16"},{"year":"2011","key":"key20200824063237_B17","article-title":"Fast approximate nearest-neighbor search with k-nearest neighbor graph"},{"key":"key20200824063237_B18","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1016\/j.knosys.2018.05.006","article-title":"Apra: An approximate parallel recommendation algorithm for big data","volume":"157","year":"2018","journal-title":"Knowledge-Based Systems"},{"issue":"4","key":"key20200824063237_B19","doi-asserted-by":"crossref","first-page":"46","DOI":"10.3390\/jsan7040046","article-title":"Opportunistically exploiting internet of things for wireless sensor network routing in smart cities","volume":"7","year":"2018","journal-title":"Journal of Sensor and Actuator Networks"},{"volume-title":"Geospatial Informatics, Fusion, and Motion Video Analytics V","year":"2015","key":"key20200824063237_B20"},{"key":"key20200824063237_B21","unstructured":"JTS Topology Suite. https:\/\/www.osgeo.org\/projects\/jts\/. Accessed: 2019-06-18."},{"issue":"2","key":"key20200824063237_B22","doi-asserted-by":"crossref","first-page":"163","DOI":"10.1142\/S0219691303000141","article-title":"Content-based image retrieval technique using wavelet-based shift and brightness invariant edge feature","volume":"1","year":"2003","journal-title":"International Journal of Wavelets, Multiresolution and Information Processing"},{"first-page":"1190","article-title":"Parallel secondo: A practical system for largescale processing of moving objects","year":"2014","key":"key20200824063237_B23"},{"key":"key20200824063237_B24","unstructured":"Magellan: Geospatial Analytics on Spark. Oct. 2015. https:\/\/hortonworks.com\/blog\/magellan-geospatial-analytics-in-spark\/. Accessed: 2019-06-18."},{"first-page":"7","article-title":"MD-HBase: A scalable multi-dimensional data infrastructure for location aware services","year":"2011","key":"key20200824063237_B25"},{"key":"key20200824063237_B26","unstructured":"OpenStreetMap. https:\/\/www.openstreetmap.org\/. Accessed: 2019-06-18."},{"key":"key20200824063237_B27","unstructured":"Ryan LeCompte. Bounded priority queue in scala. https:\/\/gist.github.com\/ryanlecompte\/5746241. Accessed: 2019-06-08."},{"key":"key20200824063237_B28","doi-asserted-by":"crossref","first-page":"893","DOI":"10.1016\/j.future.2016.10.019","article-title":"Social networking data analysis tools and challenges","volume":"86","year":"2018","journal-title":"Future Generation Computer Systems"},{"first-page":"263","article-title":"Interactive and Scalable Exploration of Big Spatial Data\u2013A Data Management Perspective","year":"2015","key":"key20200824063237_B29"},{"issue":"13","key":"key20200824063237_B30","doi-asserted-by":"crossref","first-page":"1565","DOI":"10.14778\/3007263.3007310","article-title":"Locationspark: A distributed in-memory data management system for big spatial data","volume":"9","year":"2016","journal-title":"Proceedings of the VLDB Endowment"},{"issue":"2","key":"key20200824063237_B31","doi-asserted-by":"crossref","first-page":"1626","DOI":"10.14778\/1687553.1687609","article-title":"Hive: a warehousing solution over a mapreduce framework","volume":"2","year":"2009","journal-title":"Proceedings of the VLDB Endowment"},{"volume-title":"Hadoop: The definitive guide","year":"2012","key":"key20200824063237_B32"},{"first-page":"73","article-title":"Spatial indexing and analytics on Hadoop","year":"2014","key":"key20200824063237_B33"},{"first-page":"1071","article-title":"Simba: Efficient in-memory spatial analytics","year":"2016","key":"key20200824063237_B34"},{"first-page":"200","article-title":"On massive spatial data retrieval based on spark","year":"2014","key":"key20200824063237_B35"},{"first-page":"34","article-title":"Large-scale spatial join query processing in cloud","year":"2015","key":"key20200824063237_B36"},{"year":"2015","key":"key20200824063237_B37","article-title":"Geospark: A cluster computing framework for processing large-scale spatial data"},{"first-page":"2","article-title":"Resilient distributed datasets: A fault-tolerant abstraction for in-memory cluster computing","year":"2012","key":"key20200824063237_B38"},{"issue":"11","key":"key20200824063237_B39","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1145\/2934664","article-title":"Apache spark: a unified engine for big data processing","volume":"59","year":"2016","journal-title":"Communications of the ACM"},{"volume-title":"SIGIR","year":"2015","key":"key20200824063237_B40"},{"first-page":"11","article-title":"Trajspark: A scalable and efficient in-memory management system for big trajectory data","year":"2017","key":"key20200824063237_B41"}],"container-title":["Data Science Journal"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/doi.org\/10.5334\/dsj-2020-035","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,11]],"date-time":"2022-07-11T09:20:38Z","timestamp":1657531238000},"score":1,"resource":{"primary":{"URL":"http:\/\/datascience.codata.org\/articles\/10.5334\/dsj-2020-035\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"references-count":41,"alternative-id":["10.5334\/dsj-2020-035"],"URL":"https:\/\/doi.org\/10.5334\/dsj-2020-035","relation":{},"ISSN":["1683-1470"],"issn-type":[{"type":"electronic","value":"1683-1470"}],"subject":[],"published":{"date-parts":[[2020]]},"article-number":"35"}}