{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,18]],"date-time":"2025-11-18T20:30:40Z","timestamp":1763497840566,"version":"3.37.3"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2022,9,8]],"date-time":"2022-09-08T00:00:00Z","timestamp":1662595200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,9,8]],"date-time":"2022-09-08T00:00:00Z","timestamp":1662595200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001459","name":"Ministry of Education - Singapore","doi-asserted-by":"publisher","award":["RG35\/20","MOE2019-T21-042"],"award-info":[{"award-number":["RG35\/20","MOE2019-T21-042"]}],"id":[{"id":"10.13039\/501100001459","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2024,1]]},"DOI":"10.1007\/s41060-022-00362-9","type":"journal-article","created":{"date-parts":[[2022,9,8]],"date-time":"2022-09-08T16:22:35Z","timestamp":1662654155000},"page":"111-125","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["What can scatterplots teach us about doing data science better?"],"prefix":"10.1007","volume":"17","author":[{"given":"Wilson Wen Bin","family":"Goh","sequence":"first","affiliation":[]},{"given":"Reuben Jyong Kiat","family":"Foo","sequence":"additional","affiliation":[]},{"given":"Limsoon","family":"Wong","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,9,8]]},"reference":[{"key":"362_CR1","doi-asserted-by":"publisher","first-page":"402","DOI":"10.1109\/TVCG.2017.2744184","volume":"24","author":"A Sarikaya","year":"2018","unstructured":"Sarikaya, A., Gleicher, M.: Scatterplots: tasks, data, and designs. IEEE Trans. Vis. Comput. Graphics 24, 402\u2013412 (2018). https:\/\/doi.org\/10.1109\/TVCG.2017.2744184","journal-title":"IEEE Trans. Vis. Comput. Graphics"},{"key":"362_CR2","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1057\/palgrave.ivs.9500122","volume":"5","author":"E Bertini","year":"2006","unstructured":"Bertini, E., Santucci, G.: Give chance a chance: modeling density to enhance scatter plot quality through random data sampling. Inf. Vis. 5, 95\u2013110 (2006). https:\/\/doi.org\/10.1057\/palgrave.ivs.9500122","journal-title":"Inf. Vis."},{"key":"362_CR3","doi-asserted-by":"publisher","unstructured":"Carr, D.B. (1990) Looking at large data sets using binned data plots. United\nStates. https:\/\/doi.org\/10.2172\/6930282","DOI":"10.2172\/6930282"},{"key":"362_CR4","doi-asserted-by":"publisher","first-page":"1526","DOI":"10.1109\/TVCG.2013.65","volume":"19","author":"A Mayorga","year":"2013","unstructured":"Mayorga, A., Gleicher, M.: Splatterplots: overcoming overdraw in scatter plots. IEEE Trans. Vis. Comput. Graphics 19, 1526\u20131538 (2013). https:\/\/doi.org\/10.1109\/TVCG.2013.65","journal-title":"IEEE Trans. Visual Comput. Graphics"},{"key":"362_CR5","doi-asserted-by":"publisher","first-page":"1009","DOI":"10.1109\/TVCG.2009.122","volume":"15","author":"C Collins","year":"2009","unstructured":"Collins, C., et al.: Bubble sets: revealing set relations with isocontours over existing visualizations. IEEE Trans. Visual Comput. Graphics 15, 1009\u20131016 (2009). https:\/\/doi.org\/10.1109\/TVCG.2009.122","journal-title":"IEEE Trans. Visual Comput. Graphics"},{"key":"362_CR6","doi-asserted-by":"publisher","first-page":"2625","DOI":"10.1109\/TVCG.2013.150","volume":"19","author":"X Yuan","year":"2013","unstructured":"Yuan, X., et al.: Dimension projection matrix\/tree: interactive subspace visual exploration and analysis of high dimensional data. IEEE Trans. Visual Comput. Graphics 19, 2625\u20132633 (2013). https:\/\/doi.org\/10.1109\/TVCG.2013.150","journal-title":"IEEE Trans. Visual Comput. Graphics"},{"key":"362_CR7","doi-asserted-by":"publisher","first-page":"424","DOI":"10.2307\/2289444","volume":"82","author":"DB Carr","year":"1987","unstructured":"Carr, D.B., et al.: Scatterplot matrix techniques for large N. J. Am. Stat. Assoc. 82, 424\u2013436 (1987). https:\/\/doi.org\/10.2307\/2289444","journal-title":"J. Am. Stat. Assoc."},{"key":"362_CR8","unstructured":"Heinrich, J. et al. (2012). The parallel coordinates matrix. EuroVis (Short Papers)."},{"key":"362_CR9","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1111\/j.1538-4632.1989.tb00879.x","volume":"21","author":"M Monmonier","year":"1989","unstructured":"Monmonier, M.: Geographic brushing: enhancing exploratory analysis of the scatterplot matrix. Geogr. Anal. 21, 81\u201384 (1989). https:\/\/doi.org\/10.1111\/j.1538-4632.1989.tb00879.x","journal-title":"Geogr. Anal."},{"key":"362_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.visinf.2020.09.004","volume":"4","author":"QV Nguyen","year":"2020","unstructured":"Nguyen, Q.V., et al.: Evaluation on interactive visualization data with scatterplots. Vis. Inf. 4, 1\u201310 (2020). https:\/\/doi.org\/10.1016\/j.visinf.2020.09.004","journal-title":"Vis. Inf."},{"key":"362_CR11","doi-asserted-by":"publisher","DOI":"10.1007\/s41060-020-00230-4","author":"S Ho","year":"2021","unstructured":"Ho, S., et al.: What can Venn diagrams teach us about doing data science better? Int. J. Data Sci. Anal. (2021). https:\/\/doi.org\/10.1007\/s41060-020-00230-4","journal-title":"Int. J. Data Sci. Anal."},{"key":"362_CR12","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0166742","volume":"12","author":"L Moneta-Koehler","year":"2017","unstructured":"Moneta-Koehler, L., et al.: The limitations of the GRE in predicting success in biomedical graduate school. PLoS ONE 12, e0166742 (2017). https:\/\/doi.org\/10.1371\/journal.pone.0166742","journal-title":"PLoS ONE"},{"key":"362_CR13","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0206570","volume":"13","author":"SL Petersen","year":"2018","unstructured":"Petersen, S.L., et al.: Multi-institutional study of GRE scores as predictors of STEM PhD degree completion: GRE gets a low mark. PLoS ONE 13, e0206570 (2018). https:\/\/doi.org\/10.1371\/journal.pone.0206570","journal-title":"PLoS ONE"},{"key":"362_CR14","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1080\/15578771.2015.1050562","volume":"12","author":"JO Wao","year":"2016","unstructured":"Wao, J.O., et al.: Relationship between admission GRE scores and graduation GPA scores of construction management graduate students. Int. J. Constr. Educ. Res. 12, 37\u201353 (2016). https:\/\/doi.org\/10.1080\/15578771.2015.1050562","journal-title":"Int. J. Constr. Educ. Res."},{"key":"362_CR15","doi-asserted-by":"publisher","first-page":"899","DOI":"10.1038\/nmeth.3587","volume":"12","author":"N Altman","year":"2015","unstructured":"Altman, N., Krzywinski, M.: Association, correlation and causation. Nat. Methods 12, 899\u2013900 (2015). https:\/\/doi.org\/10.1038\/nmeth.3587","journal-title":"Nat. Methods"},{"key":"362_CR16","doi-asserted-by":"publisher","first-page":"2261","DOI":"10.1002\/smj.3199","volume":"41","author":"E Starr","year":"2020","unstructured":"Starr, E., Goldfarb, B.: Binned scatterplots: a simple tool to make research easier and better. Strateg. Manag. J. 41, 2261\u20132274 (2020). https:\/\/doi.org\/10.1002\/smj.3199","journal-title":"Strateg. Manag. J."},{"key":"362_CR17","doi-asserted-by":"publisher","unstructured":"Cuklina, J. et al. (2021) Diagnostics and correction of batch effects in large-scale proteomic studies: a tutorial. Mol. Syst. Biol. 17, e10240. https:\/\/doi.org\/10.15252\/msb.202110240","DOI":"10.15252\/msb.202110240"},{"key":"362_CR18","doi-asserted-by":"publisher","first-page":"496","DOI":"10.1177\/2168479016654738","volume":"50","author":"RC Zink","year":"2016","unstructured":"Zink, R.C., Jiang, X.: Using contour plots to assess the sensitivity of clinical trial design assumptions. Ther. Innov. Regul. Sci. 50, 496\u2013509 (2016). https:\/\/doi.org\/10.1177\/2168479016654738","journal-title":"Ther. Innov. Regul. Sci."},{"key":"362_CR19","doi-asserted-by":"crossref","unstructured":"Wallner, G., Kriglstein, S.: Multivariate visualization of game metrics: an evaluation of hexbin maps. In: Proceedings of the Annual Symposium on Computer-Human Interaction in Play. Association for Computing Machinery (2020)","DOI":"10.1145\/3410404.3414233"},{"key":"362_CR20","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2022.3158093","author":"D Reimann","year":"2022","unstructured":"Reimann, D., et al.: Lollipops help align visual and statistical fit estimates in scatterplots with nonlinear models. IEEE Trans. Vis. Comput. Gr. (2022). https:\/\/doi.org\/10.1109\/TVCG.2022.3158093","journal-title":"IEEE Trans. Visual Comput. Gr."},{"key":"362_CR21","doi-asserted-by":"publisher","first-page":"531","DOI":"10.2307\/2288400","volume":"79","author":"WS Cleveland","year":"1984","unstructured":"Cleveland, W.S., McGill, R.: Graphical perception: theory, experimentation, and application to the development of graphical methods. J. Am. Stat. Assoc. 79, 531\u2013554 (1984). https:\/\/doi.org\/10.2307\/2288400","journal-title":"J. Am. Stat. Assoc."},{"key":"362_CR22","doi-asserted-by":"crossref","unstructured":"Heer, J., Bostock, M. (2010). Crowdsourcing graphical perception: using mechanical turk to assess visualization design. In: Proceedings of the SIGCHI Conference on Human Factors in Computing Systems. Association for Computing Machinery","DOI":"10.1145\/1753326.1753357"},{"key":"362_CR23","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1109\/TVCG.2021.3114684","volume":"28","author":"CM McColeman","year":"2021","unstructured":"McColeman, C.M., et al.: Rethinking the ranks of visual channels. IEEE Trans. Visual Comput. Graphics 28, 707\u2013717 (2021)","journal-title":"IEEE Trans. Visual Comput. Graphics"},{"key":"362_CR24","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1016\/S1535-6108(02)00032-6","volume":"1","author":"EJ Yeoh","year":"2002","unstructured":"Yeoh, E.J., et al.: Classification, subtype discovery, and prediction of outcome in pediatric acute lymphoblastic leukemia by gene expression profiling. Cancer Cell 1, 133\u2013143 (2002)","journal-title":"Cancer Cell"},{"key":"362_CR25","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1006391","volume":"14","author":"T Yu","year":"2018","unstructured":"Yu, T.: A new dynamic correlation algorithm reveals novel functional aspects in single cell and bulk RNA-seq data. PLoS Comput. Biol. 14, e1006391 (2018). https:\/\/doi.org\/10.1371\/journal.pcbi.1006391","journal-title":"PLoS Comput. Biol."},{"key":"362_CR26","doi-asserted-by":"publisher","first-page":"644","DOI":"10.1016\/j.drudis.2017.11.011","volume":"23","author":"L Zhou","year":"2018","unstructured":"Zhou, L., et al.: Understanding missing proteins: a functional perspective. Drug Discov. Today 23, 644\u2013651 (2018). https:\/\/doi.org\/10.1016\/j.drudis.2017.11.011","journal-title":"Drug Discov. Today"},{"key":"362_CR27","doi-asserted-by":"publisher","first-page":"1993","DOI":"10.1021\/pr501138h","volume":"14","author":"B-JM Webb-Robertson","year":"2015","unstructured":"Webb-Robertson, B.-J.M., et al.: Review, evaluation, and discussion of the challenges of missing value imputation for mass spectrometry-based label-free global proteomics. J. Proteome Res. 14, 1993\u20132001 (2015). https:\/\/doi.org\/10.1021\/pr501138h","journal-title":"J. Proteome Res."},{"key":"362_CR28","doi-asserted-by":"publisher","first-page":"407","DOI":"10.1038\/nm.3807","volume":"21","author":"T Guo","year":"2015","unstructured":"Guo, T., et al.: Rapid mass spectrometric conversion of tissue biopsy samples into permanent quantitative digital proteome maps. Nat. Med. 21, 407\u2013413 (2015). https:\/\/doi.org\/10.1038\/nm.3807","journal-title":"Nat. Med."},{"key":"362_CR29","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1186\/s13062-015-0098-x","volume":"10","author":"WW Goh","year":"2015","unstructured":"Goh, W.W., et al.: Quantitative proteomics signature profiling based on network contextualization. Biol. Direct 10, 71 (2015). https:\/\/doi.org\/10.1186\/s13062-015-0098-x","journal-title":"Biol. Direct"},{"key":"362_CR30","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1007\/s41060-016-0024-z","volume":"2","author":"A Polyzou","year":"2016","unstructured":"Polyzou, A., Karypis, G.: Grade prediction with models specific to students and courses. Int. J. Data Sci. Anal. 2, 159\u2013171 (2016). https:\/\/doi.org\/10.1007\/s41060-016-0024-z","journal-title":"Int. J. Data Sci. Anal."},{"key":"362_CR31","doi-asserted-by":"crossref","unstructured":"Jaber, M. et al.:. A multi-granularity pattern-based sequence classification framework for educational data. In: 2016 IEEE International Conference on Data Science and Advanced Analytics (DSAA) (2016)","DOI":"10.1109\/DSAA.2016.46"},{"key":"362_CR32","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1504\/IJDATS.2020.108080","volume":"12","author":"D Stamovlasis","year":"2020","unstructured":"Stamovlasis, D., et al.: A comparative evaluation of dissimilarity-based and model-based clustering in science education research: the case of children\u2019s mental models of the Earth. Int. J. Data Anal. Tech. Strategies 12, 247\u2013261 (2020). https:\/\/doi.org\/10.1504\/IJDATS.2020.108080","journal-title":"Int. J. Data Anal. Tech. Strategies"},{"key":"362_CR33","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1109\/MIS.2019.2936705","volume":"34","author":"L Cao","year":"2019","unstructured":"Cao, L.: Data science: profession and education. IEEE Intell. Syst. 34, 35\u201344 (2019). https:\/\/doi.org\/10.1109\/MIS.2019.2936705","journal-title":"IEEE Intell. Syst."},{"key":"362_CR34","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1002\/jhbs.20078","volume":"41","author":"M Friendly","year":"2005","unstructured":"Friendly, M., Denis, D.: The early origins and development of the scatterplot. J. Hist. Behav. Sci. 41, 103\u2013130 (2005). https:\/\/doi.org\/10.1002\/jhbs.20078","journal-title":"J. Hist. Behav. Sci."},{"key":"362_CR35","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1080\/00031305.1973.10478966","volume":"27","author":"FJ Anscombe","year":"1973","unstructured":"Anscombe, F.J.: Graphs in statistical analysis. Am. Stat. 27, 17\u201321 (1973). https:\/\/doi.org\/10.1080\/00031305.1973.10478966","journal-title":"Am. Stat."},{"key":"362_CR36","doi-asserted-by":"crossref","unstructured":"Matejka, J., Fitzmaurice, G.: Same Stats, Different Graphs: Generating Datasets with Varied Appearance and Identical Statistics through Simulated Annealing (2017)","DOI":"10.1145\/3025453.3025912"},{"key":"362_CR37","doi-asserted-by":"publisher","first-page":"1131","DOI":"10.1038\/nmeth.2258","volume":"9","author":"B Wong","year":"2012","unstructured":"Wong, B.: Visualizing biological data. Nat. Methods 9, 1131\u20131131 (2012). https:\/\/doi.org\/10.1038\/nmeth.2258","journal-title":"Nat. Methods"},{"key":"362_CR38","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pbio.1002128","volume":"13","author":"TL Weissgerber","year":"2015","unstructured":"Weissgerber, T.L., et al.: Beyond bar and line graphs: time for a new data presentation paradigm. PLoS Biol. 13, e1002128 (2015). https:\/\/doi.org\/10.1371\/journal.pbio.1002128","journal-title":"PLoS Biol."},{"key":"362_CR39","doi-asserted-by":"publisher","unstructured":"Giuliani, A.: Put the blame on the formula: an incredible (but real) tale from the top of modern science. Organisms Journal of Biological Sciences (2019). https:\/\/doi.org\/10.13133\/2532-5876_5.5","DOI":"10.13133\/2532-5876_5.5"},{"key":"362_CR40","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1002277","volume":"7","author":"L Kall","year":"2011","unstructured":"Kall, L., Vitek, O.: Computational mass spectrometry-based proteomics. PLoS Comput. Biol. 7, e1002277 (2011). https:\/\/doi.org\/10.1371\/journal.pcbi.1002277","journal-title":"PLoS Comput. Biol."}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-022-00362-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-022-00362-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-022-00362-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,17]],"date-time":"2024-01-17T10:17:25Z","timestamp":1705486645000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-022-00362-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,8]]},"references-count":40,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2024,1]]}},"alternative-id":["362"],"URL":"https:\/\/doi.org\/10.1007\/s41060-022-00362-9","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"type":"print","value":"2364-415X"},{"type":"electronic","value":"2364-4168"}],"subject":[],"published":{"date-parts":[[2022,9,8]]},"assertion":[{"value":"7 June 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 August 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 September 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests, financial or otherwise.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}