{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,7]],"date-time":"2025-07-07T13:27:38Z","timestamp":1751894858537,"version":"3.37.3"},"reference-count":54,"publisher":"Springer Science and Business Media LLC","issue":"29","license":[{"start":{"date-parts":[[2022,8,13]],"date-time":"2022-08-13T00:00:00Z","timestamp":1660348800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,8,13]],"date-time":"2022-08-13T00:00:00Z","timestamp":1660348800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100010410","name":"Education University of Hong Kong","doi-asserted-by":"crossref","award":["Dean\u2019s Research Fund 2018-19 (FLASS\/DRF\/IDS-3)"],"award-info":[{"award-number":["Dean\u2019s Research Fund 2018-19 (FLASS\/DRF\/IDS-3)"]}],"id":[{"id":"10.13039\/501100010410","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100010410","name":"Education University of Hong Kong","doi-asserted-by":"crossref","award":["Departmental Collaborative Research Fund 2019 (MIT\/DCRF-R2\/18-19)"],"award-info":[{"award-number":["Departmental Collaborative Research Fund 2019 (MIT\/DCRF-R2\/18-19)"]}],"id":[{"id":"10.13039\/501100010410","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100014736","name":"Lingnan University","doi-asserted-by":"crossref","award":["Faculty Research Grant (DB21A9)"],"award-info":[{"award-number":["Faculty Research Grant (DB21A9)"]}],"id":[{"id":"10.13039\/501100014736","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2022,12]]},"DOI":"10.1007\/s11042-022-13476-w","type":"journal-article","created":{"date-parts":[[2022,8,13]],"date-time":"2022-08-13T04:02:36Z","timestamp":1660363356000},"page":"42871-42887","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["A deep data augmentation framework based on generative adversarial networks"],"prefix":"10.1007","volume":"81","author":[{"given":"Qiping","family":"Wang","sequence":"first","affiliation":[]},{"given":"Ling","family":"Luo","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0965-3617","authenticated-orcid":false,"given":"Haoran","family":"Xie","sequence":"additional","affiliation":[]},{"given":"Yanghui","family":"Rao","sequence":"additional","affiliation":[]},{"given":"Raymond Y.K.","family":"Lau","sequence":"additional","affiliation":[]},{"given":"Detian","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,8,13]]},"reference":[{"key":"13476_CR1","unstructured":"Abadi M, Agarwal A, Barham P, Brevdo E, Chen Z, Citro C, Corrado GS, Davis A, Dean J, Devin M, Ghemawat S (2016) TensorFlow: Large-scale machine learning on heterogeneous systems, arXiv:1603.04467"},{"key":"13476_CR2","doi-asserted-by":"crossref","unstructured":"Antoniou A, Storkey A, Edwards H (2018) Augmenting image classifiers using data augmentation generative adversarial networks. In: International conference on artificial neural networks, pp 594\u2013603","DOI":"10.1007\/978-3-030-01424-7_58"},{"key":"13476_CR3","unstructured":"Arjovsky M, Chintala S, Bottou L (2017) Wasserstein gan. arXiv:1701.07875"},{"key":"13476_CR4","unstructured":"Brock A, Donahue J, Simonyan K (2018) Large scale gan training for high fidelity natural image synthesis. arXiv:1809.11096"},{"key":"13476_CR5","doi-asserted-by":"crossref","unstructured":"Chen Y, Li W, Sakaridis C, Dai D, Van Gool L (2018) Domain adaptive faster r-cnn for object detection in the wild. In: The IEEE Conference on conference on computer vision and pattern recognition (CVPR), pp 3339\u20133348","DOI":"10.1109\/CVPR.2018.00352"},{"key":"13476_CR6","doi-asserted-by":"crossref","unstructured":"Cohen G, Afshar S, Tapson J, van Schaik A (2017) EMNIST: Extending MNIST to handwritten letters. In: 2017 International Joint Conference on Neural Networks (IJCNN), pp 2921\u20132926","DOI":"10.1109\/IJCNN.2017.7966217"},{"key":"13476_CR7","doi-asserted-by":"crossref","unstructured":"Cubuk ED, Zoph B, Man\u00e9 D, Vasudevan V, Le QV (2018) Autoaugment: Learning augmentation policies from data. arXiv:1805.09501","DOI":"10.1109\/CVPR.2019.00020"},{"key":"13476_CR8","doi-asserted-by":"crossref","unstructured":"Cui X, Goel V, Kingsbury B (2014) Data augmentation for deep neural network acoustic modeling. In: 2014 IEEE International conference on acoustics, speech and signal processing (ICASSP), pp 5582\u20135586","DOI":"10.1109\/ICASSP.2014.6854671"},{"key":"13476_CR9","unstructured":"Denton E, Chintala S, Szlam A, Fergus R (2015) Deep generative image models using a laplacian pyramid of adversarial networks. In: Advances in neural information processing systems (NIPS), pp 1486\u20131494"},{"key":"13476_CR10","doi-asserted-by":"crossref","unstructured":"Dixit M, Kwitt R, Niethammer M, Vasconcelos N (2017) Aga: Attribute-guided augmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7455\u20137463","DOI":"10.1109\/CVPR.2017.355"},{"key":"13476_CR11","doi-asserted-by":"crossref","unstructured":"Fawzi A, Samulowitz H, Turaga D, Frossard P (2016) Adaptive data augmentation for image classification. In: IEEE international conference on image processing (ICIP), pp 3688\u20133692","DOI":"10.1109\/ICIP.2016.7533048"},{"key":"13476_CR12","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1016\/j.neucom.2018.09.013","volume":"321","author":"M Frid-Adar","year":"2018","unstructured":"Frid-Adar M, Diamant I, Klang E, Amitai M, Goldberger J, Greenspan H (2018) GAN-based synthetic medical image augmentation for increased cnn performance in liver lesion classification. Neurocomputing 321:321\u2013331","journal-title":"Neurocomputing"},{"key":"13476_CR13","doi-asserted-by":"crossref","unstructured":"Girshick R (2015) Fast R-CNN. In: International conference on computer vision (ICCV), pp 1440\u20131448","DOI":"10.1109\/ICCV.2015.169"},{"key":"13476_CR14","doi-asserted-by":"crossref","unstructured":"Gong Y, Wang L, Guo R, Lazebnik S (2014) Multi-scale orderless pooling of deep convolutional activation features. In: European conference on computer vision (ECCV), pp 392\u2013407","DOI":"10.1007\/978-3-319-10584-0_26"},{"key":"13476_CR15","unstructured":"Goodfellow I, Pouget-Abadie J, Mirza M, Xu B, Warde-Farley D, Ozair S, Courville A, Bengio Y (2014) Generative adversarial nets. In: Advances in neural information processing systems (NIPS), pp 2672\u20132680"},{"key":"13476_CR16","unstructured":"Gulrajani I, Ahmed F, Arjovsky M, Dumoulin V, Courville AC (2017) Improved training of wasserstein gans. In: Advances in neural information processing systems, pp 5767\u20135777"},{"key":"13476_CR17","unstructured":"Hauberg S, Freifeld O, Larsen ABL, Fisher J, Hansen LK (2016) Dreaming more data: Class-dependent distributions over diffeomorphisms for learned data augmentation. In: Proceedings of the 19th International conference on artificial intelligence and statistics, pp 342\u2013350"},{"key":"13476_CR18","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: IEEE conference on computer vision and pattern recognition (CVPR), pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"issue":"5","key":"13476_CR19","doi-asserted-by":"publisher","first-page":"359","DOI":"10.1016\/0893-6080(89)90020-8","volume":"2","author":"K Hornik","year":"1989","unstructured":"Hornik K, Stinchcombe M, White H (1989) Multilayer feedforward networks are universal approximators. Neural Netw 2(5):359\u2013366","journal-title":"Neural Netw"},{"key":"13476_CR20","doi-asserted-by":"crossref","unstructured":"Hu W, Huang Y, Wei L, Zhang F, Li H (2015) Deep convolutional neural networks for hyperspectral image classification. Journal of Sensors 2015, 258619","DOI":"10.1155\/2015\/258619"},{"key":"13476_CR21","unstructured":"Jaderberg M, Simonyan K, Vedaldi A, Zisserman A (2014) Synthetic data and artificial neural networks for natural scene text recognition. arXiv:1406.2227"},{"key":"13476_CR22","doi-asserted-by":"publisher","first-page":"35055","DOI":"10.1007\/s11042-020-08883-w","volume":"79","author":"G Jha","year":"2020","unstructured":"Jha G, Cecotti H (2020) Data augmentation for handwritten digit recognition using generative adversarial networks. Multimed Tools Appl 79:35055\u201335068","journal-title":"Multimed Tools Appl"},{"key":"13476_CR23","doi-asserted-by":"crossref","unstructured":"Jorge J, Vieco J, Paredes R, Sanchez JA, Benedi JM (2018) Empirical evaluation of variational autoencoders for data augmentation. In: International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications (VISIGRAPP), pp 96\u2013104","DOI":"10.5220\/0006618600960104"},{"key":"13476_CR24","unstructured":"Karras T, Aila T, Laine S, Lehtinen J (2017) Progressive growing of gans for improved quality, stability, and variation. arXiv:1710.10196"},{"key":"13476_CR25","doi-asserted-by":"crossref","unstructured":"Karras T, Laine S, Aila T (2018) A style-based generator architecture for generative adversarial networks. arXiv:1812.04948","DOI":"10.1109\/CVPR.2019.00453"},{"key":"13476_CR26","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2012) Imagenet classification with deep convolutional neural networks. In: Advances in Neural Information Processing Systems (NIPS), pp 1097\u20131105"},{"key":"13476_CR27","unstructured":"LeCun Y, Huang FJ, Bottou L (2014) Learning methods for generic object recognition with invariance to pose and lighting. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), vol 2, pp II\u2013104"},{"key":"13476_CR28","doi-asserted-by":"crossref","unstructured":"Lecun Y, Bottou L, Bengio Y, Haffner P (1998) Gradient-based learning applied to document recognition. In: Proceedings of the IEEE, pp 2278\u20132324","DOI":"10.1109\/5.726791"},{"issue":"4","key":"13476_CR29","doi-asserted-by":"publisher","first-page":"593","DOI":"10.1109\/LGRS.2018.2878773","volume":"16","author":"W Li","year":"2019","unstructured":"Li W, Chen C, Zhang M, Li H, Du Q (2019) Data augmentation for hyperspectral image classification with deep cnn. IEEE Geosci Remote Sens Lett 16(4):593\u2013597","journal-title":"IEEE Geosci Remote Sens Lett"},{"issue":"7","key":"13476_CR30","first-page":"4931","volume":"79","author":"Z Li","year":"2018","unstructured":"Li Z, Guo J, Jiao W, Xu P, Liu B, Zhao X (2018) Random linear interpolation data augmentation for person re-identification. Multimed Tools Appl 79(7):4931\u20134947","journal-title":"Multimed Tools Appl"},{"key":"13476_CR31","doi-asserted-by":"crossref","unstructured":"Liu C, Yin F, Wang Q, Wang D (2011) ICDAR 2011 Chinese handwriting recognition competition. In: Proceedings of the 2011 international conference on document analysis and recognition (ICDAR), pp 1464\u20131469","DOI":"10.1109\/ICDAR.2011.291"},{"key":"13476_CR32","doi-asserted-by":"crossref","unstructured":"Long J, Shelhamer E, Darrell T (2015) Fully convolutional models for semantic segmentation. In: IEEE Conference on Computer vision and pattern recognition (CVPR), vol 3, p 4","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"13476_CR33","doi-asserted-by":"crossref","unstructured":"Mao X, Li Q, Xie H, Lau RY, Wang Z, Smolley SP (2016) Least squares generative adversarial networks. arXiv:1611.04076","DOI":"10.1109\/ICCV.2017.304"},{"key":"13476_CR34","unstructured":"Mariani G, Scheidegger F, Istrate R, Bekas C, Malossi C (2018) Bagan: Data augmentation with balancing gan. arXiv:1803.09655"},{"key":"13476_CR35","unstructured":"Mirza M, Osindero S (2014) Conditional generative adversarial nets. arXiv:1411.1784"},{"key":"13476_CR36","unstructured":"Miyato T, Kataoka T, Koyama M, Yoshida Y (2018) Spectral normalization for generative adversarial networks. arXiv:1802.05957"},{"key":"13476_CR37","unstructured":"Nowozin S, Cseke B, Tomioka R (2016) f-gan: Training generative neural samplers using variational divergence minimization. arXiv:1606.00709"},{"key":"13476_CR38","unstructured":"Odena A (2016) Semi-supervised learning with generative adversarial networks. arXiv:1606.01583"},{"key":"13476_CR39","doi-asserted-by":"crossref","unstructured":"Paulin M, Revaud J, Harchaoui Z, Perronnin F, Schmid C (2014) Transformation pursuit for image classification. In: IEEE Conference on computer vision and pattern recognition, pp 3646\u20133653","DOI":"10.1109\/CVPR.2014.466"},{"issue":"1","key":"13476_CR40","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1016\/S0893-6080(98)00116-6","volume":"12","author":"N Qian","year":"1999","unstructured":"Qian N (1999) On the momentum term in gradient descent learning algorithms. Neural Netw 12(1):145\u2013151","journal-title":"Neural Netw"},{"key":"13476_CR41","unstructured":"Radford A, Metz L, Chintala S (2015) Unsupervised representation learning with deep convolutional generative adversarial networks. arXiv:1511.06434"},{"key":"13476_CR42","unstructured":"Salimans T, Goodfellow I, Zaremba W, Cheung V, Radford A, Chen X (2016) Improved techniques for training gans. In: Advances in Neural Information Processing Systems (NIPS), pp 2226\u20132234"},{"key":"13476_CR43","doi-asserted-by":"crossref","unstructured":"Simard PY, Steinkraus D, Platt JC (2003) Best practices for convolutional neural networks applied to visual document analysis. In: International Conference on Document Analysis and Recognition (ICDAR), vol 2, p 958","DOI":"10.1109\/ICDAR.2003.1227801"},{"key":"13476_CR44","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv:1409.1556"},{"key":"13476_CR45","unstructured":"Springenberg JT (2015) Unsupervised and semi-supervised learning with categorical generative adversarial networks. arXiv:1511.06390"},{"key":"13476_CR46","doi-asserted-by":"crossref","unstructured":"Wang G, Kang W, Wu Q, Wang Z, Gao J (2018) Generative adversarial network (gan) based data augmentation for palmprint recognition. In: Digital Image Computing: Techniques and Applications (DICTA), pp 1\u20137","DOI":"10.1109\/DICTA.2018.8615782"},{"key":"13476_CR47","unstructured":"Wang J, Perez L (2017) The effectiveness of data augmentation in image classification using deep learning. arXiv:1712.04621"},{"issue":"3","key":"13476_CR48","doi-asserted-by":"publisher","first-page":"631","DOI":"10.1007\/s11554-017-0717-0","volume":"15","author":"SH Wang","year":"2018","unstructured":"Wang SH, Sun J, Phillips P, Zhao G, Zhang YD (2018) Polarimetric synthetic aperture radar image segmentation by convolutional neural network using graphical processing units. J Real Time Image Process 15(3):631\u2013642","journal-title":"J Real Time Image Process"},{"key":"13476_CR49","doi-asserted-by":"crossref","unstructured":"Yin X, Yu X, Sohn K, Liu X, Chandraker M (2018) Feature transfer learning for deep face recognition with long-tail data. CoRR arXiv:1803.09014","DOI":"10.1109\/CVPR.2019.00585"},{"key":"13476_CR50","doi-asserted-by":"crossref","unstructured":"Yu Q, Lam W (2019) Data augmentation based on adversarial autoencoder handling imbalance for learning to rank. In: AAAI Conference on Artificial Intelligence, vol 33, no 01, pp 411\u2013418","DOI":"10.1609\/aaai.v33i01.3301411"},{"key":"13476_CR51","doi-asserted-by":"publisher","first-page":"20617","DOI":"10.1007\/s11042-020-08918-2","volume":"79","author":"S Zeng","year":"2020","unstructured":"Zeng S, Zhang B, Gou J (2020) Learning double weights via data augmentation for robust sparse and collaborative representation-based classification. Multimed Tools Appl 79:20617\u201320638","journal-title":"Multimed Tools Appl"},{"key":"13476_CR52","unstructured":"Zhang H, Goodfellow I, Metaxas D, Odena A (2018) Self-attention generative adversarial networks. arXiv:1805.08318"},{"key":"13476_CR53","unstructured":"Zhong Z, Zheng L, Kang G, Li S, Yang Y (2017) Random erasing data augmentation. arXiv:1708.04896"},{"key":"13476_CR54","doi-asserted-by":"crossref","unstructured":"Zhu X, Liu Y, Qin Z, Li J (2017) Data augmentation in emotion classification using generative adversarial networks. arXiv:1711.00648","DOI":"10.1007\/978-3-319-93040-4_28"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13476-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-13476-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13476-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,26]],"date-time":"2022-11-26T22:53:18Z","timestamp":1669503198000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-13476-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,13]]},"references-count":54,"journal-issue":{"issue":"29","published-print":{"date-parts":[[2022,12]]}},"alternative-id":["13476"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-13476-w","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"type":"print","value":"1380-7501"},{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2022,8,13]]},"assertion":[{"value":"13 May 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 November 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 July 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 August 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"<!--Emphasis Type='Bold' removed-->Conflict of Interests"}}]}}