{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T15:18:46Z","timestamp":1759331926883,"version":"3.37.3"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"7-9","license":[{"start":{"date-parts":[[2021,2,2]],"date-time":"2021-02-02T00:00:00Z","timestamp":1612224000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,2,2]],"date-time":"2021-02-02T00:00:00Z","timestamp":1612224000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Ann Math Artif Intell"],"published-print":{"date-parts":[[2022,9]]},"DOI":"10.1007\/s10472-021-09728-4","type":"journal-article","created":{"date-parts":[[2021,2,2]],"date-time":"2021-02-02T05:09:48Z","timestamp":1612242588000},"page":"735-752","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Interpreting rate-distortion of variational autoencoder and using model uncertainty for anomaly detection"],"prefix":"10.1007","volume":"90","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4726-2441","authenticated-orcid":false,"given":"Seonho","family":"Park","sequence":"first","affiliation":[]},{"given":"George","family":"Adosoglou","sequence":"additional","affiliation":[]},{"given":"Panos M.","family":"Pardalos","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,2,2]]},"reference":[{"key":"9728_CR1","unstructured":"An, J., Cho, S.: Variational autoencoder based anomaly detection using reconstruction probability. Special Lect. IE 2(1) (2015)"},{"key":"9728_CR2","unstructured":"Ruff, L., Vandermeulen, R., Goernitz, N., Deecke, L., Siddiqui, S.A., Binder, A., M\u00fcller, E., Kloft, M.: Deep one-class classification. In: International conference on machine learning, pp. 4393\u20134402 (2018)"},{"key":"9728_CR3","doi-asserted-by":"crossref","unstructured":"Sakurada, M., Yairi, T.: Anomaly detection using autoencoders with nonlinear dimensionality reduction. In: Proceedings of the MLSDA 2014 2nd Workshop on Machine Learning for Sensory Data Analysis, pp. 4\u201311 (2014)","DOI":"10.1145\/2689746.2689747"},{"key":"9728_CR4","doi-asserted-by":"crossref","unstructured":"Marchi, E., Vesperini, F., Eyben, F., Squartini, S., Schuller, B.: A novel approach for automatic acoustic novelty detection using a denoising autoencoder with bidirectional LSTM neural networks. In: 2015 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp. 1996\u20132000. IEEE (2015)","DOI":"10.1109\/ICASSP.2015.7178320"},{"key":"9728_CR5","doi-asserted-by":"crossref","unstructured":"Zhou, C., Paffenroth, R.C.: Anomaly detection with robust deep autoencoders. In: Proceedings of the 23rd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 665\u2013674 (2017)","DOI":"10.1145\/3097983.3098052"},{"key":"9728_CR6","doi-asserted-by":"crossref","unstructured":"Dau, H.A., Ciesielski, V., Song, A.: Anomaly detection using replicator neural networks trained on examples of one class. In: Asia-Pacific Conference on Simulated Evolution and Learning, pp. 311\u2013322. Springer (2014)","DOI":"10.1007\/978-3-319-13563-2_27"},{"key":"9728_CR7","doi-asserted-by":"crossref","unstructured":"Perera, P., Nallapati, R., Xiang, B.: OCGAN: One-class novelty detection using GANs with constrained latent representations. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2898\u20132906 (2019)","DOI":"10.1109\/CVPR.2019.00301"},{"key":"9728_CR8","unstructured":"Chalapathy, R., Menon, A.K., Chawla, S.: Anomaly detection using one-class neural networks. arXiv:1802.06360 (2018)"},{"key":"9728_CR9","unstructured":"Pidhorskyi, S., Almohsen, R., Doretto, G.: Generative probabilistic novelty detection with adversarial autoencoders. In: Advances in neural information processing systems, pp. 6822\u20136833 (2018)"},{"issue":"4","key":"9728_CR10","doi-asserted-by":"publisher","first-page":"1992","DOI":"10.1109\/TIP.2017.2670780","volume":"26","author":"M Sabokrou","year":"2017","unstructured":"Sabokrou, M., Fayyaz, M., Fathy, M., Klette, R.: Deep-cascade: Cascading 3d deep neural networks for fast anomaly detection and localization in crowded scenes. IEEE Trans. Image Process. 26(4), 1992\u20132004 (2017)","journal-title":"IEEE Trans. Image Process."},{"key":"9728_CR11","doi-asserted-by":"crossref","unstructured":"Hawkins, S., He, H., Williams, G., Baxter, R.: Outlier detection using replicator neural networks. In: International Conference on Data Warehousing and Knowledge Discovery, pp. 170\u2013180. Springer (2002)","DOI":"10.1007\/3-540-46145-0_17"},{"key":"9728_CR12","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational Bayes. arXiv:1312.6114 (2013)"},{"key":"9728_CR13","doi-asserted-by":"crossref","unstructured":"Berger, T.: Rate-distortion theory. Wiley Encyclopedia of Telecommunications (2003)","DOI":"10.1002\/0471219282.eot142"},{"key":"9728_CR14","unstructured":"Alemi, A.A., Poole, B., Fischer, I., Dillon, J.V., Saurous, R.A., Murphy, K.: Fixing a broken ELBO. arXiv:1711.00464 (2017)"},{"key":"9728_CR15","unstructured":"Gal, Y., Ghahramani, Z.: Dropout as a Bayesian approximation: Representing model uncertainty in deep learning. arXiv:1506.02142 (2015)"},{"key":"9728_CR16","unstructured":"Kendall, A., Gal, Y.: What uncertainties do we need in bayesian deep learning for computer vision? In: Advances in neural information processing systems, pp. 5574\u20135584 (2017)"},{"key":"9728_CR17","unstructured":"Makhzani, A., Shlens, J., Jaitly, N., Goodfellow, I., Frey, B.: Adversarial autoencoders. arXiv:1511.05644 (2015)"},{"key":"9728_CR18","first-page":"3371","volume":"11","author":"P Vincent","year":"2010","unstructured":"Vincent, P., Larochelle, H., Lajoie, I., Bengio, Y., Manzagol, P-A: Stacked denoising autoencoders: Learning useful representations in a deep network with a local denoising criterion. J. Mach. Learn. Res. 11, 3371\u20133408 (2010)","journal-title":"J. Mach. Learn. Res."},{"key":"9728_CR19","doi-asserted-by":"crossref","unstructured":"Masci, J., Meier, U., Cire\u015fan, D., Schmidhuber, J.: Stacked convolutional auto-encoders for hierarchical feature extraction. In: International conference on artificial neural networks, pp. 52\u201359. Springer (2011)","DOI":"10.1007\/978-3-642-21735-7_7"},{"key":"9728_CR20","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., Bengio, Y.: Generative adversarial nets. In: Advances in neural information processing systems, pp. 2672\u20132680 (2014)"},{"key":"9728_CR21","doi-asserted-by":"crossref","unstructured":"Schlegl, T., Seeb\u00f6ck, P., Waldstein, S.M., Schmidt-Erfurth, U., Langs, G.: Unsupervised anomaly detection with generative adversarial networks to guide marker discovery. In: International conference on information processing in medical imaging, pp. 146\u2013157. Springer (2017)","DOI":"10.1007\/978-3-319-59050-9_12"},{"issue":"1","key":"9728_CR22","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1023\/B:MACH.0000008084.60811.49","volume":"54","author":"DavidMJ Tax","year":"2004","unstructured":"Tax, DavidMJ, Duin, RobertPW: Support vector data description. Mach.s Learn. 54(1), 45\u201366 (2004)","journal-title":"Mach.s Learn."},{"issue":"7","key":"9728_CR23","doi-asserted-by":"publisher","first-page":"1443","DOI":"10.1162\/089976601750264965","volume":"13","author":"B Sch\u00f6lkopf","year":"2001","unstructured":"Sch\u00f6lkopf, B., Platt, J.C., Shawe-Taylor, J., Smola, A.J., Williamson, R.C.: Estimating the support of a high-dimensional distribution. Neural Comput. 13(7), 1443\u20131471 (2001)","journal-title":"Neural Comput."},{"key":"9728_CR24","unstructured":"Ruff, L., Vandermeulen, R.A., G\u00f6rnitz, N., Binder, A., M\u00fcller, E., M\u00fcller, K.-R., Kloft, M.: Deep semi-supervised anomaly detection. arXiv:1906.02694 (2019)"},{"key":"9728_CR25","unstructured":"Golan, I., El-Yaniv, R.: Deep anomaly detection using geometric transformations. In: Advances in Neural Information Processing Systems, pp. 9758\u20139769 (2018)"},{"key":"9728_CR26","unstructured":"Hendrycks, D., Mazeika, M., Kadavath, S., Song, D.: Using self-supervised learning can improve model robustness and uncertainty. In: Advances in Neural Information Processing Systems, pp. 15663\u201315674 (2019)"},{"key":"9728_CR27","unstructured":"Hendrycks, D., Gimpel, K.: A baseline for detecting misclassified and out-of-distribution examples in neural networks. arXiv:1610.02136(2016)"},{"key":"9728_CR28","unstructured":"Nalisnick, E., Matsukawa, A., Teh, Y.W., Gorur, D., Lakshminarayanan, B.: Do deep generative models know what they don\u2019t know? arXiv:1810.09136 (2018)"},{"key":"9728_CR29","unstructured":"Van den Oord, A., Kalchbrenner, N., Espeholt, L., Vinyals, O., Graves, A., et al.: Conditional image generation with pixelcnn decoders. In: Advances in neural information processing systems, pp. 4790\u20134798 (2016)"},{"key":"9728_CR30","unstructured":"Pang, G., Shen, C., Cao, L., Hengel, A.v.d.: Deep learning for anomaly detection: A review. arXiv:2007.02500 (2020)"},{"key":"9728_CR31","doi-asserted-by":"crossref","unstructured":"Ruff, L., Kauffmann, J.R., Vandermeulen, R.A., Montavon, G., Samek, W., Kloft, M., Dietterich, T.G., M\u00fcller, K.-R.: A unifying review of deep and shallow anomaly detection. arXiv:2009.11732 (2020)","DOI":"10.1109\/JPROC.2021.3052449"},{"key":"9728_CR32","unstructured":"Tishby, N., Pereira, F.C., Bialek, W.: The information bottleneck method. arXiv preprint physics\/0004057 (2000)"},{"key":"9728_CR33","doi-asserted-by":"crossref","unstructured":"Tishby, N., Zaslavsky, N.: Deep learning and the information bottleneck principle. In: 2015 IEEE Information Theory Workshop (ITW), pp. 1\u20135. IEEE (2015)","DOI":"10.1109\/ITW.2015.7133169"},{"key":"9728_CR34","unstructured":"Brekelmans, R., Moyer, D., Galstyan, A., VerSteeg, G.: Exact rate-distortion in autoencoders via echo noise. In: Advances in Neural Information Processing Systems, pp. 3884\u20133895 (2019)"},{"key":"9728_CR35","unstructured":"Blau, Y., Michaeli, T.: Rethinking lossy compression: The rate-distortion-perception tradeoff. arXiv:1901.07821 (2019)"},{"key":"9728_CR36","doi-asserted-by":"crossref","unstructured":"Lastras, L.A.: Information theoretic lower bounds on negative log likelihood. arXiv:1904.06395 (2019)","DOI":"10.52591\/lxai2018120310"},{"issue":"5","key":"9728_CR37","first-page":"6","volume":"2","author":"I Higgins","year":"2017","unstructured":"Higgins, I., Matthey, L., Pal, A., Burgess, C., Glorot, X., Botvinick, M., Mohamed, S., Lerchner, A.: \u03b2-VAE: Learning basic visual concepts with a constrained variational framework. Iclr 2(5), 6 (2017)","journal-title":"Iclr"},{"key":"9728_CR38","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. arXiv:1412.6980 (2014)"},{"key":"9728_CR39","first-page":"2121","volume":"12","author":"J Duchi","year":"2011","unstructured":"Duchi, J., Hazan, E., Singer, Y.: Adaptive subgradient methods for online learning and stochastic optimization. J. Mach. Learn. Res. 12, 2121\u20132159 (2011)","journal-title":"J. Mach. Learn. Res."},{"issue":"2","key":"9728_CR40","doi-asserted-by":"publisher","first-page":"223","DOI":"10.1137\/16M1080173","volume":"60","author":"L Bottou","year":"2018","unstructured":"Bottou, L., Curtis, F.E., Nocedal, J.: Optimization methods for large-scale machine learning. Siam Rev. 60(2), 223\u2013311 (2018)","journal-title":"Siam Rev."},{"issue":"3","key":"9728_CR41","doi-asserted-by":"publisher","first-page":"953","DOI":"10.1007\/s10957-019-01624-6","volume":"184","author":"S Park","year":"2020","unstructured":"Park, S., Jung, S.H., Pardalos, P.M.: Combining stochastic adaptive cubic regularization with negative curvature for nonconvex optimization. J. Optim. Theory Appl. 184(3), 953\u2013971 (2020)","journal-title":"J. Optim. Theory Appl."},{"key":"9728_CR42","unstructured":"Hoffman, M.D., Johnson, M.J.: ELBO surgery: yet another way to carve up the variational evidence lower bound. In: Workshop in Advances in Approximate Bayesian Inference, NIPS, vol. 1, pp. 2 (2016)"},{"key":"9728_CR43","unstructured":"Tomczak, J.M., Welling, M.: VAE with a VampPrior. arXiv:1705.07120 (2017)"},{"key":"9728_CR44","unstructured":"Kim, H., Mnih, A.: Disentangling by factorising. arXiv:1802.05983 (2018)"},{"issue":"1","key":"9728_CR45","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava, N., Hinton, G., Krizhevsky, A., Sutskever, I., Salakhutdinov, R.: Dropout: a simple way to prevent neural networks from overfitting. J. Mach. Learn. Res. 15(1), 1929\u20131958 (2014)","journal-title":"J. Mach. Learn. Res."},{"key":"9728_CR46","doi-asserted-by":"crossref","unstructured":"Becker, R.A.: The variance drain and Jensen\u2019s inequality. CAEPR Working Paper No. 2012-004 (2012)","DOI":"10.2139\/ssrn.2027471"},{"issue":"3","key":"9728_CR47","doi-asserted-by":"publisher","first-page":"278","DOI":"10.1080\/00031305.2017.1419145","volume":"73","author":"JG Liao","year":"2019","unstructured":"Liao, J.G., Berg, A.: Sharpening Jensen\u2019s inequality. Am. Stat. 73(3), 278\u2013281 (2019)","journal-title":"Am. Stat."},{"key":"9728_CR48","unstructured":"LeCun, Y.: The MNIST database of handwritten digits. http:\/\/yann.lecun.com\/exdb\/mnist\/ (1998)"},{"key":"9728_CR49","unstructured":"Xiao, H., Rasul, K., Vollgraf, R.: Fashion-MNIST: a novel image dataset for benchmarking machine learning algorithms. arXiv:1708.07747 (2017)"},{"key":"9728_CR50","unstructured":"Krizhevsky, A., Nair, V., Hinton, G.: The CIFAR-10 dataset. online: http:\/\/www.cs.toronto.edu\/kriz\/cifar.html. vol. 55 (2014)"},{"key":"9728_CR51","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: Accelerating deep network training by reducing internal covariate shift. arXiv:1502.03167 (2015)"}],"container-title":["Annals of Mathematics and Artificial Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10472-021-09728-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10472-021-09728-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10472-021-09728-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,10]],"date-time":"2022-08-10T02:11:08Z","timestamp":1660097468000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10472-021-09728-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,2,2]]},"references-count":51,"journal-issue":{"issue":"7-9","published-print":{"date-parts":[[2022,9]]}},"alternative-id":["9728"],"URL":"https:\/\/doi.org\/10.1007\/s10472-021-09728-4","relation":{},"ISSN":["1012-2443","1573-7470"],"issn-type":[{"type":"print","value":"1012-2443"},{"type":"electronic","value":"1573-7470"}],"subject":[],"published":{"date-parts":[[2021,2,2]]},"assertion":[{"value":"3 January 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 February 2021","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}