{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T06:27:43Z","timestamp":1778048863908,"version":"3.51.4"},"reference-count":59,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2024,2,12]],"date-time":"2024-02-12T00:00:00Z","timestamp":1707696000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,2,12]],"date-time":"2024-02-12T00:00:00Z","timestamp":1707696000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"NSFC","doi-asserted-by":"crossref","award":["2072265, 62021002"],"award-info":[{"award-number":["2072265, 62021002"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["The VLDB Journal"],"published-print":{"date-parts":[[2024,5]]},"DOI":"10.1007\/s00778-024-00840-5","type":"journal-article","created":{"date-parts":[[2024,2,12]],"date-time":"2024-02-12T12:02:26Z","timestamp":1707739346000},"page":"727-752","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Time series data encoding in Apache IoTDB: comparative analysis and recommendation"],"prefix":"10.1007","volume":"33","author":[{"given":"Tianrui","family":"Xia","sequence":"first","affiliation":[]},{"given":"Jinzhao","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Yuxiang","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Changyu","family":"Hu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9503-2755","authenticated-orcid":false,"given":"Shaoxu","family":"Song","sequence":"additional","affiliation":[]},{"given":"Xiangdong","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Jianmin","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,2,12]]},"reference":[{"key":"840_CR1","unstructured":"Aamand, A., Indyk, P., Vakilian, A.: (Learned) frequency estimation algorithms under Zipfian distribution. CoRR, arXiv:1908.05198 (2019)"},{"key":"840_CR2","doi-asserted-by":"crossref","unstructured":"Abadi, D.J., Madden, S., Ferreira, M.: Integrating compression and execution in column-oriented database systems. In: Proceedings of the ACM SIGMOD International Conference on Management of Data, Chicago, Illinois, USA, June 27\u201329, 2006, pp. 671\u2013682. ACM (2006)","DOI":"10.1145\/1142473.1142548"},{"key":"840_CR3","doi-asserted-by":"crossref","unstructured":"Bartik, M., Ubik, S., Kubal\u00edk, P.: LZ4 compression algorithm on FPGA. In: 2015 IEEE International Conference on Electronics, Circuits, and Systems, ICECS 2015, Cairo, Egypt, December 6\u20139, 2015, pp. 179\u2013182. IEEE (2015)","DOI":"10.1109\/ICECS.2015.7440278"},{"issue":"3","key":"840_CR4","doi-asserted-by":"publisher","first-page":"93:1","DOI":"10.1145\/3264903","volume":"2","author":"D W Blalock","year":"2018","unstructured":"Blalock, D. W., Madden, S., Guttag, J. V.: Sprintz: time series compression for the internet of things. Proc. ACM Interact. Mob. Wearab. Ubiquit. Technol. 2(3), 93:1-93:23 (2018)","journal-title":"Proc. ACM Interact. Mob. Wearab. Ubiquit. Technol."},{"key":"840_CR5","unstructured":"Breiman, L., Friedman, J.H., Olshen, R.A., Stone, C.J.: Classification and Regression Trees. Wadsworth (1984)"},{"issue":"1","key":"840_CR6","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman, L.: Random forests. Mach. Learn. 45(1), 5\u201332 (2001)","journal-title":"Mach. Learn."},{"key":"840_CR7","unstructured":"Burrows, M., Wheeler, D.: A block-sorting lossless data compression algorithm. In: Digital SRC Research Report, Citeseer (1994)"},{"key":"840_CR8","doi-asserted-by":"crossref","unstructured":"Campobello, G., Segreto, A., Zanafi, S., Serrano, S.: RAKE: a simple and efficient lossless compression algorithm for the internet of things. In: 25th European Signal Processing Conference, EUSIPCO 2017, Kos, Greece, August 28\u2013September 2, 2017, pp. 2581\u20132585. IEEE (2017)","DOI":"10.23919\/EUSIPCO.2017.8081677"},{"key":"840_CR9","doi-asserted-by":"crossref","unstructured":"Cen, L., Kipf, A., Marcus, R., Kraska, T.: LEA: a learned encoding advisor for column stores. In: aiDM \u201921: 4th Workshop in Exploiting AI Techniques for Data Management, Virtual Event, China, 25 June, 2021, pp. 32\u201335. ACM (2021)","DOI":"10.1145\/3464509.3464885"},{"issue":"10","key":"840_CR10","doi-asserted-by":"publisher","first-page":"198:1","DOI":"10.1145\/3560814","volume":"55","author":"G Chiarot","year":"2023","unstructured":"Chiarot, G., Silvestri, C.: Time series compression survey. ACM Comput. Surv. 55(10), 198:1-198:32 (2023)","journal-title":"ACM Comput. Surv."},{"issue":"8","key":"840_CR11","doi-asserted-by":"publisher","first-page":"3111","DOI":"10.1109\/TSP.2006.875394","volume":"54","author":"M Dalai","year":"2006","unstructured":"Dalai, M., Leonardi, R.: Approximations of one-dimensional digital signals under the l$${}_{\\text{ infty }}$$ norm. IEEE Trans. Signal Process. 54(8), 3111\u20133124 (2006)","journal-title":"IEEE Trans. Signal Process."},{"key":"840_CR12","unstructured":"Drucker, H., Burges, C.J.C., Kaufman, L., Smola, A.J., Vapnik, V.: Support vector regression machines. In: Advances in Neural Information Processing Systems 9, NIPS, Denver, CO, USA, December 2\u20135, 1996, pp. 155\u2013161. MIT Press (1996)"},{"issue":"2","key":"840_CR13","doi-asserted-by":"publisher","first-page":"193","DOI":"10.1007\/s00778-014-0368-8","volume":"24","author":"F Eichinger","year":"2015","unstructured":"Eichinger, F., Efros, P., Karnouskos, S., B\u00f6hm, K.: A time-series compression technique and its application to the smart grid. VLDB J. 24(2), 193\u2013218 (2015)","journal-title":"VLDB J."},{"issue":"1","key":"840_CR14","doi-asserted-by":"publisher","first-page":"23:1","DOI":"10.1145\/3588703","volume":"1","author":"C Fang","year":"2023","unstructured":"Fang, C., Song, S., Guan, H., Huang, X., Wang, C., Wang, J.: Grouping time series for efficient columnar storage. Proc. ACM Manag. Data 1(1), 23:1-23:26 (2023)","journal-title":"Proc. ACM Manag. Data"},{"issue":"2","key":"840_CR15","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1080\/0952813X.2010.505800","volume":"23","author":"E Fink","year":"2011","unstructured":"Fink, E., Gandhi, H.S.: Compression of time series by extracting major extrema. J. Exp. Theor. Artif. Intell. 23(2), 255\u2013270 (2011)","journal-title":"J. Exp. Theor. Artif. Intell."},{"issue":"3","key":"840_CR16","doi-asserted-by":"publisher","first-page":"399","DOI":"10.1109\/TIT.1966.1053907","volume":"12","author":"S W Golomb","year":"1966","unstructured":"Golomb, S. W.: Run-length encodings (corresp.). IEEE Trans. Inf. Theory 12(3), 399\u2013401 (1966)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"840_CR17","doi-asserted-by":"crossref","unstructured":"Hastie, T., Tibshirani, R., Friedman, J.H.: The Elements of Statistical Learning: Data Mining, Inference, and Prediction. Springer Series in Statistics, 2nd edn. Springer (2009)","DOI":"10.1007\/978-0-387-84858-7"},{"issue":"1\u20133","key":"840_CR18","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1016\/0004-3702(89)90049-0","volume":"40","author":"GE Hinton","year":"1989","unstructured":"Hinton, G.E.: Connectionist learning procedures. Artif. Intell. 40(1\u20133), 185\u2013234 (1989)","journal-title":"Artif. Intell."},{"issue":"2","key":"840_CR19","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1016\/0020-0190(96)00090-7","volume":"59","author":"PG Howard","year":"1996","unstructured":"Howard, P.G., Vitter, J.S.: Parallel lossless image compression using Huffman and arithmetic coding. Inf. Process. Lett. 59(2), 65\u201373 (1996)","journal-title":"Inf. Process. Lett."},{"key":"840_CR20","unstructured":"http:\/\/opentsdb.net\/"},{"key":"840_CR21","unstructured":"https:\/\/archive.ics.uci.edu"},{"key":"840_CR22","unstructured":"https:\/\/github.com\/apache\/iotdb\/tree\/research\/encoding-exp"},{"key":"840_CR23","unstructured":"https:\/\/github.com\/thssdb\/encoding-exp"},{"key":"840_CR24","unstructured":"https:\/\/github.com\/thulab\/iotdb-benchmark"},{"key":"840_CR25","unstructured":"https:\/\/iotdb.apache.org\/"},{"key":"840_CR26","unstructured":"https:\/\/iotdb.apache.org\/UserGuide\/Master\/Data-Concept\/Encoding.html"},{"key":"840_CR27","unstructured":"https:\/\/thulab.github.io\/iotdb-quality\/"},{"key":"840_CR28","unstructured":"https:\/\/www.gnu.org\/software\/gzip\/"},{"key":"840_CR29","unstructured":"https:\/\/www.influxdata.com\/"},{"key":"840_CR30","unstructured":"https:\/\/www.kaggle.com\/datasets\/"},{"key":"840_CR31","unstructured":"https:\/\/www.kaggle.com\/datasets\/eliasdabbas\/web-server-access-logs"},{"key":"840_CR32","unstructured":"https:\/\/www.kaggle.com\/datasets\/shawon10\/web-log-dataset"},{"key":"840_CR33","unstructured":"https:\/\/www.kaggle.com\/datasets\/winmedals\/incident-event-log-dataset"},{"key":"840_CR34","unstructured":"https:\/\/www.microsoft.com\/en-us\/download\/details.aspx"},{"key":"840_CR35","doi-asserted-by":"crossref","unstructured":"Huang, S., Chen, Y., Chen, X., Liu, K., Xu, X., Wang, C., Brown, K., Halilovic, I.: The next generation operational data historian for IoT based on informix. In: International Conference on Management of Data, SIGMOD 2014, Snowbird, UT, USA, June 22\u201327, 2014, pp. 169\u2013176. ACM (2014)","DOI":"10.1145\/2588555.2595638"},{"key":"840_CR36","doi-asserted-by":"crossref","unstructured":"Jiang, H., Liu, C., Paparrizos, J., Chien, A.A., Ma, J., Elmore, A.J.: Good to the last bit: Data-driven encoding with codecdb. In: SIGMOD \u201921: International Conference on Management of Data, Virtual Event, China, June 20\u201325, 2021, pp. 843\u2013856. ACM (2021)","DOI":"10.1145\/3448016.3457283"},{"key":"840_CR37","unstructured":"Katsis, Y., Freund, Y., Papakonstantinou, Y.: Combining databases and signal processing in plato. In: 7th Biennial Conference on Innovative Data Systems Research, CIDR 2015, Asilomar, CA, USA, January 4\u20137, 2015, Online Proceedings (2015). https:\/\/www.cidrdb.org"},{"key":"840_CR38","doi-asserted-by":"crossref","unstructured":"Khelifati, A., Khayati, M., Cudr\u00e9-Mauroux, P.: CORAD: correlation-aware compression of massive time series using sparse dictionary coding. In: 2019 IEEE International Conference on Big Data (IEEE BigData), Los Angeles, CA, USA, December 9\u201312, 2019, pp. 2289\u20132298. IEEE (2019)","DOI":"10.1109\/BigData47090.2019.9005580"},{"key":"840_CR39","unstructured":"Lazaridis, I., Mehrotra, S.: Capturing sensor-generated time series with quality guarantees. In: Proceedings of the 19th International Conference on Data Engineering, March 5\u20138, 2003, Bangalore, India, pp. 429\u2013440. IEEE Computer Society (2003)"},{"issue":"11","key":"840_CR40","doi-asserted-by":"publisher","first-page":"3058","DOI":"10.14778\/3551793.3551852","volume":"15","author":"P Liakos","year":"2022","unstructured":"Liakos, P., Papakonstantinopoulou, K., Kotidis, Y.: Chimp: Efficient lossless floating point compression for time series databases. Proc. VLDB Endow. 15(11), 3058\u20133070 (2022)","journal-title":"Proc. VLDB Endow."},{"issue":"11","key":"840_CR41","doi-asserted-by":"publisher","first-page":"2586","DOI":"10.14778\/3476249.3476305","volume":"14","author":"C Liu","year":"2021","unstructured":"Liu, C., Jiang, H., Paparrizos, J., Elmore, A.J.: Decomposed bounded floats for fast compression and queries. Proc. VLDB Endow. 14(11), 2586\u20132598 (2021)","journal-title":"Proc. VLDB Endow."},{"issue":"6","key":"840_CR42","doi-asserted-by":"publisher","first-page":"1821","DOI":"10.1007\/s10618-019-00647-x","volume":"33","author":"CH Lubba","year":"2019","unstructured":"Lubba, C.H., Sethi, S.S., Knaute, P., Schultz, S.R., Fulcher, B.D., Jones, N.S.: catch22: Canonical time-series characteristics\u2014selected through highly comparative time-series analysis. Data Min. Knowl. Discov. 33(6), 1821\u20131852 (2019)","journal-title":"Data Min. Knowl. Discov."},{"key":"840_CR43","doi-asserted-by":"crossref","unstructured":"Marascu, A., Pompey, P., Bouillet, E., Wurst, M., Verscheure, O., Grund, M., Cudr\u00e9-Mauroux, P.: TRISTAN: real-time analytics on massive time series using sparse dictionary compression. In: 2014 IEEE International Conference on Big Data (IEEE BigData 2014), Washington, DC, USA, October 27\u201330, 2014, pp. 291\u2013300. IEEE Computer Society (2014)","DOI":"10.1109\/BigData.2014.7004244"},{"key":"840_CR44","doi-asserted-by":"crossref","unstructured":"Nong, G., Zhang, S., Chan, W.H.: Linear suffix array construction by almost pure induced-sorting. In: 2009 Data Compression Conference (DCC 2009), 16\u201318 March 2009, Snowbird, UT, USA, pp. 193\u2013202. IEEE Computer Society (2009)","DOI":"10.1109\/DCC.2009.42"},{"issue":"1 &2","key":"840_CR45","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1016\/0020-0255(94)00108-N","volume":"84","author":"GH Ong","year":"1995","unstructured":"Ong, G.H., Huang, S.: A data compression scheme for Chinese text files using Huffman coding and a two-level dictionary. Inf. Sci. 84(1 &2), 85\u201399 (1995)","journal-title":"Inf. Sci."},{"issue":"4","key":"840_CR46","doi-asserted-by":"publisher","first-page":"548","DOI":"10.1109\/TIT.1977.1055739","volume":"23","author":"RC Pasco","year":"1977","unstructured":"Pasco, R.C.: Source coding algorithms for fast data compression (ph.d. thesis abstr.). IEEE Trans. Inf. Theory 23(4), 548 (1977)","journal-title":"IEEE Trans. Inf. Theory"},{"issue":"12","key":"840_CR47","doi-asserted-by":"publisher","first-page":"1816","DOI":"10.14778\/2824032.2824078","volume":"8","author":"T Pelkonen","year":"2015","unstructured":"Pelkonen, T., Franklin, S., Cavallaro, P., Huang, Q., Meza, J., Teller, J., Veeraraghavan, K.: Gorilla: a fast, scalable, in-memory time series database. Proc. VLDB Endow. 8(12), 1816\u20131827 (2015)","journal-title":"Proc. VLDB Endow."},{"issue":"4","key":"840_CR48","first-page":"16","volume":"16","author":"BY Ryabko","year":"1980","unstructured":"Ryabko, B.Y.: Data compression by means of a \u201cbook stack\u2019\u2019. Probl. Pered. Informat. 16(4), 16\u201321 (1980)","journal-title":"Probl. Pered. Informat."},{"key":"840_CR49","doi-asserted-by":"crossref","unstructured":"Samulowitz, H., Reddy, C., Sabharwal, A., Sellmann, M.: Snappy: a simple algorithm portfolio. In: Theory and Applications of Satisfiability Testing - SAT 2013 - 16th International Conference, Helsinki, Finland, July 8\u201312, 2013. Proceedings, Volume 7962 of Lecture Notes in Computer Science, pp. 422\u2013428. Springer (2013)","DOI":"10.1007\/978-3-642-39071-5_33"},{"key":"840_CR50","doi-asserted-by":"publisher","first-page":"423","DOI":"10.1007\/BF02574699","volume":"6","author":"R Seidel","year":"1991","unstructured":"Seidel, R.: Small-dimensional linear programming and convex hulls made easy. Discret. Comput. Geom. 6, 423\u2013434 (1991)","journal-title":"Discret. Comput. Geom."},{"key":"840_CR51","doi-asserted-by":"crossref","unstructured":"Spiegel, J., Wira, P., Hermann, G.: A comparative experimental study of lossless compression algorithms for enhancing energy efficiency in smart meters. In: 16th IEEE International Conference on Industrial Informatics, INDIN 2018, Porto, Portugal, July 18\u201320, 2018, pp. 447\u2013452. IEEE (2018)","DOI":"10.1109\/INDIN.2018.8471921"},{"key":"840_CR52","unstructured":"Walder, J., Kr\u00e1tk\u00fd, M., Platos, J.: Fast fibonacci encoding algorithm. In: Proceedings of the Dateso 2010 Annual International Workshop on DAtabases, TExts, Specifications and Objects, Stedronin-Plazy, Czech Republic, April 21\u201323, 2010, Volume 567 of CEUR Workshop Proceedings, pp. 72\u201383. CEUR-WS.org (2010)"},{"issue":"2","key":"840_CR53","doi-asserted-by":"publisher","first-page":"195:1","DOI":"10.1145\/3589775","volume":"1","author":"C Wang","year":"2023","unstructured":"Wang, C., Qiao, J., Huang, X., Song, S., Hou, H., Jiang, T., Rui, L., Wang, J., Sun, J.: Apache IoTDB: a time series database for IoT applications. Proc. ACM Manag. Data 1(2), 195:1-195:27 (2023)","journal-title":"Proc. ACM Manag. Data"},{"issue":"6","key":"840_CR54","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1109\/MC.1984.1659158","volume":"17","author":"TA Welch","year":"1984","unstructured":"Welch, T.A.: A technique for high-performance data compression. Computer 17(6), 8\u201319 (1984)","journal-title":"Computer"},{"key":"840_CR55","doi-asserted-by":"crossref","unstructured":"Wong, R.C., Fu, A.W.: Mining top-k item sets over a sliding window based on zipfian distribution. In: Proceedings of the 2005 SIAM International Conference on Data Mining, SDM 2005, Newport Beach, CA, USA, April 21\u201323, 2005, pp. 516\u2013520. SIAM (2005)","DOI":"10.1137\/1.9781611972757.52"},{"key":"840_CR56","doi-asserted-by":"crossref","unstructured":"Yousri, R., Alsenwi, M., Saeed\u00a0Darweesh, M., Ismail, T.: A design for an efficient hybrid compression system for EEG data. In: 2021 International Conference on Electronic Engineering (ICEEM), pp. 1\u20136 (2021)","DOI":"10.1109\/ICEEM52022.2021.9480377"},{"key":"840_CR57","doi-asserted-by":"crossref","unstructured":"Yu, X., Peng, Y., Li, F., Wang, S., Shen, X., Mai, H., Xie, Y.: Two-level data compression using machine learning in time series database. In: 36th IEEE International Conference on Data Engineering, ICDE 2020, Dallas, TX, USA, April 20\u201324, 2020, pp. 1333\u20131344. IEEE (2020)","DOI":"10.1109\/ICDE48307.2020.00119"},{"key":"840_CR58","doi-asserted-by":"crossref","unstructured":"Yu, H., Huang, F., Lin, C.: Dual coordinate descent methods for logistic regression and maximum entropy models. Mach. Learn. 85(1\u20132), 41\u201375 (2011)","DOI":"10.1007\/s10994-010-5221-8"},{"key":"840_CR59","doi-asserted-by":"crossref","unstructured":"Ziv, J., Lempel, A.: A universal algorithm for sequential data compression. IEEE Trans. Inf. Theory 23(3), 337\u2013343 (1977)","DOI":"10.1109\/TIT.1977.1055714"}],"container-title":["The VLDB Journal"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-024-00840-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00778-024-00840-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-024-00840-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,23]],"date-time":"2024-04-23T07:06:59Z","timestamp":1713856019000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00778-024-00840-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,2,12]]},"references-count":59,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,5]]}},"alternative-id":["840"],"URL":"https:\/\/doi.org\/10.1007\/s00778-024-00840-5","relation":{},"ISSN":["1066-8888","0949-877X"],"issn-type":[{"value":"1066-8888","type":"print"},{"value":"0949-877X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,2,12]]},"assertion":[{"value":"13 January 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 December 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 January 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 February 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}