{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,7]],"date-time":"2026-05-07T16:24:06Z","timestamp":1778171046581,"version":"3.51.4"},"reference-count":110,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2025,3,1]],"date-time":"2025-03-01T00:00:00Z","timestamp":1740787200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,3,1]],"date-time":"2025-03-01T00:00:00Z","timestamp":1740787200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,3,1]],"date-time":"2025-03-01T00:00:00Z","timestamp":1740787200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100000923","name":"Australian Research Council","doi-asserted-by":"publisher","award":["DP210101859"],"award-info":[{"award-number":["DP210101859"]}],"id":[{"id":"10.13039\/501100000923","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000923","name":"Australian Research Council","doi-asserted-by":"publisher","award":["FT230100549"],"award-info":[{"award-number":["FT230100549"]}],"id":[{"id":"10.13039\/501100000923","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62088102"],"award-info":[{"award-number":["62088102"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2025,3]]},"DOI":"10.1109\/tpami.2024.3509434","type":"journal-article","created":{"date-parts":[[2024,11,29]],"date-time":"2024-11-29T18:51:55Z","timestamp":1732906315000},"page":"1644-1659","source":"Crossref","is-referenced-by-count":7,"title":["DiffAct++: Diffusion Action Segmentation"],"prefix":"10.1109","volume":"47","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9279-7912","authenticated-orcid":false,"given":"Daochang","family":"Liu","sequence":"first","affiliation":[{"name":"School of Physics, Mathematics and Computing, University of Western Australia, Crawley, WA, Australia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0872-6677","authenticated-orcid":false,"given":"Qiyue","family":"Li","sequence":"additional","affiliation":[{"name":"National Engineering Research Center of Visual Technology, National Key Laboratory for Multimedia Information Processing, School of Computer Science, National Biomedical Imaging Center, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anh-Dung","family":"Dinh","sequence":"additional","affiliation":[{"name":"School of Computer Science, Faculty of Engineering, University of Sydney, Darlington, NSW, Australia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5372-0656","authenticated-orcid":false,"given":"Tingting","family":"Jiang","sequence":"additional","affiliation":[{"name":"National Engineering Research Center of Visual Technology, National Key Laboratory for Multimedia Information Processing, School of Computer Science, National Biomedical Imaging Center, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8216-1128","authenticated-orcid":false,"given":"Mubarak","family":"Shah","sequence":"additional","affiliation":[{"name":"Center for Research in Computer Vision, University of Central Florida, Orlando, FL, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4756-0609","authenticated-orcid":false,"given":"Chang","family":"Xu","sequence":"additional","affiliation":[{"name":"School of Computer Science, Faculty of Engineering, University of Sydney, Darlington, NSW, Australia"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-012-0752-6"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2021.3117472"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00940"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00369"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3021756"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58595-2_3"},{"key":"ref7","article-title":"ASFormer: Transformer for action segmentation","volume-title":"Proc. Brit. Mach. Vis. Conf.","author":"Yi"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2023.3327284"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2023.3261988"},{"key":"ref10","first-page":"1","article-title":"Denoising diffusion implicit models","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Song"},{"key":"ref11","first-page":"8780","article-title":"Diffusion models beat GANs on image synthesis","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Dhariwal"},{"key":"ref12","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Ho"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00930"},{"key":"ref14","article-title":"TricorNet: A hybrid temporal convolutional and recurrent network for video action segmentation","author":"Ding","year":"2017"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.216"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46487-9_3"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.113"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00705"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00638"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2019.8803088"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/3DV50981.2020.00073"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-92659-5_18"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01653"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.04.121"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.108764"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN55064.2022.9891932"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10097024"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.2299\/jsp.27.75"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01404"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-023-05259-z"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2023.3285416"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01272"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2022.104567"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-023-16041-1"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICME55011.2023.00178"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s11063-022-11133-9"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/s00530-022-00998-4"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00950"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/s10044-023-01166-8"},{"key":"ref40","article-title":"Enhancing transformer backbone for egocentric video action segmentation","author":"Reza","year":"2023"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.03.066"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2023.3284080"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00236"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01253"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01599"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58517-4_10"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01926"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01023"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093535"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00947"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-27818-1_46"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01242"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00237"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2022\/115"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1049\/ell2.12678"},{"key":"ref56","first-page":"14 890","article-title":"Don\u2019t pour cereal into coffee: Differentiable temporal logic for temporal action segmentation","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Xu"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19833-5_4"},{"key":"ref58","article-title":"Temporal segment transformer for action segmentation","author":"Liu","year":"2023"},{"key":"ref59","article-title":"DIR-AS: Decoupling individual identification and temporal reasoning for action segmentation","author":"Wang","year":"2023"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096960"},{"key":"ref61","article-title":"BIT: Bi-level temporal modeling for efficient supervised action segmentation","author":"Lu","year":"2023"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2019.00027"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3611842"},{"key":"ref64","first-page":"5152","article-title":"Temporal Gaussian mixture layer for videos","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Piergiovanni"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01258"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01941"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3169976"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_31"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00771"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19833-5_2"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00332"},{"key":"ref72","first-page":"2256","article-title":"Deep unsupervised learning using nonequilibrium thermodynamics","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Sohl-Dickstein"},{"key":"ref73","article-title":"Generative modeling by estimating gradients of the data distribution","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Song"},{"key":"ref74","first-page":"12 438","article-title":"Improved techniques for training score-based generative models","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Song"},{"key":"ref75","article-title":"Score-based generative modeling through stochastic differential equations","author":"Song","year":"2020"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00578"},{"key":"ref78","article-title":"Latent diffusion energy-based model for interpretable text modeling","author":"Yu","year":"2022"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01043"},{"key":"ref80","first-page":"2416","article-title":"DiffusionClip: Text-guided image manipulation using diffusion models","volume-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","author":"Kim"},{"key":"ref81","first-page":"23 689","article-title":"BinauralGrad: A two-stage conditional diffusion probabilistic model for binaural audio synthesis","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Leng"},{"key":"ref82","article-title":"BDDM: Bilateral denoising diffusion models for fast and high-quality speech synthesis","author":"Lam","year":"2022"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.3390\/e25101469"},{"key":"ref84","article-title":"Diffusion models for video prediction and infilling","author":"H\u00f6ppe","year":"2022"},{"key":"ref85","first-page":"23 371","article-title":"MCVD-masked conditional video diffusion for prediction, generation, and interpolation","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Voleti"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.02096"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01816"},{"key":"ref88","first-page":"1","article-title":"Label-efficient semantic segmentation with diffusion models","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Baranchuk"},{"key":"ref89","article-title":"SegDiff: Image segmentation with diffusion probabilistic models","author":"Amit","year":"2021"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01253"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01365"},{"key":"ref92","article-title":"Diffusing surrogate dreams of video scenes to predict video memorability","author":"Sweeney","year":"2022"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i3.25484"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00951"},{"key":"ref95","article-title":"DiffusionVMR: Diffusion model for video moment retrieval","author":"Zhao","year":"2023"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00947"},{"key":"ref97","article-title":"Anomaly detection in satellite videos using diffusion models","author":"Awasthi","year":"2023"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP49359.2023.10222594"},{"key":"ref99","article-title":"Understanding diffusion models: A unified perspective","author":"Luo","year":"2022"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01036"},{"key":"ref101","first-page":"1","article-title":"Classifier-free diffusion guidance","volume-title":"Proc. NeurIPS 2021 Workshop Deep Generative Models Downstream Appl.","author":"Ho"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP46576.2022.9897444"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995444"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1145\/2493432.2493482"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.105"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.02042"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref108","first-page":"5775","article-title":"DPM-Solver: A fast ode solver for diffusion probabilistic model sampling in around 10 steps","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Lu"},{"key":"ref109","article-title":"MedSegDiff: Medical image segmentation with diffusion probabilistic model","author":"Wu","year":"2022"},{"key":"ref110","article-title":"Progressive distillation for fast sampling of diffusion models","author":"Salimans","year":"2022"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/34\/10873290\/10772006.pdf?arnumber=10772006","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,6]],"date-time":"2025-02-06T18:37:44Z","timestamp":1738867064000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10772006\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3]]},"references-count":110,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2024.3509434","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3]]}}}