{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T16:30:25Z","timestamp":1774801825799,"version":"3.50.1"},"reference-count":120,"publisher":"Elsevier BV","issue":"13-14","license":[{"start":{"date-parts":[[1999,12,1]],"date-time":"1999-12-01T00:00:00Z","timestamp":944006400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Parallel Computing"],"published-print":{"date-parts":[[1999,12]]},"DOI":"10.1016\/s0167-8191(99)00070-8","type":"journal-article","created":{"date-parts":[[2003,4,25]],"date-time":"2003-04-25T08:06:40Z","timestamp":1051258000000},"page":"1907-1929","source":"Crossref","is-referenced-by-count":62,"title":["Advances in the dataflow computational model"],"prefix":"10.1016","volume":"25","author":[{"given":"Walid A","family":"Najjar","sequence":"first","affiliation":[]},{"given":"Edward A","family":"Lee","sequence":"additional","affiliation":[]},{"given":"Guang R","family":"Gao","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/S0167-8191(99)00070-8_BIB1","unstructured":"Annapolis Micro Systems, Wildforce Board Web Page, http:\/\/www.annapmicro.com"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB2","unstructured":"B.S. Ang, Arvind, D. Chiou, StarT the next generation: integrating global caches and dataflow architecture, in: G.R. Gao, L. Bic, J.-L. Gaudiot (Eds.), Advanced Topics in Dataflow Computing and Multithreading, IEEE Computer Society Press, Silver Spring, MD, 1995, pp. 19\u201354"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB3","unstructured":"B.S. Ang, D. Chiou, D. Rosenband, M. Ehrlich, L. Rudolph, Arvind, Start-voyager: a flexible platform for exploring scalable smp issues, CSG Memo 415, Computation Structures Group, MIT Lab. for Comput. Sci., December 1998"},{"issue":"3","key":"10.1016\/S0167-8191(99)00070-8_BIB4","doi-asserted-by":"crossref","first-page":"300","DOI":"10.1109\/12.48862","article-title":"Executing a program on the MIT tagged-token dataflow architecture","volume":"39","author":"Arvind","year":"1990","journal-title":"IEEE Trans. Comput."},{"issue":"2","key":"10.1016\/S0167-8191(99)00070-8_BIB5","doi-asserted-by":"crossref","first-page":"42","DOI":"10.1109\/MC.1982.1653940","article-title":"The U-interpreter","volume":"15","author":"Arvind","year":"1982","journal-title":"Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB6","doi-asserted-by":"crossref","unstructured":"Arvind, R. Iannucci, A critique of multiprocessing von Neumann style, in: International Symposium on Computer Architecture, Stokholm, Sweden, 1983","DOI":"10.1145\/800046.801684"},{"issue":"4","key":"10.1016\/S0167-8191(99)00070-8_BIB7","doi-asserted-by":"crossref","first-page":"598","DOI":"10.1145\/69558.69562","article-title":"I-structures: data structures for parallel computing","volume":"11","author":"Arvind","year":"1989","journal-title":"ACM Trans. on Program. Languages Syst."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB8","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1109\/2.204677","article-title":"Processor reconfiguration through instruction set metamorphosis","volume":"26","author":"Athanas","year":"1993","journal-title":"Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB9","doi-asserted-by":"crossref","unstructured":"P.S. Barth, R.S. Nikhil, Arvind, M\u2013structures: extending a parallel, non-strict, functional language with state, CSG Memo 327, Computation Structures Group, MIT Lab. for Comput. Sci., March 1991","DOI":"10.1007\/3540543961_26"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB10","doi-asserted-by":"crossref","unstructured":"M.J. Beckerle, Overview of the START(\u2217T) multithreaded computer, in: Digest of Papers, COMPCON Spring '93, San Francisco, CA, February 1993, pp. 148\u2013156","DOI":"10.1109\/CMPCON.1993.289655"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB11","unstructured":"A. Benedetti, P. Perona, Feature detection on a reconfigurable computer, in: Conference on Computer Vision and Pattern Recognition, Santa Barbara, CA, 1998"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB12","doi-asserted-by":"crossref","unstructured":"A. Benveniste, G. Berry, The synchronous approach to reactive and real-time systems, in: Proceedings of the IEEE, vol. 79 (9), 1991, pp. 1270\u20131282","DOI":"10.1109\/5.97297"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB13","doi-asserted-by":"crossref","unstructured":"A. Benveniste, P. Caspi, P. Le Guernic, N. Halbwachs, Data-flow synchronous languages, in: J.W. de Bakker, W.-P. de Roever, G. Rozenberg (Eds.), A Decade of Concurrency \u2013 Reflections and Perspectives, Lecture Notes in Computer Science, vol. 803, Springer, Berlin, 1994, pp. 1\u201345","DOI":"10.1007\/3-540-58043-3_16"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB14","doi-asserted-by":"crossref","unstructured":"P. Bertin, D. Roncin, J. Vuillemin, Programmable active memories: a performance assesment, in: G. Borriello, C. Ebeling (Eds.), Research on Integrated Systems, MIT Press, Cambridge, MA, 1993, pp. 88\u2013102","DOI":"10.1007\/3-540-56731-3_12"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB15","doi-asserted-by":"crossref","unstructured":"P. Bertin, H. Touati, PAM programming environments: practice and experience, in: Proceedings of the IEEE Workshop on FPGAs for Custom Computing Machines, IEEE Computer Soc. Press, Los Alamitos, CA, 1994, pp. 133\u2013139","DOI":"10.1109\/FPGA.1994.315599"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB16","doi-asserted-by":"crossref","unstructured":"G. Bilsen, M. Engels, R. Lauwereins, J.A. Peperstraete, Static scheduling of multi-rate and cyclo-static DSP applications, in: Proceedings of the 1994 Workshop on VLSI Signal Processing, IEEE Press, New York, 1994","DOI":"10.1109\/VLSISP.1994.574738"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB17","unstructured":"M. Bolotski, A. DeHon, T.F. Knight, Unifying FPGAs and SIMD arrays, in: Proceedings of the FPGA Workshop, 1994"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB18","doi-asserted-by":"crossref","unstructured":"J.T. Buck, E.A. Lee, Scheduling dynamic dataflow graphs with bounded memory using the token flow model, in: Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing, vol. I, Minneapolis, MN, April 1993, pp. 429\u2013432","DOI":"10.1109\/ICASSP.1993.319147"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB19","doi-asserted-by":"crossref","unstructured":"J.T. Buck, Scheduling dynamic dataflow draphs with bounded memory using the token flow model, Technical Report UCB\/ERL 93\/69, Ph.D. Dissertation, Department of EECS, University of California, Berkeley, CA 94720, 1993","DOI":"10.1109\/ICASSP.1993.319147"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB20","unstructured":"J.T. Buck, S. Ha, E.A. Lee, D.G. Messerschmitt, Ptolemy: a framework for simulating and prototyping heterogeneous systems (special issue on Simulation Software Development) Int. J. Comput. Simulation, 4 (1994) 155\u2013182 (http:\/\/ptolemy.eecs.berkeley.edu\/papers\/JEurSim)"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB21","doi-asserted-by":"crossref","unstructured":"J.T. Buck, Static scheduling and code generation from dynamic dataflow graphs with integer-valued control systems, Invited Paper, in: Proceedings of the IEEE Asilomar Conference on Signals, Systems, and Computers, 31 October\u20132 November, Pacific Grove, CA, 1994","DOI":"10.1109\/ACSSC.1994.471505"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB22","author":"Buell","year":"1996"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB23","doi-asserted-by":"crossref","unstructured":"S. Cadambi, J. Weener, S.C. Goldstein, H. Schmit, D.E. Thomas, Managing pipeline-reconfigurable FPGAs, in: Sixth International Symposium on Field Programmable Gate Arrays, 1998","DOI":"10.1145\/275107.275120"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB24","unstructured":"R. Carley, S.C. Goldstein, T. Mukherjee, R. Rutenbar, H. Schmit, D. Thomas, PipeRench Web Page, Carnegie-Mellon University, http:\/\/www.ece.cmu.edu\/research\/piperench\/"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB25","doi-asserted-by":"crossref","unstructured":"D. Chiou, B.S. Ang, Arvind, M.J. Beckerle, A. Boughton, R. Greiner, J.E. Hicks, J.C. Hoe, StarT-NG: delivering seamless parallel computing, CSG Memo 371, Computation Structures Group, MIT Lab. for Comput. Sci., February 1995","DOI":"10.1007\/BFb0020458"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB26","doi-asserted-by":"crossref","unstructured":"C.E. Cox, W. Ekkehard Blanz, Ganglion \u2013 a fast hardware implementation of a connectionist classifier, in: Proceedings of the IEEE Custom Integrated Circuits Conference, IEEE Press, New York, 1991, pp. 6.5.1\u20136.5.4","DOI":"10.1109\/CICC.1991.164044"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB27","doi-asserted-by":"crossref","unstructured":"S.A. Cuccaro, C.F. Reese, The CM-2X: a hybrid CM-2\/Xilinx prototype, in: Proceedings of the IEEE Workshop on FPGAs for Custom Computing Machines, IEEE Computer Soc. Press, Los Alamitos, CA, 1993, pp. 121\u2013131","DOI":"10.1109\/FPGA.1993.279471"},{"issue":"2","key":"10.1016\/S0167-8191(99)00070-8_BIB28","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1109\/MC.1982.1653939","article-title":"Data flow program graphs","volume":"15","author":"Davis","year":"1982","journal-title":"Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB29","doi-asserted-by":"crossref","unstructured":"A. DeHon, Comparing computing machines, in: Configurable Computing: Technology and Applications, Proceedings of SPIE 3526, November 1998, p. 124","DOI":"10.1117\/12.327025"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB30","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, First version of a data-flow procedure language, in: Proceedings of the Colloque sur la Programmation, Lecture Notes in Computer Science, vol. 19, Paris, France, April 9\u201311, Springer, Berlin, 1974, pp. 362\u2013376","DOI":"10.1007\/3-540-06859-7_145"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB31","unstructured":"J.B. Dennis, Data flow ideas for supercomputers, in: Digest of Papers, COMPCON Spring '84, San Francisco, CA, February\u2013March 1984, pp. 15\u201319"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB32","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, G.R. Gao, An efficient pipelined dataflow processor architecture, in: Proceedings of the Supercomputing '88, Orlando, FL, November 1988, pp. 368\u2013373","DOI":"10.1109\/SUPERC.1988.44674"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB33","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, G.R. Gao, Multithreaded architectures: principles, projects, and issues, ACAPS Technical Memo 29, School of Computer Science, McGill University, Montr\u00e9al, Qu\u00e9., February 1994, in: ftp:\/\/ftp-acaps.cs.mcgill.ca\/pub\/doc\/memos","DOI":"10.1007\/978-1-4615-2698-8_1"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB34","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, G.R. Gao, Multithreaded architectures: principles, projects, and issues, in: R.A. Iannucci, G.R. Gao, R.H. Halstead Jr., B. Smith (Eds.), Multithreaded Computer Architecture: A Summary of the State of the Art, chapter 1, Kluwer Academic Publishers, Norwel l, Massachusetts, 1994","DOI":"10.1007\/978-1-4615-2698-8_1"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB35","unstructured":"J.B. Dennis, G.R. Gao, On memory models and cache management for shared-memory multiprocessors, ACAPS Technical Memo 90, School of Computer Science, McGill University, Montr\u00e9al, Qu\u00e9., December. 1994, in: ftp:\/\/ftp-acaps.cs.mcgill.ca\/pub\/doc\/memos"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB36","unstructured":"J.B. Dennis, Streams data types for signal processing, in: J-L. Gaudiot, L. Bic (Eds.), Advanced Topics in Dataflow Computing and Multithreading, Prentice-Hall, Englewood Cliffs, NJ, 1995"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB37","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, G.R. Gao, On memory models and cache management for shared-memory multiprocessors, in: Parallel and Distributed Processing, IEEE Computer Soc., 1995","DOI":"10.1109\/SPDP.1995.530683"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB38","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, A parallel program execution model supporting modular software construction, in: Proceedings of the Massively Parallel Programming Models (MPPM-97), IEEE Computer Soc., 1997, pp 50\u201360","DOI":"10.1109\/MPPM.1997.715961"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB39","doi-asserted-by":"crossref","unstructured":"J.B. Dennis, General parallel computation can be performed with a cycle-free heap, in: Proceedings of the International Conference on Parallel Architectures and Compiler Technology, Paris, France, October 1996, pp. 96\u2013103","DOI":"10.1109\/PACT.1998.727177"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB40","doi-asserted-by":"crossref","unstructured":"C. Ebeling, D.C. Cronquist, P. Franklin, RaPiD \u2013 reconfigurable pipelined datapath, in Proceedings of the Field Programmable Logic, 1996","DOI":"10.1007\/3-540-61730-2_13"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB41","doi-asserted-by":"crossref","unstructured":"G. Estrin, Parallel processing in a restructurable computer system, IEEE Trans. Elect. Comput. (1963)","DOI":"10.1109\/PGEC.1963.263558"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB42","series-title":"A Code Mapping Scheme for Dataflow Software Pipelining","author":"Gao","year":"1990"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB43","doi-asserted-by":"crossref","unstructured":"G.R. Gao, H.H.J. Hum, J.-M. Monti, Towards an efficient hybrid dataflow architecture model, in: Proceedings of the PARLE '91, vol. I, Lecture Notes in Computer Science, vol. 505, Eindhoven, The Netherlands, June 1991, Springer, Berlin, pp. 355\u2013371","DOI":"10.1007\/978-3-662-25209-3_24"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB44","doi-asserted-by":"crossref","unstructured":"G.R. Gao, R. Govindarajan, P. Panangaden, Well-behaved dataflow for DSP computation, in: Proceedings of the ICASSP-92, San Francisco, March 1992","DOI":"10.1109\/ICASSP.1992.226558"},{"issue":"4","key":"10.1016\/S0167-8191(99)00070-8_BIB45","doi-asserted-by":"crossref","first-page":"293","DOI":"10.1006\/jpdc.1993.1113","volume":"19","author":"Gao","year":"1993","journal-title":"An efficient hybrid dataflow architecture model, J. Parallel Distrib. Comput."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB46","unstructured":"G.R. Gao, V. Sarkar, Location consistency: stepping beyond the barriers of memory coherence and serializability, ACAPS Technical Memo 78, School of Computer Science, McGill University, Montr\u00e9al, Qu\u00e9., December 1994, in: ftp:\/\/ftp-acaps.cs.mcgill.ca\/pub\/doc\/memos"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB47","unstructured":"G.R. Gao, L. Bic, J-L. Gaudiot (Eds.), Advanced Topics in Dataflow Computing and Multithreading, IEEE Computer Soc. Press, New York, 1995, book contains papers presented at the Second International Workshop on Dataflow Computers, Hamilton Island, Australia, May 1992"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB48","doi-asserted-by":"crossref","unstructured":"G.R. Gao, V. Sarkar, On the importance of an end-to-end view of memory consistency in future computer systems, in: Proceedings of the International Symposium on High Performance Computing, Fukuoka, Japan, 1997, pp. 30\u201341","DOI":"10.1007\/BFb0024201"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB49","unstructured":"G.R. Gao, V. Sarkar, Location consistency \u2013 a new memory model and cache consistency protocol, CAPSL Technical Memo 16, Department of Elec. and Computer Engineering, University of Delaware, Newark, Delaware, February 1998, in: ftp:\/\/ftp.capsl.udel.edu\/pub\/doc\/memos"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB50","unstructured":"K. Gharachorloo, A. Gupta, J. Hennessy, Revision to `memory consistency and event ordering in scalable shared-memory multiprocessors', Technical Report No. CSL-TR-93-568, Computer Systems Lab., Stanford University, Stanford, CA, April 1993"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB51","doi-asserted-by":"crossref","unstructured":"K. Gharachorloo, D. Lenoski, J. Laudon, P. Gibbons, A. Gupta, J. Hennessy, Memory consistency and event ordering in scalable shared-memory multiprocessors, in: Proceedings of the ISCA-17, Seattle, Washington, May 1990, pp. 15\u201326","DOI":"10.1145\/325096.325102"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB52","doi-asserted-by":"crossref","unstructured":"A. Girault, B. Lee, E.A. Lee, Hierarchical finite state machines with multiple concurrency models, IEEE Trans. on CAD, 1999, 18 (6) (1999). (Revised from Memorandum UCB\/ERL M97\/57, Electronics Research Laboratory, University of California, Berkeley, CA 94720, August 1997) (http:\/\/ptolemy.eecs.berkeley.edu\/papers\/98\/starcharts)","DOI":"10.1109\/43.766725"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB53","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1109\/2.67197","article-title":"Building and using a highly parallel programmable logic array","volume":"24","author":"Gokhale","year":"1991","journal-title":"IEEE Comput."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB54","doi-asserted-by":"crossref","unstructured":"R. Hartenstein et al., A reconfigurable machine for applications in image and video compression, in: Conference on Compression Technologies and Standards for Image and Video Compression, Amesterdam, Netherlands, 1995","DOI":"10.1117\/12.201186"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB55","unstructured":"J.R. Hauser, J. Wawrzynek, Garp: a MIPS processor with a reconfigurable co-processor, in: Proceedings of the IEEE Symposium on Field-Programmable Custom Computing Machines, April 1997"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB56","doi-asserted-by":"crossref","unstructured":"L.J. Hendren, G.R. Gao, X. Tang, Y. Zhu, X. Xue, H. Cai, P. Ouellet, Compiling C for the EARTH multithreaded architecture, ACAPS Technical Memo 101, School of Computer Science, McGill University, Montr\u00e9al, Qu\u00e9., March 1996, in: ftp:\/\/ftp-acaps.cs.mcgill.ca\/pub\/doc\/memos","DOI":"10.1109\/PACT.1996.552551"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB57","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1109\/2.707614","article-title":"Multiprocessors should support simple memory-consistency models","volume":"31","author":"Hill","year":"1998","journal-title":"Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB58","doi-asserted-by":"crossref","unstructured":"J. Horstmannshoff, T. Gr\u00f6tker, H. Meyr, Mapping multirate dataflow to complex RT level hardware models, in: 11th International Conference on Application-specific Systems, Architectures and Processors, 1997, (ASAP'97)","DOI":"10.1109\/ASAP.1997.606834"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB59","unstructured":"H.H.-J. Hum, The super-actor machine: a hybrid dataflow\/von Neumann architecture, Ph.D. Thesis, McGill University, Montr\u00e9al, Qu\u00e9., May 1992"},{"issue":"4","key":"10.1016\/S0167-8191(99)00070-8_BIB60","doi-asserted-by":"crossref","first-page":"287","DOI":"10.1016\/0167-739X(92)90064-I","article-title":"A high-speed memory organization for hybrid dataflow\/von Neumann computing","volume":"8","author":"Hum","year":"1992","journal-title":"Future Generation Comput. Syst."},{"issue":"4","key":"10.1016\/S0167-8191(99)00070-8_BIB61","doi-asserted-by":"crossref","first-page":"319","DOI":"10.1007\/BF03356753","article-title":"A study of the earth-manna multithreaded system","volume":"24","author":"Hum","year":"1996","journal-title":"Int. J. Parallel Programming"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB62","doi-asserted-by":"crossref","unstructured":"R.A. Iannucci, Toward a dataflow\/von Neumann hybrid architecture, in: Proceedings of the ISCA-15, Honolulu, Haw., May\u2013June 1988, pp. 131\u2013140","DOI":"10.1109\/ISCA.1988.5222"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB63","doi-asserted-by":"crossref","unstructured":"R.A. Iannucci, G.R. Gao, R.H. Halstead Jr., B. Smith (Eds.), Multithreaded Computer Architecture: A Summary of the State of the Art, Kluwer Academic Publishers, Norwell, Massachusetts, 1994, book contains papers presented at the Workshop on Multithreaded Computers, Albuquerque, New Mexico, November 1991","DOI":"10.1007\/978-1-4615-2698-8"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB64","doi-asserted-by":"crossref","unstructured":"S. Jenks, J.-L. Gaudiot, Exploiting locality and tolerating remote memory access latency using thread migration, Int. J. Parallel Programming, 1996, in press","DOI":"10.1007\/BF02699904"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB65","doi-asserted-by":"crossref","unstructured":"S. Jenks, J.-L. Gaudiot, Nomadic threads \u2013 a migrating multithreaded approach to remote memory accesses in multiprocessors, in: Proceedings of the International Conference on Parallel Architectures and Compilation Techniques (PACT '96), Boston, Massachusetts, October 1996","DOI":"10.1109\/PACT.1996.554028"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB66","doi-asserted-by":"crossref","unstructured":"S. Jenks, J.-L. Gaudiot, Nomadic threads: A migrating multithreaded approach to remote memory accesses in multiprocessors, in: Proceedings of the 1996 Conference on Parallel Architectures and Compilation Techniques, Boston, Massachusetts, October 1996","DOI":"10.1109\/PACT.1996.554028"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB67","series-title":"Synchronous Programming of Reactive Systems","author":"Halbwachs","year":"1993"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB68","doi-asserted-by":"crossref","unstructured":"N. Halbwachs, P. Caspi, P. Raymond, D. Pilaud, The synchronous data flow programming language LUSTRE, in: Proceedings of the IEEE, vol. 79 (9), pp. 1305\u20131319","DOI":"10.1109\/5.97300"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB69","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1016\/0167-6423(87)90035-9","article-title":"Statecharts: a visual formalism for complex systems","volume":"8","author":"Harel","year":"1987","journal-title":"Sci. Comput. Programming"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB70","unstructured":"G. Kahn, The semantics of a simple language for parallel programming, in: Proceedings of the IFIP Congress 74, North-Holland, Amsterdam, 1974"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB71","unstructured":"C. Kim, J.-L. Gaudiot, Data-flow and multithreaded architectures, in: Encyclopedia of Electrical and Electronics Engineering, Wiley, New York, 1997"},{"issue":"10","key":"10.1016\/S0167-8191(99)00070-8_BIB72","doi-asserted-by":"crossref","first-page":"30","DOI":"10.1109\/2.7055","article-title":"A data-driven VLSI array for arbitrary algorithms","volume":"21","author":"Koren","year":"1988","journal-title":"Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB73","unstructured":"J.-L. Gaudiot, L. Bic (Eds.), Advanced Topics in Data-Flow Computing, Prentice-Hall, New york, 1991"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB74","unstructured":"Y. Kodama, S. Sakai, Y. Yamaguchi, A prototype of a highly parallel dataflow machine EM-4 and its preliminary evaluation. in: Proceedings of the InfoJapan 90, October 1990, pp. 291\u2013298"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB75","doi-asserted-by":"crossref","unstructured":"Y. Kodama, H. Sakane, M. Sato, H. Yamana, S. Sakai, Y. Yamaguchi, The EM-X parallel computer: architecture and basic performance, in: Proceedings of the ISCA-22, Santa Margher ita Ligure, Italy, June 1995, pp. 14\u201323","DOI":"10.1145\/223982.223987"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB76","unstructured":"KRI, Khoral Research Inc. Web Page, http:\/\/www.kri.com"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB77","unstructured":"F. Kurdahi, N. Bagherzadeh, The Morphosys Project, University of California, Irvine, 1998, http:\/\/www.eng.uci.edu\/morphosys"},{"issue":"9","key":"10.1016\/S0167-8191(99)00070-8_BIB78","doi-asserted-by":"crossref","first-page":"690","DOI":"10.1109\/TC.1979.1675439","article-title":"How to make a multiprocessor computer that correctly executes multiprocess programs","volume":"28","author":"Lamport","year":"1979","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB79","series-title":"DSP Processor Fundamentals Architectures and Features","author":"Lapsley","year":"1997"},{"issue":"9","key":"10.1016\/S0167-8191(99)00070-8_BIB80","doi-asserted-by":"crossref","DOI":"10.1109\/5.97301","article-title":"Programming real-time applications with SIGNAL","volume":"79","author":"Le Guernic","year":"1991","journal-title":"Proc. IEEE"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB81","doi-asserted-by":"crossref","unstructured":"E.A. Lee, D.G. Messerschmitt, Static scheduling of synchronous data flow programs for digital signal processing, IEEE Trans. Comput. (1987)","DOI":"10.1109\/TC.1987.5009446"},{"issue":"2","key":"10.1016\/S0167-8191(99)00070-8_BIB82","doi-asserted-by":"crossref","DOI":"10.1109\/71.89067","article-title":"Consistency in dataflow graphs","volume":"2","author":"Lee","year":"1991","journal-title":"IEEE Trans. Parallel Distributed Syst."},{"issue":"5","key":"10.1016\/S0167-8191(99)00070-8_BIB83","doi-asserted-by":"crossref","first-page":"773","DOI":"10.1109\/5.381846","article-title":"Dataflow process networks","volume":"83","author":"Lee","year":"1995","journal-title":"Proc. IEEE"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB84","unstructured":"E.A. Lee, A denotational semantics for dataflow with firing, Memorandum UCB\/ERL M97\/3, Electronics Research Laboratory, UC Berkeley, January 1997"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB85","doi-asserted-by":"crossref","unstructured":"D. Lenoski, J. Laudon, T. Joe, D. Nakahira, L. Stevens, A. Gupta, J. Hennessy. The DASH prototype: implementation and performance, in: Proceedings of the ISCA-19, Gold Coast, Australia, May 1992, pp. 92\u2013103","DOI":"10.1145\/139669.139706"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB86","unstructured":"W.-Y. Lin, J.-L. Gaudiot, I-structure software cache: a split-phase transaction runtime cache system, in: Proceedings of the 1996 Conference on Parallel Architectures and Compilation Techniques, Boston, Massachusetts, October 1996, pp. 122\u2013126"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB87","doi-asserted-by":"crossref","first-page":"38","DOI":"10.1109\/2.642810","article-title":"Seeking solutions in configurable computing","volume":"30","author":"Mangione-Smith","year":"1997","journal-title":"IEEE Comput."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB88","doi-asserted-by":"crossref","first-page":"115","DOI":"10.1109\/2.625338","article-title":"Application design for configurable computing","volume":"30","author":"Mangione-Smith","year":"1997","journal-title":"Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB89","series-title":"The Temporal Logic of Reactive and Concurrent Systems","author":"Manna","year":"1991"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB90","doi-asserted-by":"crossref","unstructured":"O.C. Maquelin, H.H.J. Hum, G.R. Gao, Costs and benefits of multithreading with off-the-shelf RISC processors, in: Proceedings of the EURO-PAR '95, no. 966 in Lecture Notes in Computer Science, Stockholm, Sweden, Springer, August 1995, pp. 117\u2013128","DOI":"10.1007\/BFb0020459"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB91","unstructured":"A. M\u00e1rquez, K.B. Theobald, X. Tang, T. Sterling, G.R. Gao, A superstrand architecture and its compilation, CAPSL Technical Memo 18, Department of Elec. and Computer Engineering, University of Delaware, Newark, Delaware, March 1998"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB92","unstructured":"A. Marquez, K.B. Theobald, X. Tang, G.R. Gao, A superstrand architecture and its compilation, in: Proceedings of the MTEAC99 Workshop held in conjunction with HPCA-5, Orlando, FL, January 1999"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB93","unstructured":"B. Mendelson, B. Patel, I. Koren, Designing special purpose co-processors using the data-flow paradigm, in: J.-L. Gaudiot, L. Bic (Eds.), Advanced Topics in Data-Flow Computing, Prentice-Hall, Englewood Cliffs, NJ, 1991, pp. 547\u2013570"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB94","doi-asserted-by":"crossref","unstructured":"B. Mendelson, G.M. Silberman, Mapping data flow programs on a VLSI array of processors, in: Proceedings of the International Symposium on Computer Architecture, Pittsburgh, Pennsylvania, June 1987, pp. 72\u201380","DOI":"10.1145\/30350.30359"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB95","doi-asserted-by":"crossref","unstructured":"W.A. Najjar, W.M. Miller, A.P.W. B\u00f6hm, An analysis of loop latency in dataflow execution, in: Proceedings of the ISCA-19, Gold Coast, Australia, May 1992, pp. 352\u2013360","DOI":"10.1145\/146628.140397"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB96","unstructured":"W. Najjar, J.-L. Gaudiot, Multi-level execution in data-flow architectures, in: Proceedings of the ICPP '87, St. Charles, Ill., August 1987, pp. 32\u201339"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB97","unstructured":"W. Najjar, A.P.W. Bohm, B. Draper, R. Beveridge, The Cameron Project, Colorado State University, Fort Collins, CO 1998, http:\/\/www.cs.colostate.edu\/cameron"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB98","doi-asserted-by":"crossref","unstructured":"S.S. Nemawarkar, Performance modeling and analysis of multithreaded architectures, Ph.D. Thesis, Montr\u00e9al, Qu\u00e9., August 1996","DOI":"10.1109\/MASCOT.1996.501002"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB99","doi-asserted-by":"crossref","unstructured":"R.S. Nikhil, Arvind, Can dataflow subsume von Neumann computing? in: Proceedings of the ISCA-16, Jerusalem, Israel, May\u2013June 1989, pp. 262\u2013272","DOI":"10.1145\/74926.74955"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB100","doi-asserted-by":"crossref","unstructured":"K. Okamoto, S. Sakai, H. Matsuoka, T. Yokota, H. Hirono, Multithread execution mechanisms on RICA-1 for massi vely parallel computation, in: Proceedings of the 1996 Conference on Parallel Architectures and Compilation Techniques, Boston, Massachusetts, October 1996, pp. 116\u2013121","DOI":"10.1109\/PACT.1996.552653"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB101","unstructured":"Oxford Hardware Compilation Group, The Handel Language, 1997"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB102","unstructured":"E.K. Pauer, C.S. Myers, P.D. Fiore, J.M. Smith, C.M. Crawford, E.A. Lee, J. Lundblad, C.X. Hylands, Algorithm analysis and mapping environment for adaptive computing systems, Second Annual Workshop on High Performance Embedded Computing, MIT Lincoln Labs, Lexington, MA, September 1998 (http:\/\/ptolemy.eecs.berkeley.edu\/papers\/98\/ACSmapping\/)"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB103","doi-asserted-by":"crossref","unstructured":"J. Rasure, S. Kubica, The KHOROS application development environment, in: J.L. Crowley (Ed.), Experimental Environments for Computer Vision and Image Processing, HICa, New Jersey, 1994","DOI":"10.1142\/9789812797827_0001"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB104","doi-asserted-by":"crossref","unstructured":"S.K. Reinhardt, J.R. Larus, D.A. Wood, Tempest and typhoon: user-level shared memory, in: Proceedings of the ISCA-21, Chicago, Ill., April 1994, pp. 325\u2013336","DOI":"10.1145\/192007.192062"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB105","unstructured":"X. Tang. Compiling for multithreaded architectures, Ph.D. Thesis, University of Delaware, Newark, DE, April 1999"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB106","doi-asserted-by":"crossref","unstructured":"S. Sakai, K. Okamoto, H. Matsuoka, H. Hirono, Y. Kodama, M. Sato, Super-threading: architectural and software mechanisms for optimizing parallel computation, in: Conference Proceedings of the 1993 International Conference on Supercomputing, Tokyo, Japan, July 1993, pp. 251\u2013260","DOI":"10.1145\/165939.165976"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB107","doi-asserted-by":"crossref","unstructured":"H. Schmit, Incremental reconfiguration for pipelined applications, IEEE Symposium on FPGAs for Custom Computing Machines, 1997","DOI":"10.1109\/FPGA.1997.624604"},{"issue":"26","key":"10.1016\/S0167-8191(99)00070-8_BIB108","doi-asserted-by":"crossref","first-page":"42","DOI":"10.1109\/MC.1993.274941","article-title":"Scaling parallel programs for multiprocessors: methodology and examples","volume":"6","author":"Singh","year":"1993","journal-title":"IEEE Computer"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB109","doi-asserted-by":"crossref","unstructured":"A. Sohn, M. Sato, N. Yoo, J.-L. Gaudiot, Data and workload distribution in a multithreaded architecture, J. Parallel Distributed Process. 1997, pp. 256\u2013264","DOI":"10.1006\/jpdc.1996.1262"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB110","doi-asserted-by":"crossref","unstructured":"X. Tang, J. Wang, K.B. Theobald, G.R. Gao, Thread partitioning and scheduling based on cost model, in: Proceedings of the SPAA `97, Newport, R hode Island, June 1997, pp. 272\u2013281","DOI":"10.1145\/258492.258519"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB111","doi-asserted-by":"crossref","unstructured":"X. Tang, G.R. Gao, How hard is thread partitioning and how bad is a list scheduling based partitioning algorithm? in: Proceedings of the Tenth Annual ACM Symposium on Parallel Algorithms and Architectures, Puerto Vallarta, Mexico, June 1998","DOI":"10.1145\/277651.277679"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB112","unstructured":"K.B. Theobald. EARTH: an efficient architecture for running threads, Ph.D. Thesis, Montr\u00e9al, Qu\u00e9., January 1999"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB113","doi-asserted-by":"crossref","unstructured":"T. von Eicken, D.E. Culler, S.C. Goldstein, K.E. Schauser, Active messages: a mechanism for integrated communication and computation, in: Proceedings of the ISCA-19, Gold Coast, Australia, May 1992, pp. 256\u2013266","DOI":"10.1145\/139669.140382"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB114","doi-asserted-by":"crossref","unstructured":"J. Vuillemin et al., Programmable active memories: reconfigurable systems come of age, IEEE Trans. on VLSI Syst. (1996)","DOI":"10.1109\/92.486081"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB115","doi-asserted-by":"crossref","first-page":"86","DOI":"10.1109\/2.612254","article-title":"Baring it all to software: raw machines","volume":"30","author":"Waingold","year":"1997","journal-title":"IEEE Comput."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB116","doi-asserted-by":"crossref","unstructured":"M. Warren, J.K. Salmon, A parallel hashed oct-tree n-body algorithm, in: Proceedings of the Supercomputing '93, Portland, Oregon, November 1993, pp. 12\u201321","DOI":"10.1145\/169627.169640"},{"issue":"4","key":"10.1016\/S0167-8191(99)00070-8_BIB117","doi-asserted-by":"crossref","first-page":"308","DOI":"10.1006\/jpdc.1993.1114","article-title":"Architectural improvements for a data-driven vlsi processing array","volume":"19","author":"Weiss","year":"1993","journal-title":"J. Parallel Distributed Comput."},{"key":"10.1016\/S0167-8191(99)00070-8_BIB118","unstructured":"N. Wirth, The Hardware Description Language Lola, June 1995"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB119","doi-asserted-by":"crossref","unstructured":"M.J. Wirthlin, B.L. Hutchings, DISC : the dynamic instruction set computer, in: J. Schewel (Ed.), Field Programmable Gate Arrays for Fast Board Development and Reconfigurable Computing, vol. SPIE 2607, 1995, pp. 92\u2013103","DOI":"10.1117\/12.221328"},{"key":"10.1016\/S0167-8191(99)00070-8_BIB120","doi-asserted-by":"crossref","unstructured":"M.J. Wirthlin, B.L. Hutchings, Improving functional density through run time constant propogation, in: International Symposium on Field Programmable Gate Arrays, April 1997, pp. 86\u201392","DOI":"10.1145\/258305.258316"}],"container-title":["Parallel Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167819199000708?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167819199000708?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,12,4]],"date-time":"2024-12-04T07:55:16Z","timestamp":1733298916000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0167819199000708"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1999,12]]},"references-count":120,"journal-issue":{"issue":"13-14","published-print":{"date-parts":[[1999,12]]}},"alternative-id":["S0167819199000708"],"URL":"https:\/\/doi.org\/10.1016\/s0167-8191(99)00070-8","relation":{},"ISSN":["0167-8191"],"issn-type":[{"value":"0167-8191","type":"print"}],"subject":[],"published":{"date-parts":[[1999,12]]}}}