%%% -*-BibTeX-*- %%% ==================================================================== %%% BibTeX-file{ %%% author = "Nelson H. F. Beebe", %%% version = "1.04", %%% date = "25 October 2010", %%% time = "17:27:12 MDT", %%% filename = "supercomputing91.bib", %%% address = "University of Utah %%% Department of Mathematics, 110 LCB %%% 155 S 1400 E RM 233 %%% Salt Lake City, UT 84112-0090 %%% USA", %%% telephone = "+1 801 581 5254", %%% FAX = "+1 801 581 4148", %%% URL = "http://www.math.utah.edu/~beebe", %%% checksum = "13008 2282 10580 106056", %%% email = "beebe at math.utah.edu, beebe at acm.org, %%% beebe at ieee.org (Internet)", %%% codetable = "ISO/ASCII", %%% keywords = "bibliography, BibTeX, Supercomputing '91", %%% license = "public domain", %%% supported = "yes", %%% docstring = "This is a complete bibliography of papers %%% published in the proceedings of %%% Supercomputing '91. %%% %%% The organizers of this conference series %%% maintain a World-Wide Web site at %%% %%% http://www.supercomp.org/ %%% %%% where pointers to Web pages for the %%% conferences from 1994 to date may be found. %%% %%% At version 1.04, the year coverage looked %%% like this: %%% %%% 1991 ( 92) %%% %%% InProceedings: 91 %%% Proceedings: 1 %%% %%% Total entries: 92 %%% %%% This bibliography was prepared from data %%% collected from major library catalogs, from %%% the IEEE INSPEC database, and from the TeX %%% User Group bibliography archive. %%% %%% In this bibliography, entries are sorted in %%% publication order, using ``bibsort %%% -byvolume''. %%% %%% The checksum field above contains a CRC-16 %%% checksum as the first value, followed by the %%% equivalent of the standard UNIX wc (word %%% count) utility output of lines, words, and %%% characters.
This is produced by Robert
%%%                        Solovay's checksum utility.",
%%%  }
%%% ====================================================================

%%% ====================================================================
%%% Acknowledgement abbreviations:

@String{ack-nhfb = "Nelson H. F. Beebe, University of Utah, Department of Mathematics, 110 LCB, 155 S 1400 E RM 233, Salt Lake City, UT 84112-0090, USA, Tel: +1 801 581 5254, FAX: +1 801 581 4148, e-mail: \path|beebe@math.utah.edu|, \path|beebe@acm.org|, \path|beebe@ieee.org| (Internet), URL: \path|http://www.math.utah.edu/~beebe/|"}

%%% ====================================================================
%%% Publishers and their addresses:

@String{pub-IEEE = "IEEE Computer Society Press"}
@String{pub-IEEE:adr = "1109 Spring Street, Suite 300, Silver Spring, MD 20910, USA"}

%%% ====================================================================
%%% Bibliography entries.

@InProceedings{Pugh:1991:OTF,
  author          = "W. Pugh",
  title           = "The {Omega} test: a fast and practical integer programming algorithm for dependence analysis",
  crossref        = "IEEE:1991:PSA",
  pages           = "4--13",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C1180 (Optimisation techniques); C4240 (Programming and algorithm theory); C6150G (Diagnostic, testing, debugging and evaluating systems)",
  corpsource      = "Dept. of Comput. Sci., Maryland Univ., College Park, MD, USA",
  keywords        = "approximate algorithms; array references; computational complexity; dependence analysis; Fourier-Motzkin variable elimination; integer programming; integer programming algorithm; Omega test; polynomial time complexity; production compilers; program testing; worst-case exponential time complexity",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Loeliger:1991:PTT,
  author          = "J. Loeliger and R. Metzger and M. Seligman and S.
Stroud",
  title           = "Pointer target tracking --- an empirical study",
  crossref        = "IEEE:1991:PSA",
  pages           = "14--23",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6150C (Compilers, interpreters and other processors)",
  keywords        = "C-series supercomputers; language-independent interprocedural optimizer; pointer target tracking; program compilers",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Mellor-Crummey:1991:ODD,
  author          = "J. Mellor-Crummey",
  title           = "On-the-fly detection of data races for programs with nested fork-join parallelism",
  crossref        = "IEEE:1991:PSA",
  pages           = "24--33",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5640 (Protocols); C6110P (Parallel programming); C6150G (Diagnostic, testing, debugging and evaluating systems)",
  corpsource      = "Center for Res. on Parallel Comput., Rice Univ., Houston, TX, USA",
  keywords        = "data races for programs; debugging; dynamic nesting; monitored program execution; nested fork-join parallelism; on-the-fly detection; parallel constructs; parallel programming; program debugging; program testing; protocol; protocols; run-time detection; shared-memory programs; worst-case run-time overhead",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Picano:1991:PCE,
  author          = "S. Picano and E. D. {Brooks, III} and J. E. Hoag",
  title           = "Programming costs of explicit memory localization on a large scale shared memory multiprocessor",
  crossref        = "IEEE:1991:PSA",
  pages           = "36--45",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5440 (Multiprocessor systems and techniques); C6110P (Parallel programming); C6120 (File organisation)",
  corpsource      = "Sch. of Electr.
Eng., Purdue Univ., West Lafayette, IN, USA",
  keywords        = "BBN TC2000; buffer storage; explicit memory localization; large scale shared memory multiprocessor; MIMD parallel computer; multiprocessing systems; network simulation program; parallel programming; performance gains; programming costs; software controlled cache coherence mechanism; storage management",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Shing:1991:CMD,
  author          = "H. Shing and L. M. Ni",
  title           = "A conflict-free memory design for multiprocessors",
  crossref        = "IEEE:1991:PSA",
  pages           = "46--55",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5310 (Storage system design); C5440 (Multiprocessor systems and techniques); C6120 (File organisation)",
  corpsource      = "Dept. of Comput. Sci., Michigan State Univ., East Lansing, MI, USA",
  keywords        = "conflict-free memory design; data consistency; file organisation; hot spot problem; interconnection network structure; low cost mechanism; low latency; memory architecture; multiprocessing systems; multiprocessors; process synchronization; shared memory organization; synchronisation",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

%%% The title below begins with the article ``An'' (previously ``A ultra
%%% fast'').  The citation key is unaffected because it skips articles.
@InProceedings{deDinechin:1991:UFE,
  author          = "B. D. {de Dinechin}",
  title           = "An ultra fast {Euclidean} division algorithm for prime memory systems",
  crossref        = "IEEE:1991:PSA",
  pages           = "56--65",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5230 (Digital arithmetic methods); C5310 (Storage system design)",
  corpsource      = "CEA, Centre d'Etudes de Limeil-Valenton, Villeneuve St.
George, France",
  keywords        = "address mapping; address skewing; digital arithmetic; hardware implementation; image processing memory systems; memory architecture; multibank memory design; nonlinear skewing schemes; prime memory systems; supercomputer; two's complement binary arithmetic; ultra fast Euclidean division algorithm",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Cohen:1991:HSS,
  author          = "M. Cohen and M. Foster and D. Kratzer and P. Malone and A. Solem",
  title           = "A high school supercomputing challenge",
  crossref        = "IEEE:1991:PSA",
  pages           = "68--75",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5440 (Multiprocessor systems and techniques); C7810C (Computer-aided instruction)",
  corpsource      = "Los Alamos Nat. Lab., NM, USA",
  keywords        = "computational science project; educational computing; high school supercomputing challenge; high-performance computers; parallel processing; science and computing knowledge",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Sadananda:1991:CCA,
  author          = "R. Sadananda",
  title           = "Chaotic cardiac arrhythmias",
  crossref        = "IEEE:1991:PSA",
  pages           = "76--84",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A8730C (Electrical activity); C7330 (Biology and medicine)",
  corpsource      = "Dept. of Biomed. Eng., Northwestern Univ., Evanston, IL, USA",
  keywords        = "cardiology; chaotic cardiac arrhythmias; computer simulation; coupled biological oscillators; digital simulation; fibrillations; medical computing; myocardial cells; nonlinear equations; phase locking; phase response behavior; physiological models; piecewise linear equations",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Hiranandani:1991:COF,
  author          = "S. Hiranandani and K. Kennedy and C.-W.
Tseng",
  title           = "Compiler optimizations for {Fortran D} on {MIMD} distributed-memory machines",
  crossref        = "IEEE:1991:PSA",
  pages           = "86--100",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5440 (Multiprocessor systems and techniques); C6140D (High level languages); C6150C (Compilers, interpreters and other processors)",
  corpsource      = "Dept. of Comput. Sci., Rice Univ., Houston, TX, USA",
  keywords        = "code generation strategy; communication costs; compiler optimisation; data decomposition; data dependence; FORTRAN; Fortran D; iPSC/860; load imbalance; MIMD distributed-memory machines; node programs; parallel machines; program compilers",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}
%%% In the entry above the language name is written ``Fortran D'' (two
%%% words), agreeing with the spelling in that entry's keywords field.

%%% Title reads ``Compile-time'' (previously ``Compiler-time''), agreeing
%%% with the keyword ``compile-time generation'' and the key initials CGR.
@InProceedings{Koelbel:1991:CGR,
  author          = "C. Koelbel",
  title           = "Compile-time generation of regular communications patterns",
  crossref        = "IEEE:1991:PSA",
  pages           = "101--110",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6150C (Compilers, interpreters and other processors); C6150N (Distributed systems)",
  corpsource      = "Center for Res. on Parallel Comput., Rice Univ., Houston, TX, USA",
  keywords        = "block-distributed arrays; communication of nonlocal values; compile time analysis; compile-time generation; cyclicly-distributed arrays; distributed memory machine; distributed processing; global name space; Kali language; mapping; numerical algorithms; program compilers; regular communications patterns; run-time analysis",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

%%% NOTE(review): first author's surname changed to ``Ramanujam'', which is
%%% believed to be the spelling on the published paper; confirm against the
%%% proceedings.  The citation key is deliberately left unchanged so that
%%% existing citations keep resolving.
@InProceedings{Ramanujan:1991:TMI,
  author          = "J. Ramanujam and P.
Sadayappan",
  title           = "Tiling multidimensional iteration spaces for nonshared memory machines",
  crossref        = "IEEE:1991:PSA",
  pages           = "111--120",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6110P (Parallel programming); C6150C (Compilers, interpreters and other processors)",
  corpsource      = "Dept. of Electr. and Comput. Eng., Louisiana State Univ., Baton Rouge, LA, USA",
  keywords        = "deadlock-free tiles; loop iterations; multiply nested loops; nested loops; nonshared memory machines; parallel programming; partitioning; program compilers; tiling multidimensional iteration spaces",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Kung:1991:NAA,
  author          = "H. T. Kung and J. Subhlok",
  title           = "A new approach for automatic parallelization of block linear algebra computations",
  crossref        = "IEEE:1991:PSA",
  pages           = "122--129",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C4140 (Linear algebra); C6110P (Parallel programming)",
  corpsource      = "Sch. of Comput. Sci., Carnegie Mellon Univ., Pittsburgh, PA, USA",
  keywords        = "automatic generation; automatic parallelization; block linear algebra computations; block routines; data distribution scheme; fine-grain parallel architectures; fully automatic system; highly parallel systolic algorithms; iWarp; LAPACK; linear algebra; parallel programming; parallel programs; performance results; sequential block routine",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Markstein:1991:WFF,
  author          = "V. Markstein and P. Markstein and T. Nguyen and S.
Poole",
  title           = "Wide format floating-point math libraries",
  crossref        = "IEEE:1991:PSA",
  pages           = "130--138",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5230 (Digital arithmetic methods); C5470 (Performance evaluation and testing); C7310 (Mathematics)",
  corpsource      = "ISQUARE, Inc., Austin, TX, USA",
  keywords        = "128 bit; 64 bit; accuracy evaluations; Convex C-240; Cray Y-MP; digital arithmetic; floating-point formats; Hewlett--Packard 9000/720; IBM 3090E/VF; IBM System/6000; math libraries; mathematics computing; parallel processing; performance; performance evaluation; transcendental functions; wide format floating point math libraries",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Nicholas:1991:DCD,
  author          = "H. Nicholas and G. Giras and V. Hartonas-Garmhausen and M. Kopko and C. Maher and A. Ropelewski",
  title           = "Distributing the comparison of {DNA} and protein sequences across heterogeneous supercomputers",
  crossref        = "IEEE:1991:PSA",
  pages           = "139--146",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A8715 (Molecular biophysics); C7330 (Biology and medicine)",
  corpsource      = "Pittsburgh Supercomputing Center, PA, USA",
  keywords        = "control program; Cray Y-MP; DNA; DNA sequences; heterogeneous supercomputers; libraries; MaxSegs algorithm; medical computing; protein sequences; proteins; Thinking Machines CM-2 system; workstation",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Simmons:1991:PCT,
  author          = "M. L. Simmons and H. J. Wasserman and O. M. Lubeck and C. Eoyang and R. Mendez and H. Harada and M.
Ishiguro",
  title           = "A performance comparison of three supercomputers: {Fujitsu VP-2600}, {NEC SX-3}, and {Cray Y-MP}",
  crossref        = "IEEE:1991:PSA",
  pages           = "150--157",
  year            = "1991",
  bibdate         = "Sat Oct 24 13:05:56 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing)",
  corpsource      = "Los Alamos Nat. Lab., NM, USA",
  keywords        = "Cray Y-MP; Fujitsu VP-2600; highly vectorizable production-type codes; memory bandwidth; Mendez Fluid dynamics codes; multiple vector pipelines; NEC SX-3; parallel processing; performance comparison; performance evaluation; second-generation supercomputers; standard Los Alamos benchmark set; supercomputers; vector register organization",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical; R Product Review",
}

%%% In the entry below, the title dash is written `` --- '' (as in the
%%% Loeliger entry's title) instead of a bare hyphen, and the corpsource
%%% typo ``Centr'' is corrected to ``Center''.
@InProceedings{Bailey:1991:NPB,
  author          = "D. H. Bailey and E. Barszcz and J. T. Barton and D. S. Browning and R. L. Carter and L. Dagum and R. A. Fatoohi and P. O. Frederickson and T. A. Lasinski and R. S. Schreiber and H. D. Simon and V. Venkatakrishnan and S. K. Weeratunga",
  title           = "The {NAS} parallel benchmarks --- summary and preliminary results",
  crossref        = "IEEE:1991:PSA",
  pages           = "158--165",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A4710 (General theory, simulation and other computational methods); C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing); C7460 (Aerospace engineering)",
  corpsource      = "NASA Ames Res. Center, Moffett Field, CA, USA",
  keywords        = "aerospace computing; CFD codes; computational aerosciences applications; computer fluid dynamics; data motions; flow simulation; highly parallel systems; NAS parallel benchmarks; numerical aerodynamic simulation; parallel kernels; parallel processing; performance evaluation; supercomputers",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Bailey:1991:PRT,
  author          = "D. H.
Bailey and P. O. Frederickson",
  title           = "Performance results for two of the {NAS} parallel benchmarks",
  crossref        = "IEEE:1991:PSA",
  pages           = "166--173",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A4710 (General theory, simulation and other computational methods); C1140G (Monte Carlo methods); C4190 (Other numerical methods); C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing); C7460 (Aerospace engineering)",
  corpsource      = "NASA Ames Res. Center, Moffett Field, CA, USA",
  keywords        = "aerospace computing; Connection Machine-2; Cray Y-MP; fast Fourier transforms; flow simulation; implementation schemes; Intel iPSC/860; Monte Carlo methods; Monte Carlo statistical calculation; numerical aerodynamic simulation; parallel benchmarks; parallel computer systems; parallel processing; performance evaluation; performance results; Poisson partial differential equation solver; three-dimensional fast Fourier transforms",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

%%% In the keywords below, ``look-ahead'' is written without the stray
%%% space after the hyphen that a line wrap had introduced.
@InProceedings{Baer:1991:EOP,
  author          = "J.-L. Baer and T.-F. Chen",
  title           = "An effective on-chip preloading scheme to reduce data access penalty",
  crossref        = "IEEE:1991:PSA",
  pages           = "176--186",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5310 (Storage system design); C6120 (File organisation)",
  corpsource      = "Dept. of Comput. Sci. and Eng., Washington Univ., Seattle, WA, USA",
  keywords        = "buffer storage; clock cycles; data access penalty reduction; data cache misses; file organisation; hardware support function; instruction stream; look-ahead program counter; memory access models; memory architecture; memory latency; on-chip data cache; on-chip preloading scheme; operand references; reference prediction table; trace-driven simulation",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Bird:1991:ULR,
  author          = "P. L. Bird and R. A.
Uhlig",
  title           = "Using lookahead to reduce memory bank contention for decoupled operand references",
  crossref        = "IEEE:1991:PSA",
  pages           = "187--196",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C4240 (Programming and algorithm theory); C5310 (Storage system design); C6120 (File organisation)",
  corpsource      = "Adv. Comput. Res. Inst., Lyon, France",
  keywords        = "bank management hardware; complexity; computational complexity; decoupled operand references; high throughput memory designs; lookahead; memory architecture; memory bank contention reduction; operand references; simulation; storage management; storage system control structure; table lookup",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Dubois:1991:DCE,
  author          = "M. Dubois and J.-C. Wang and L. A. Barroso and K. Lee and Y.-S. Chen",
  title           = "Delayed consistency and its effects on the miss rate of parallel programs",
  crossref        = "IEEE:1991:PSA",
  pages           = "197--206",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C4240P (Parallel programming and algorithm theory); C5640 (Protocols); C6110P (Parallel programming)",
  corpsource      = "Dept. of Electr. Eng. Syst., Univ. of Southern California, Los Angeles, CA, USA",
  keywords        = "cache-based systems; complexity; computational complexity; delayed consistency; delayed protocols; execution-driven simulations; miss rate; parallel algorithms; parallel programming; parallel programs; performance comparison; protocols; weakly ordered consistency model",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

%%% Third author's surname restored to ``Anderson'' (it had been
%%% truncated to ``Anderso'').
@InProceedings{Hatcher:1991:ASP,
  author          = "P. J. Hatcher and M. J. Quinn and R. J. Anderson and A. J. Lapadula and B. K. Seevers and A. F.
Bennett",
  title           = "Architecture-independent scientific programming in dataparallel {C}: three case studies",
  crossref        = "IEEE:1991:PSA",
  pages           = "208--217",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6110P (Parallel programming); C6140D (High level languages); C6150C (Compilers, interpreters and other processors); C7340 (Geophysics)",
  corpsource      = "Dept. of Comput. Sci., New Hampshire Univ., Durham, NH, USA",
  keywords        = "architecture independent scientific programming; C code; C language; compiled programs; dataparallel C; geophysics computing; Intel iPSC/2; multicomputers; multiprocessors; nCUBE 3200; ocean circulation model; parallel programming; performance; program compilers; Sequent Symmetry S81; shallow-water atmospheric model; Sharks World model; SIMD programming language",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}
%%% In the entry above, the corpsource state code is ``NH'' (New
%%% Hampshire), consistent with the institution named; it previously
%%% read ``NC''.

%%% In the entry below, the missing ``; '' separator between the C4170
%%% and C4185 classification codes is restored.
@InProceedings{Hirayama:1991:SFP,
  author          = "H. Hirayama and M. Ikeda and N. Sagawa",
  title           = "Solution functions of {PDEQSOL} (partial differential equation solver language) for fluid problems",
  crossref        = "IEEE:1991:PSA",
  pages           = "218--227",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C4170 (Differential equations); C4185 (Finite element analysis); C6110P (Parallel programming); C6115 (Programming support); C7320 (Physics and Chemistry)",
  corpsource      = "Hitachi VLSI Eng.
Ltd., Tokyo, Japan",
  keywords        = "benchmark; finite element analysis; finite element method; fluid problems; Fortran 77 program; integrated problem-solving environment; integrated software; parallel programming; partial differential equation solver language; partial differential equations; performance evaluation; physics computing; problem solving; programming environments; solution algorithms; supercomputers; translator; vectorization ratios; very high-level descriptions",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}

%%% In the keywords below, ``N-body'' is written without the stray space
%%% after the hyphen that a line wrap had introduced.
@InProceedings{Sethian:1991:CTF,
  author          = "J. A. Sethian and J.-P. Brunet and A. Greenberg and J. P. Mesirov",
  title           = "Computing turbulent flow in complex geometries on a massively parallel processor",
  crossref        = "IEEE:1991:PSA",
  pages           = "230--241",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A4710 (General theory, simulation and other computational methods); A4725 (Turbulent flows, convection, and heat transfer); C5440 (Multiprocessor systems and techniques); C7320 (Physics and Chemistry)",
  corpsource      = "Dept. of Math., California Univ., Berkeley, CA, USA",
  keywords        = "adaptive creation; complex geometries; computational element; Connection Machine CM-2; flow simulation; Lagrangian schemes; massively parallel processor; merger; parallel data structures; parallel elliptic solvers; parallel N-body solvers; parallel processing; physics computing; random vortex method; rollup; turbulence; turbulent flow computing; vortex shedding",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}

@InProceedings{Elton:1991:LBM,
  author          = "B. H.
Elton",
  title           = "A lattice {Boltzmann} method for a two-dimensional viscous {Burgers} equation: computational results",
  crossref        = "IEEE:1991:PSA",
  pages           = "242--252",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A5110 (Kinetic and transport theory); C4170 (Differential equations); C7320 (Physics and Chemistry)",
  corpsource      = "Fujitsu America Inc., San Jose, CA, USA",
  keywords        = "Boltzmann equation; computational results; conditionally monotone finite difference method; difference equations; flow simulation; kinetic theory of gases; l/sub 1/-norm; lattice Boltzmann method; nonlinear advection-diffusion equation; physics computing; two-dimensional viscous Burgers equation",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical; T Theoretical or Mathematical",
}

%%% The author list below previously ended ``... and Moore and R. W.'',
%%% which BibTeX parses as two separate people; it now names the single
%%% author ``R. W. Moore''.
%%% NOTE(review): the surnames ``Farrara'' and ``Spahr'' (previously
%%% ``Farrar'' and ``Saphr'') follow what is believed to be the published
%%% author list; confirm against the proceedings.
@InProceedings{Mechoso:1991:DCM,
  author          = "C. R. Mechoso and C.-C. Ma and J. D. Farrara and J. A. Spahr and R. W. Moore",
  title           = "Distribution of a climate model across high-speed networks",
  crossref        = "IEEE:1991:PSA",
  pages           = "253--260",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A9260S (Climatology); A9385 (Instrumentation and techniques for geophysical, hydrospheric and lower atmosphere research); A9575P (Mathematical and computer techniques); C7340 (Geophysics); C7350 (Astronomy and astrophysics)",
  corpsource      = "Dept. of Atmos. Sci., Los Angeles Univ., CA, USA",
  keywords        = "astrophysics computing; atmospheric techniques; climate model; climatology; coupled atmosphere-ocean general circulation model; geographically separated locations; geophysics computing; heterogeneous computing environments; high-speed networks; parallelism",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}

@InProceedings{Cann:1991:RFD,
  author          = "D. Cann",
  title           = "Retire {FORTRAN}?
{A} debate rekindled",
  crossref        = "IEEE:1991:PSA",
  pages           = "264--272",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6110P (Parallel programming); C6140D (High level languages)",
  corpsource      = "Lawrence Livermore Nat. Lab., CA, USA",
  keywords        = "abstraction; Cray Sisal; FORTRAN; functional language; parallel execution; parallel programming; performance; programming language; scientific computing",
  sponsororg      = "IEEE; ACM",
  treatment       = "G General Review; P Practical",
}

@InProceedings{Lee:1991:OOP,
  author          = "J. K. Lee and D. Gannon",
  title           = "Object oriented parallel programming experiments and results",
  crossref        = "IEEE:1991:PSA",
  pages           = "273--282",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6110J (Object-oriented programming); C6110P (Parallel programming); C6115 (Programming support)",
  corpsource      = "Dept. of Comput. Sci., Indiana Univ., Bloomington, IN, USA",
  keywords        = "data distribution; distributed collection model; massive parallelism; memory locality; object oriented parallel programming; object-oriented programming; parallel programming; PC++; performance; programming environments",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Gursoy:1991:HLS,
  author          = "A. Gursoy and L. V. Kale",
  title           = "High level support for divide-and-conquer parallelism",
  crossref        = "IEEE:1991:PSA",
  pages           = "283--292",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C6110P (Parallel programming); C6140D (High level languages)",
  corpsource      = "Dept. of Comput.
Sci., Illinois Univ., Urbana, IL, USA",
  keywords        = "C language; Chare Kernel parallel programming; divide-and-conquer parallelism; dynamic load balancing; high level languages; high level support; iPSC/2; machine-independent execution; NCUBE/two; parallel programming; Sequent symmetry; synchronisation; synchronization; translator",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Ewing:1991:VPI,
  author          = "R. Ewing and P. O'Leary and J. Sochacki",
  title           = "Vector\slash parallel implementation of a porous media flow code",
  crossref        = "IEEE:1991:PSA",
  pages           = "294--303",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A4710 (General theory, simulation and other computational methods); A4755M (Flow through porous media); C4240 (Programming and algorithm theory); C7340 (Geophysics)",
  corpsource      = "Inst. for Sci. Comput., Wyoming Univ., Laramie, WY, USA",
  keywords        = "computational complexity; computational model; flow simulation; flow through porous media; geophysics computing; large-scale simulation; miscible fluids; oil recovery processes; porous media flow code; supercomputing; timings; viscous fingering",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}

@InProceedings{Young:1991:HPV,
  author          = "L. C. Young and S. E.
Zarantonello",
  title           = "High performance vector processing in reservoir simulation",
  crossref        = "IEEE:1991:PSA",
  pages           = "304--315",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A4710 (General theory, simulation and other computational methods); A4755M (Flow through porous media); C4170 (Differential equations); C5440 (Multiprocessor systems and techniques); C7340 (Geophysics)",
  corpsource      = "Reservoir Simulation Research Corp., Tulsa, OK, USA",
  keywords        = "600 MFLOPS; black-oil problems; computational performance; difference equations; finite-difference formulation; flow simulation; flow through porous media; Fujitsu VP2600/10 supercomputer; geophysics computing; high performance vector processing; parallel processing; reservoir simulation",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}
%%% NOTE(review): in the entry above, the second author's surname is
%%% spelled ``Zarantonello'' (previously ``Zaratonello''), believed to be
%%% the published spelling; confirm against the proceedings.

%%% The title below gives the rate as 14 Gigaflops (previously 15),
%%% agreeing with this entry's own keyword ``14 GFLOPS''.
@InProceedings{Myczkowski:1991:SMA,
  author          = "J. Myczkowski and G. Steele",
  title           = "Seismic modeling at {14 Gigaflops} on the {Connection Machine}",
  crossref        = "IEEE:1991:PSA",
  pages           = "316--326",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "A9130 (Seismology); C4170 (Differential equations); C5440 (Multiprocessor systems and techniques); C7340 (Geophysics)",
  corpsource      = "Thinking Machines Corp., Cambridge, MA, USA",
  keywords        = "14 GFLOPS; acoustic wave equation; CM-2 supercomputer; Connection Machine; difference equations; finite difference algorithm; floating point unit; geophysics computing; instruction sequence; interprocessor grid communication; massively parallel machine; memory interface; parallel processing; seismic modelling code; seismology; sponge boundary conditions; stencil compiler",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}

@InProceedings{Dongarra:1991:GBP,
  author          = "J. J. Dongarra and A. Karp and K. Miura and H. D.
Simon",
  title           = "{Gordon Bell Prize} lectures (supercomputer applications)",
  crossref        = "IEEE:1991:PSA",
  pages           = "328--337",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5440 (Multiprocessor systems and techniques)",
  corpsource      = "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN, USA",
  keywords        = "128-node Intel iPSC/860; compiler speedup; Connection Machine; electronic structure; floating point processors; Fortran 77; Fortran 90; grid generation program; parallel processing; partial differential equation; price/performance award; scientific and engineering problems; supercomputers",
  sponsororg      = "IEEE; ACM",
  treatment       = "G General Review; P Practical",
}
%%% In the entry above, the keyword ``Connection Machine'' (previously
%%% ``Connections Machine'') now uses the same spelling as the other
%%% entries in this file.

@InProceedings{Sabot:1991:CPE,
  author          = "G. Sabot and L. Tennies and A. Vasilevsky and R. Shapiro",
  title           = "Compiler parallelization of an elliptic grid generator for {1990 Gordon Bell Prize}",
  crossref        = "IEEE:1991:PSA",
  pages           = "338--346",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C5440 (Multiprocessor systems and techniques); C6150C (Compilers, interpreters and other processors)",
  corpsource      = "Thinking Machines Corp., Cambridge, MA, USA",
  keywords        = "1990 Gordon Bell Prize; application code; automatically parallelizing compiler; compiler parallelisation; Connection Machine Fortran 1.0 compiler; cycle counting analysis; elliptic grid generator; FORTRAN; Fortran program; numerical simulation; parallel processing; program compilers; Sun workstation",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Beal:1991:GAP,
  author          = "D. Beal and C.
Lambrinoudakis",
  title           = "{GPFP}: an array processing element for the next generation of massively parallel supercomputer architectures",
  crossref        = "IEEE:1991:PSA",
  pages           = "348--357",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "B1265F (Microprocessors and microcomputers); B2570D (CMOS integrated circuits); C5130 (Microprocessor chips); C5220P (Parallel architecture); C5230 (Digital arithmetic methods)",
  corpsource      = "Dept. of Comput. Sci., Queen Mary and Westfield Coll., London Univ., UK",
  keywords        = "1.6 micron; 2.5 GFLOPS; 50 MHz; 50-MHz clock; ALU; arithmetic and logic unit; array processing element; CMOS integrated circuits; CMOSIC; cost-effective extra functionality; digital arithmetic; floating point arithmetic; general purpose with floating point support; GPFP; MasPar; massively parallel SIMD arrays; massively parallel supercomputer architectures; microprocessor chips; on-chip memory; parallel architectures; processing element; VLSI",
  sponsororg      = "IEEE; ACM",
  treatment       = "P Practical",
}

@InProceedings{Karmarkar:1991:NPA,
  author          = "N. Karmarkar",
  title           = "A new parallel architecture for sparse matrix computation based on finite projective geometries",
  crossref        = "IEEE:1991:PSA",
  pages           = "358--369",
  year            = "1991",
  bibdate         = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification  = "C4140 (Linear algebra); C5220P (Parallel architecture)",
  corpsource      = "AT and T Bell Labs., Murray Hill, NJ, USA",
  keywords        = "data-routing; finite projective geometries; load balancing; mathematical structure; matrix algebra; memory-access conflicts; parallel architecture; parallel architectures; parallel systems; pattern of interconnection; sparse matrix computation",
  sponsororg      = "IEEE; ACM",
  treatment       = "A Application; P Practical",
}

@InProceedings{Jordan:1991:TMO,
  author          = "H. F. Jordan and V. P.
Heuring",
  title = "Time multiplexed optical computers",
  crossref = "IEEE:1991:PSA",
  pages = "370--378",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B4125 (Fibre optics); B4180 (Optical logic devices and optical computing techniques); C5270 (Optical computing techniques)",
  corpsource = "Dept. of Electr. and Comput. Eng., Colorado Univ., Boulder, CO, USA",
  keywords = "architecture; bit serial; directional couplers; interconnection; logic devices; optical counter; optical fibers; optical fibres; optical information processing; proof-of-principle experiment; temporal latency; time division multiplexing; time multiplexed optical computers",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Fiduccia:1991:UMN,
  author = "C. M. Fiduccia and E. M. Jacobson",
  title = "Universal multistage networks via linear permutations",
  crossref = "IEEE:1991:PSA",
  pages = "380--389",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C1160 (Combinatorial mathematics); C4230M (Multiprocessor interconnection)",
  corpsource = "Supercomputing Res. Center, Bowie, MD, USA",
  keywords = "de Bruijn graph; directed 2-graphs; directed graphs; invertible linear operator; linear permutations; multiprocessor interconnection networks; N/2 nodes; shuffle-exchange network; universal multistage networks",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; T Theoretical or Mathematical",
}

@InProceedings{Wei:1991:DAE,
  author = "S. Wei and S. Levy",
  title = "Design and analysis of efficient hierarchical interconnection networks",
  crossref = "IEEE:1991:PSA",
  pages = "390--399",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4230M (Multiprocessor interconnection); C5670 (Network performance)",
  corpsource = "Dept. of Comput.
Sci., Rutgers Univ., New Brunswick, NJ, USA",
  keywords = "average internode distance; design parameters; diameter; fault tolerance capability; hierarchical interconnection networks; intercluster traffic density; interface nodes; message-passing architectures; multiprocessor interconnection networks; performance evaluation; performance measures",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Farrens:1991:ATS,
  author = "M. Farrens and B. Wetmore and A. Woodruff",
  title = "Alleviation of tree saturation in multistage interconnection networks",
  crossref = "IEEE:1991:PSA",
  pages = "400--409",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C1160 (Combinatorial mathematics); C4230M (Multiprocessor interconnection); C5670 (Network performance)",
  corpsource = "Div. of Comput. Sci., California Univ., Davis, CA, USA",
  keywords = "bleeding; feedback damping scheme; feedback threshold value; hot spot contention; memory modules; memory queue size; multiprocessor interconnection networks; multistage interconnection networks; network simulation; performance evaluation; system performance; tree saturation alleviation; trees (mathematics)",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; T Theoretical or Mathematical",
}

@InProceedings{Cheng:1991:EAI,
  author = "D. Y. Cheng and D. M. Pase",
  title = "An evaluation of automatic and interactive parallel programming tools",
  crossref = "IEEE:1991:PSA",
  pages = "412--423",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5470 (Performance evaluation and testing); C6110P (Parallel programming); C6115 (Programming support); C7460 (Aerospace engineering)",
  corpsource = "NASA Ames Res.
Center, Moffett Field, CA, USA",
  keywords = "aerospace computing; aerospace simulation; automatic tools; benchmarks; code transformation; Cray Y-MP; interactive parallel programming tools; interactive systems; machine-specific optimizations; NAS; Numerical Aerodynamics Simulation; parallel programming; performance; performance degradation; performance evaluation; software tools",
  sponsororg = "IEEE; ACM",
  treatment = "A Application; P Practical",
}

@InProceedings{Hall:1991:ITP,
  author = "M. W. Hall and K. Kennedy and K. S. McKinley",
  title = "Interprocedural transformations for parallel code generation",
  crossref = "IEEE:1991:PSA",
  pages = "424--434",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6150C (Compilers, interpreters and other processors); C6150G (Diagnostic, testing, debugging and evaluating systems)",
  corpsource = "Dept. of Comput. Sci., Rice Univ., Houston, TX, USA",
  keywords = "compiler optimization; interprocedural transformations; loop parallelization; machine model; parallel code generation; parallel programming; parallelism-enhancing transformations; Perfect Benchmarks; performance evaluation; performance improvements; procedure calls; program compilers; scientific programs; shared-memory multiprocessor",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Beguelin:1991:GDT,
  author = "A. Beguelin and J. J. Dongarra and G. A. Geist and R. Manchek and V. S.
Sunderam",
  title = "Graphical development tools for network-based concurrent supercomputing",
  crossref = "IEEE:1991:PSA",
  pages = "435--444",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6115 (Programming support); C6180G (Graphical user interfaces)",
  corpsource = "Oak Ridge Nat. Lab., TN, USA",
  keywords = "application program; graphical development tools; graphical user interfaces; HeNCE; heterogeneous network computing environment; integrated graphical tools; network-based concurrent supercomputing; parallel programming; parallel programs; Parallel Virtual Machine; process management and communication; programming environments; PVM; software package; X-window-based software environment",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

%%% Beguelin:1991:GDT: corpsource uses the abbreviation ``Nat. Lab.'',
%%% spelled the same way as the other national-laboratory affiliations
%%% in this file.

@InProceedings{Plimpton:1991:SAR,
  author = "S. Plimpton and G. Mastin and D. Ghiglia",
  title = "Synthetic aperture radar image processing on parallel supercomputers",
  crossref = "IEEE:1991:PSA",
  pages = "446--452",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B6140C (Optical information and image processing); B6320 (Radar equipment, systems and applications); C5260B (Computer vision and picture processing); C7410F (Communications)",
  corpsource = "Sandia Nat. Labs., Albuquerque, NM, USA",
  keywords = "2-D FFTs; CM-2; computerised picture processing; fast Fourier transforms; nCUBE 2 hypercube; parallel processing; parallel supercomputers; performance data; phase gradient autofocusing; polar reformatter; radar applications; synthetic aperture radar image processing; telecommunications computing; uncompensated phase errors",
  sponsororg = "IEEE; ACM",
  treatment = "A Application; P Practical",
}

@InProceedings{Hotchkiss:1991:ASI,
  author = "R. S. Hotchkiss and C. L.
Wampler",
  title = "The auditorialization of scientific information",
  crossref = "IEEE:1991:PSA",
  pages = "453--461",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B6130 (Speech analysis and processing techniques); B6140 (Signal processing and detection); C5260 (Digital signal processing); C5585 (Speech recognition and synthesis)",
  corpsource = "Los Alamos Nat. Lab., NM, USA",
  keywords = "auditorialization; computerised signal processing; cryptography; encoding; encrypt; functional data; mathematical functions; scientific information; sequences of music; sound errors; speech analysis and processing; speech recognition",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

%%% Tamayo:1991:PAS: the company name in corpsource is written
%%% ``Thinking Machines Corp.'', the same spelling used by the
%%% Sabot:1991:CPE entry of this bibliography.

@InProceedings{Tamayo:1991:PAS,
  author = "P. Tamayo and J. P. Mesirov and B. M. Boghosian",
  title = "Parallel approaches to short range molecular dynamics simulations",
  crossref = "IEEE:1991:PSA",
  pages = "462--470",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A6120J (Computer simulation of static and dynamic behaviour); C4240P (Parallel programming and algorithm theory); C7320 (Physics and Chemistry)",
  corpsource = "Thinking Machines Corp., Cambridge, MA, USA",
  keywords = "coarse-grained cells; computational requirements; Connection Machine CM-2; linked lists; molecular dynamics method; parallel algorithms; parallel machines; performance evaluation; physics computing; short range molecular dynamics simulations; Verlet neighbor lists",
  sponsororg = "IEEE; ACM",
  treatment = "A Application; P Practical",
}

@InProceedings{Friedell:1991:VBM,
  author = "M. Friedell and M. LaPolla and S. Kochhar and S.
Sistare and J. Juda",
  title = "Visualizing the behavior of massively parallel programs",
  crossref = "IEEE:1991:PSA",
  pages = "472--480",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6115 (Programming support); C6150G (Diagnostic, testing, debugging and evaluating systems)",
  corpsource = "Harvard Univ., Cambridge, MA, USA",
  keywords = "behaviour visualization; computer-aided design system; conceptual framework; Connection Machine; debugging; integrated visualization environment; massively parallel programs; parallel programming; program debugging; program testing; programming environments; prototype system; SIMD programs; user-interaction paradigm",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

%%% Friedell:1991:VBM: the final author is entered as ``J. Juda''
%%% (initial first, surname last) so that BibTeX parses the initial
%%% and the surname as one person rather than as two separate names.

@InProceedings{Goldberg:1991:PDS,
  author = "A. J. Goldberg and J. L. Hennessy",
  title = "Performance debugging shared memory multiprocessor programs with {MTOOL}",
  crossref = "IEEE:1991:PSA",
  pages = "481--490",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6115 (Programming support); C6150G (Diagnostic, testing, debugging and evaluating systems); C6180G (Graphical user interfaces)",
  corpsource = "Stanford Univ., CA, USA",
  keywords = "graphical user interfaces; low overhead instrumentation; MTOOL; parallel programming; performance evaluation; performance losses; program debugging; shared memory parallel programs; Silicon Graphics multiprocessors; software tool; software tools; synchronisation; synchronization bottlenecks; time bottlenecks; window-based user interface",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Utter-Honig:1991:GAP,
  author = "S. Utter-Honig and C. M.
Pancake",
  title = "Graphical animation of parallel {Fortran} programs",
  crossref = "IEEE:1991:PSA",
  pages = "491--500",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6130B (Graphics techniques); C6150G (Diagnostic, testing, debugging and evaluating systems)",
  corpsource = "Cornell Nat. Supercomputer Facility, Cornell Univ., Ithaca, NY, USA",
  keywords = "computer animation; FORTRAN; hierarchically organized source code; lock/event synchronization; parallel Fortran programs; parallel programming; performance analysis; performance evaluation; PF-View; program behavior; software tools; synchronisation; textural trace information; tool; visualizing the behavior",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Chang:1991:SPP,
  author = "Yao-Jen Chang and J.-L. C. Wu and Jingshown Wu",
  title = "Scheduling parallel programs with non-uniform parallelism profiles",
  crossref = "IEEE:1991:PSA",
  pages = "502--511",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6150J (Operating systems)",
  corpsource = "Dept. of Electr. Eng., Nat. Taiwan Univ., Taipei, Taiwan",
  keywords = "databases; job turnaround time; multiprocessing systems; nonuniform parallelism profiles; operating system; parallel algorithms; parallel programming; parallel programs scheduling; parallelizing compilers; performance evaluation; processor allocation; scheduling; speedup; task graphs",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

%%% Ieumwananonthachai:1991:IMC: every author is written initials
%%% first, surname last, with one ``and'' between consecutive people,
%%% so the fourth author reads ``B. W. Wah''.

@InProceedings{Ieumwananonthachai:1991:IMC,
  author = "A. Ieumwananonthachai and A. N. Aizawa and S. R. Schwartz and B. W. Wah and J. C.
Yan",
  title = "Intelligent mapping of communicating processes in distributed computing systems",
  crossref = "IEEE:1991:PSA",
  pages = "512--521",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C1230 (Artificial intelligence); C4240 (Programming and algorithm theory); C6150N (Distributed systems)",
  corpsource = "Coord. Sci. Lab., Illinois Univ., Champaign, IL, USA",
  keywords = "automatically designing heuristics; communicating processes; computational complexity; distributed computing systems; distributed processing; heuristic programming; NP-hard; optimal routing of messages; post-game analysis; real-time systems; simulations; solution quality; statistical method; TEACHER 4.1",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Kodama:1991:LBF,
  author = "Y. Kodama and S. Sakai and Y. Yamaguchi",
  title = "Load balancing by function distribution on the {EM-4} prototype",
  crossref = "IEEE:1991:PSA",
  pages = "522--531",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing); C6150N (Distributed systems)",
  corpsource = "Electrotech. Lab., Ibaraki, Japan",
  keywords = "allocation functions; divide-and-conquer program; dynamic characteristics; EM-4; function distribution; game tree program; load balancing methods; local-minimum load; MLPE packets; parallel dataflow machine; parallel processing; performance evaluation; resource allocation",
  sponsororg = "IEEE; ACM",
  treatment = "X Experimental",
}

@InProceedings{Meindl:1991:GIG,
  author = "J. D.
Meindl",
  title = "Gigascale integration ({GSI}) technology",
  crossref = "IEEE:1991:PSA",
  pages = "534--538",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B1265 (Digital electronics); B2570 (Semiconductor integrated circuits); C5120 (Logic and switching circuits)",
  corpsource = "Rensselaer Polytech. Inst., Troy, NY, USA",
  keywords = "chip area; chip performance index; delays; gigascale integration; integrated circuit technology; macrovariables; minimum feature size; number of transistors per minimum feature area; power-delay product; reciprocal length versus delay; singular metric; switching operations; technological forecasting; transmission operations; VLSI",
  sponsororg = "IEEE; ACM",
  treatment = "G General Review",
}

@InProceedings{Willen:1991:EGP,
  author = "D. E. Willen",
  title = "Exploration geophysics, parallel computing and reality",
  crossref = "IEEE:1991:PSA",
  pages = "540--??",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9130R (Explosion seismology); A9365 (Data acquisition, processing and storage); A9385 (Instrumentation and techniques for geophysical, hydrospheric and lower atmosphere research); C5440 (Multiprocessor systems and techniques); C7340 (Geophysics)",
  corpsource = "EXXON Production Research Co., Houston, TX, USA",
  keywords = "complex near surface; density effects; elastic effects; exploration geophysics; geophysical prospecting; geophysics computing; inverse problems; layered Earth approximations; parallel processing; seismic data; seismology; structured models; TeraFLOPS; TFLOPS; traveltime calculations; wave propagation",
  sponsororg = "IEEE; ACM",
  treatment = "G General Review",
}

@InProceedings{Rutledge:1991:AIL,
  author = "J. M. Rutledge and D. R. Jones and W. H. Chen and E. Y.
Chung",
  title = "Application issues for large scale reservoir simulation on massively parallel computers",
  crossref = "IEEE:1991:PSA",
  pages = "541--??",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9385 (Instrumentation and techniques for geophysical, hydrospheric and lower atmosphere research); C5440 (Multiprocessor systems and techniques); C6150N (Distributed systems); C7340 (Geophysics); C7450 (Chemical engineering)",
  keywords = "chemical engineering computing; computational speed; distributed memory machines; geophysics computing; indirect addressing; intensive computational needs; large scale reservoir simulation; linear equation solver; load balancing; massively parallel computers; oil technology; parallel processing; petroleum reservoir models; resource allocation; robustness; shared memory computers; unit stride; vector supercomputers",
  sponsororg = "IEEE; ACM",
  treatment = "G General Review",
}

@InProceedings{Kendall:1991:LSR,
  author = "R. P. Kendall and J. R. Wallis and J. A. Foster and J. S. Nolen",
  title = "Large scale reservoir simulation in the concurrent processing milieu",
  crossref = "IEEE:1991:PSA",
  pages = "542--??",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C7340 (Geophysics); C7450 (Chemical engineering)",
  keywords = "chemical engineering computing; concurrent processing milieu; fine granularity; geophysics computing; numerical reservoir simulation; oil technology; parallel processing; performance gains; simulation technology",
  sponsororg = "IEEE; ACM",
  treatment = "G General Review",
}

@InProceedings{Smith:1991:VCC,
  author = "L. L.
Smith",
  title = "Vectorizing {C} compilers: how good are they?",
  crossref = "IEEE:1991:PSA",
  pages = "544--553",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6140D (High level languages); C6150C (Compilers, interpreters and other processors)",
  corpsource = "Supercomputing Res. Center, Bowie, MD, USA",
  keywords = "automatic vectorization; C language; C loop kernels; Convex Application Compiler; Convex cc compiler; Cray 2 scc compiler; Cray YMP scc compiler; parallel programming; pipeline processing; program compilers; program testing; vectorizing C compilers",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; X Experimental",
}

@InProceedings{Glen:1991:CMH,
  author = "R. R. Glen and D. V. Pryor and J. M. Conroy and T. Johnson",
  title = "Characterizing memory hot spots in a shared memory {MIMD} machine",
  crossref = "IEEE:1991:PSA",
  pages = "554--566",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5220P (Parallel architecture); C5440 (Multiprocessor systems and techniques); C6150N (Distributed systems)",
  corpsource = "Supercomputing Res. Center, Bowie, MD, USA",
  keywords = "bistability; critical section; first come/first serve queuing mechanism; massively parallel MIMD computers; memory hot spot; memory stride; multiprocessing systems; pseudorandom interleaving; separate memory accesses; shared memory locations; shared memory MIMD machine; split transaction; storage management; supercomputers; threads; throughput prediction",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; T Theoretical or Mathematical",
}

@InProceedings{Miller:1991:IOB,
  author = "E. L. Miller and R. H.
Katz",
  title = "Input\slash output behavior of supercomputing applications",
  crossref = "IEEE:1991:PSA",
  pages = "567--576",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques); C6150N (Distributed systems)",
  corpsource = "Dept. of Electr. Eng. and Comput. Sci., California Univ., Berkeley, CA, USA",
  keywords = "access pattern; buffer storage; bursty I/O request pattern; caching simulations; CPU utilization; Cray computers; Cray Y-MP CPU; digital simulation; file cache; file references; input-output programs; parallel processing; read-ahead; solid-state disk; storage management; supercomputer I/O traces; write-behind",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; X Experimental",
}

%%% Chronopoulos:1991:TEP: corpsource uses the abbreviation
%%% ``Dept. of Comput. Sci.'' (period after ``Comput''), as in the
%%% other departmental affiliations of this bibliography.

@InProceedings{Chronopoulos:1991:TEP,
  author = "A. T. Chronopoulos",
  title = "Towards efficient parallel implementation of the {CG} method applied to a class of block tridiagonal linear systems",
  crossref = "IEEE:1991:PSA",
  pages = "578--587",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4140 (Linear algebra); C4170 (Differential equations); C4240P (Parallel programming and algorithm theory); C5220P (Parallel architecture)",
  corpsource = "Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA",
  keywords = "block tridiagonal linear systems; conjugate gradient methods; CRAY-2; elliptic partial differential equation; Hypercube parallel computers; memory hierarchy; message passing private memory machines; parallel algorithms; parallel architectures; parallel machines; parameterized vector architecture; partial differential equations; shared memory machines; vector processors",
  sponsororg = "IEEE; ACM",
  treatment = "X Experimental",
}

@InProceedings{Pommerell:1991:PIL,
  author = "C. Pommerell and W.
Fichtner",
  title = "{PILS}: an iterative linear solver package for ill-conditioned systems",
  crossref = "IEEE:1991:PSA",
  pages = "588--599",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4140 (Linear algebra); C7310 (Mathematics)",
  corpsource = "Integrated Syst. Lab., ETH, Zurich, Switzerland",
  keywords = "equation solution; ill-conditioned systems; iterative linear solver package; linear algebra; linear equations; mathematics computing; multidimensional solution; ordering; partial differential equations; PILS; preconditioning; production; software implementation; software package; software packages",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; T Theoretical or Mathematical",
}

@InProceedings{Malard:1991:TPD,
  author = "J. Malard",
  title = "Threshold pivoting for dense {LU} factorization on distributed memory multiprocessor",
  crossref = "IEEE:1991:PSA",
  pages = "600--607",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4140 (Linear algebra); C4240P (Parallel programming and algorithm theory)",
  corpsource = "Sch. of Comput. Sci., McGill Univ., Montreal, Que., Canada",
  keywords = "block column wrapping; dense LU factorization; distributed memory multiprocessor; matrix algebra; multicasts; parallel algorithms; parallel programming; row wrapping",
  sponsororg = "IEEE; ACM",
  treatment = "X Experimental",
}

@InProceedings{Hummel:1991:FPR,
  author = "S. F. Hummel and E. Schonberg and L. E. Flynn",
  title = "Factoring: a practical and robust method for scheduling parallel loops",
  crossref = "IEEE:1991:PSA",
  pages = "610--619",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6150C (Compilers, interpreters and other processors)",
  corpsource = "CRI, Ecole Nat.
Sup{\'e}rieure des Mines de Paris, Fontainebleau, France",
  keywords = "factoring; guided self-scheduling; independent iterations; optimal finishing time; parallel languages; parallel programming; parallel-loop characteristics; program compilers; PTRAN restructuring compiler; resource allocation; RP3 runtime system; scheduling; scheduling parallel loops; static chunking",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; X Experimental",
}

@InProceedings{Chen:1991:ESD,
  author = "D.-K. Chen and P.-C. Yew",
  title = "An empirical study on {DOACROSS} loops",
  crossref = "IEEE:1991:PSA",
  pages = "620--632",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6150C (Compilers, interpreters and other processors)",
  corpsource = "Center for Supercomput. Res. and Dev., Illinois Univ., Urbana, IL, USA",
  keywords = "concurrent DOACROSS loop execution; cross-iteration dependences; digital simulation; execution-driven simulation; KAP; MaxPar; optimizing compilers; parallel machines; parallel programming; parallelizing compiler; program compilers",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; X Experimental",
}

@InProceedings{Yang:1991:FSS,
  author = "T. Yang and A. Gerasoulis",
  title = "A fast static scheduling algorithm for {DAGs} on an unbounded number of processors",
  crossref = "IEEE:1991:PSA",
  pages = "633--642",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C1160 (Combinatorial mathematics); C4240P (Parallel programming and algorithm theory); C6110P (Parallel programming); C6150N (Distributed systems)",
  corpsource = "Dept. of Comput.
Sci., Rutgers Univ., New Brunswick, NJ, USA",
  keywords = "coarse tree graphs; communication overhead; completely connected processors; computational complexity; DAG; DAGs; directed acyclic task graphs; directed graphs; dominant sequences clustering; fork; heuristic algorithm; join; parallel algorithms; parallel programming; parallel time; scheduling; static scheduling algorithm",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; T Theoretical or Mathematical",
}

%%% Qiao:1991:TOC: NOTE(review): the second author's surname is
%%% entered as ``Melhem'' (R. G. Melhem); confirm the spelling against
%%% the printed proceedings.

@InProceedings{Qiao:1991:TOC,
  author = "C. Qiao and R. G. Melhem",
  title = "Time-division optical communications in multiprocessor arrays",
  crossref = "IEEE:1991:PSA",
  pages = "644--653",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B6150C (Switching theory); B6260 (Optical links and equipment); C4230M (Multiprocessor interconnection); C5440 (Multiprocessor systems and techniques); C6150N (Distributed systems)",
  corpsource = "Dept. of Comput. Sci., Pittsburgh Univ., PA, USA",
  keywords = "clock distribution method; high communication bandwidth; message pipelining; multiprocessing systems; multiprocessor arrays; optical communication; optical signal transmission; optical waveguides; predictable propagation delays; synchronisation; synchronization; time division multiplexing; time-division multiplexing; unidirectional propagation",
  sponsororg = "IEEE; ACM",
  treatment = "T Theoretical or Mathematical",
}

@InProceedings{Felperin:1991:FRP,
  author = "S. A. Felperin and L. Gravano and G. D. Pifarre and J. C. L.
Sanz",
  title = "Fully-adaptive routing: packet switching performance and wormhole algorithms",
  crossref = "IEEE:1991:PSA",
  pages = "654--663",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B6150C (Switching theory); C4230M (Multiprocessor interconnection); C5220P (Parallel architecture); C5470 (Performance evaluation and testing)",
  keywords = "deadlock-free adaptive routing; fully adaptive minimal worm-hole routing algorithm; hypercube; injection models; latency; livelock-free adaptive routing; mesh; packet switching; packet switching performance; parallel architectures; performance evaluation; saturation point; simulation study; telecommunication traffic; throughput; traffic models; wormhole algorithms",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; X Experimental",
}

@InProceedings{Kung:1991:NME,
  author = "H. T. Kung and R. Sansom and S. Schlick and P. Steenkiste and M. Arnould and F. J. Bitz and F. Christianson and E. C. Cooper and {\"O}. Menzilcio{\u{g}}lu and D. Ombres and B. Zill",
  title = "Network-based multicomputers: an emerging parallel architecture",
  crossref = "IEEE:1991:PSA",
  pages = "664--673",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5220P (Parallel architecture); C5440 (Multiprocessor systems and techniques); C5620 (Computer networks and techniques)",
  corpsource = "Sch. of Comput. Sci., Carnegie Mellon Univ., Pittsburgh, PA, USA",
  keywords = "computer networks; copy operations; high bandwidth; high-speed crossbar switches; host interrupts; host-network interface overhead; low latency; multicomputer applications; multiprocessing systems; Nectar; network-based multicomputers; parallel architecture; parallel architectures; protocol; system-specific interconnects",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; X Experimental",
}

@InProceedings{Chervin:1991:CMP,
  author = "R.
Chervin",
  title = "Climate modeling with parallel vector supercomputers",
  crossref = "IEEE:1991:PSA",
  pages = "677--??",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9260B (General circulation); A9260S (Climatology); A9365 (Data acquisition, processing and storage); C7340 (Geophysics)",
  corpsource = "Nat. Center for Atmos. Res., Boulder, CO, USA",
  keywords = "atmospheric movements; climate modeling; climatology; global atmospheric models; global climate system; model performance enhancement; National Center for Atmospheric Research; NCAR; ocean models; parallel processing; parallel vector supercomputers; performance evaluation; reduced execution time",
  sponsororg = "IEEE; ACM",
  treatment = "G General Review",
}

@InProceedings{Dannevik:1991:CMM,
  author = "W. Dannevik",
  title = "Computing modeling in a {MIMD} environment",
  crossref = "IEEE:1991:PSA",
  pages = "678--??",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9210D (Dynamics of the deep ocean); A9210F (Dynamics of the upper ocean); A9260B (General circulation); A9260S (Climatology); A9365 (Data acquisition, processing and storage); C6110P (Parallel programming); C7340 (Geophysics)",
  corpsource = "Lawrence Livermore Nat.
Lab., CA, USA",
  keywords = "1D domain decomposition; 2D decomposition; atmospheric circulation model; atmospheric movements; BBN TC2000 MIMD system; climate model numerical algorithms; climatology; data structure definition; distributed-memory programming models; finite difference models; general circulation models; geophysics computing; load-balancing; message-passing paradigms; MIMD environment; oceanography; parallel efficiency; parallel processing; Semtner-Chervin ocean circulation model; shared-memory programming model; spatial resolution; time-advance algorithm selection",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical; T Theoretical or Mathematical",
}

@InProceedings{Smith:1991:OMC,
  author = "R. D. Smith and J. K. Dukowicz and R. C. Malone",
  title = "Ocean modeling on the {Connection Machine}",
  crossref = "IEEE:1991:PSA",
  pages = "679--??",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9210D (Dynamics of the deep ocean); A9210F (Dynamics of the upper ocean); A9260B (General circulation); A9365 (Data acquisition, processing and storage); C6110P (Parallel programming); C7340 (Geophysics)",
  corpsource = "Los Alamos Nat. Lab., NM, USA",
  keywords = "3D primitive equations; 4-processor XMP; coastal topography; Connection Machine; data structure; DOE CHAMMP program; geophysics computing; global ocean model; longitude-depth slab; Los Alamos CM-2 Connection Machine; ocean-bottom topography; oceanography; parallel processing; Semtner-Chervin ocean model; stratified fluid flow; surface-pressure formulation",
  sponsororg = "IEEE; ACM",
  treatment = "T Theoretical or Mathematical; X Experimental",
}

@InProceedings{Chiueh:1991:IMM,
  author = "T.-C.
Chiueh",
  title = "An integrated memory management scheme for dynamic alias resolution",
  crossref = "IEEE:1991:PSA",
  pages = "682--691",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5220P (Parallel architecture); C5440 (Multiprocessor systems and techniques); C6150J (Operating systems); C6150N (Distributed systems)",
  corpsource = "Dept. of Electr. Eng. and Comput. Sci., California Univ., Berkeley, CA, USA",
  keywords = "indirect resolution; integrated memory management; machine cycle time; memory mapped register; multiprocessor configurations; on-chip data cache; pipeline depth; processor registers; storage allocation; storage management; tagged register",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

%%% Corporal:1991:MFH: the first author is written ``H. Corporal''
%%% without an enclosing brace group, so that BibTeX splits the name
%%% into initial and surname like every other author in this file.

@InProceedings{Corporal:1991:MFH,
  author = "H. Corporal and H. Mulder",
  title = "{MOVE}: a framework for high-performance processor design",
  crossref = "IEEE:1991:PSA",
  pages = "692--701",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5220P (Parallel architecture)",
  corpsource = "Dept. of Electr. Eng., Delft Univ. of Technol., Netherlands",
  keywords = "configurable; data operations; data transport; hardware organization; hardware utilization; high-performance processors; instruction-level-parallelism; MOVE; parallel architectures; pipeline processing; pipelining; scalable; short cycle implementations",
  sponsororg = "IEEE; ACM",
  treatment = "P Practical",
}

@InProceedings{Bird:1991:SPP,
  author = "P. L. Bird and U. F. Pleban",
  title = "A semantics-directed partitioning of a processor architecture",
  crossref = "IEEE:1991:PSA",
  pages = "702--709",
  year = "1991",
  bibdate = "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4210 (Formal logic); C4240 (Programming and algorithm theory); C5220P (Parallel architecture)",
  corpsource = "Adv. Comput. Res.
Inst., Lyon, France", keywords = "action semantics; computer architecture; decoupled address generation; decoupled control activity; denotational semantics; formal languages; formal semantic model; MISD machine; parallel architectures; processor architecture; programming language semantics; programming theory; semantics partitioning; semantics-directed partitioning", sponsororg = "IEEE; ACM", treatment = "P Practical", } @InProceedings{Zagha:1991:RSV, author = "M. Zagha and G. E. Blelloch", title = "Radix sort for vector multiprocessors", crossref = "IEEE:1991:PSA", pages = "712--721", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4240P (Parallel programming and algorithm theory); C6110P (Parallel programming); C6130 (Data handling techniques)", corpsource = "Sch. of Comput. Sci., Carnegie Mellon Univ., Pittsburgh, PA, USA", keywords = "Cray computers; CRAY-Y-MP; data-parallel algorithm; parallel algorithms; pipeline processing; radix sort algorithm; sorting; vector multiprocessors", sponsororg = "IEEE; ACM", treatment = "P Practical", } @InProceedings{Kanada:1991:MVP, author = "Y. 
Kanada", title = "A method of vector processing for shared symbolic data", crossref = "IEEE:1991:PSA", pages = "722--731", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4210 (Formal logic); C4240P (Parallel programming and algorithm theory); C6120 (File organisation)", corpsource = "Hitachi Ltd., Tokyo, Japan", keywords = "address calculation sorting; data structures; dynamic data structures; filtering-overwritten-label method; graphs; hash table; Hitachi S-810; lists; multiple processings; parallel algorithms; parallel programming; parallel rewriting; programming theory; rewriting systems; shared elements; shared symbolic data; symbolic processing algorithms; trees; vector processing", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical", } @InProceedings{Alnuweiri:1991:OBV, author = "H. M. Alnuweiri", title = "Optimal bounded-degree {VLSI} networks for sorting in a constant number of rounds", crossref = "IEEE:1991:PSA", pages = "732--739", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "B2570 (Semiconductor integrated circuits); C4230M (Multiprocessor interconnection); C4240P (Parallel programming and algorithm theory); C6130 (Data handling techniques)", corpsource = "Dept. of Electr. Eng., British Columbia Univ., Vancouver, BC, Canada", keywords = "bounded-degree VLSI networks; computational complexity; enumeration-sort; I/O pins; index-mapping methodology; multiple chip networks; multiprocessor interconnection networks; optimal VLSI sorters; parallel programming; partitioning; programming theory; reduced-area shuffle networks; rotate-sort; sorting; VLSI", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical", } @InProceedings{Theobald:1991:EPA, author = "K. B. Theobald and G. R. 
Gao", title = "An efficient parallel algorithm for all pairs examination", crossref = "IEEE:1991:PSA", pages = "742--753", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C1110 (Algebra); C4140 (Linear algebra); C4240P (Parallel programming and algorithm theory)", corpsource = "Sch. of Comput. Sci., McGill Univ., Montreal, Que., Canada", keywords = "all pairs examination; automorphic transformations; communication steps; computational complexity; group theory; linear feedback shift registers; matrix algebra; network traffic; parallel algorithm; parallel algorithms; permutation groups; processor time; run-time overhead", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical", } @InProceedings{Woo:1991:PPF, author = "M.-l. Woo and R. A. Renaut", title = "Parallel power-of-two {FFTs} on hypercubes", crossref = "IEEE:1991:PSA", pages = "754--763", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4190 (Other numerical methods); C4230M (Multiprocessor interconnection); C4240P (Parallel programming and algorithm theory)", corpsource = "Dept. of Math., Arizona State Univ., Tempe, AZ, USA", keywords = "computational complexity; distance one algorithm; distance two algorithm; fast Fourier transforms; hypercube architectures; hypercube networks; interprocessor communications; ordered power-of-two fast Fourier transforms; packet transmission; parallel algorithms; parallel power of two FFTs; time complexity", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical", } @InProceedings{Narayanan:1991:ARD, author = "P. J. 
Narayanan", title = "Analysis of replicated data algorithms on processor array architectures", crossref = "IEEE:1991:PSA", pages = "764--773", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C1250 (Pattern recognition); C4230M (Multiprocessor interconnection); C4240P (Parallel programming and algorithm theory)", corpsource = "Dept. of Comput. Sci., Maryland Univ., College Park, MD, USA", keywords = "3-D mesh; array interconnection networks; computerised picture processing; data parallelism; data replication; hypercube connected connection machine; image processing algorithms; multiprocessor interconnection networks; nonglobal architectures; operation parallelism; parallel algorithms; processor array architectures; replicated data algorithms", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical; X Experimental", } @InProceedings{Tzeng:1991:DHR, author = "N.-F. Tzeng", title = "Design of a highly reliable cube-connected cycles architecture", crossref = "IEEE:1991:PSA", pages = "776--785", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4230M (Multiprocessor interconnection); C5220P (Parallel architecture); C5470 (Performance evaluation and testing)", corpsource = "Center for Adv. Comput. Studies, Univ. of Southwestern Louisiana, Lafayette, LA, USA", keywords = "area overhead; cross connections; fault tolerant computing; fault tolerant cube connected cycles architecture; multiprocessor interconnection networks; parallel architectures; processing element; reconfiguration procedure; reliable cube-connected cycles architecture; XCCC layout", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical", } @InProceedings{Taylor:1991:TFA, author = "V. E. Taylor and A. Ranade and D. G. 
Messerschmitt", title = "Three-dimensional finite-element analyses: implications for computer architectures", crossref = "IEEE:1991:PSA", pages = "786--795", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4140 (Linear algebra); C4185 (Finite element analysis); C4240P (Parallel programming and algorithm theory); C5220P (Parallel architecture); C6110P (Parallel programming); C6120 (File organisation)", corpsource = "Dept. of Electr. Eng. and Comput. Sci., California Univ., Berkeley, CA, USA", keywords = "columns; computer architectures; data path design; data structure; data structures; finite element analysis; floating-point units; matrix algebra; memory bandwidth; parallel architectures; parallel programming; programming theory; rows; sparse matrices; sparsity pattern", sponsororg = "IEEE; ACM", treatment = "P Practical; T Theoretical or Mathematical", } @InProceedings{Tomkins:1991:MPC, author = "J. L. Tomkins and J. P. VanDyke", title = "Massively parallel computing and the mid-course tracking problem", crossref = "IEEE:1991:PSA", pages = "796--804", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C6110P (Parallel programming); C7150 (Military)", corpsource = "Sandia Nat. Labs., Albuquerque, NM, USA", keywords = "Cray X-MP single processor; massively parallel MIMD computing; mid-course tracking problem; military computing; nCUBE/ten computer; parallel programming; real-time solution; real-time systems; SDI; strategic defence initiative; TRC code", sponsororg = "IEEE; ACM", treatment = "P Practical", } @InProceedings{Bucher:1991:MMA, author = "I. Y. Bucher and M. L. 
Simmons", title = "Measurement of memory access contentions in multiple vector processor systems", crossref = "IEEE:1991:PSA", pages = "806--817", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C1140C (Queueing theory); C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing); C6150C (Compilers, interpreters and other processors)", corpsource = "Los Alamos Nat. Lab., NM, USA", keywords = "active processors; CRAY X-MP; CRAY Y-MP; CRAY-2; dynamic memory; memory access conflicts; memory bank conflicts; mixed strides; multiple vector processor systems; parallel machines; performance evaluation; program compilers; queueing theory; queuing model; static memory; stride one; vector length; vector loop unrolling; vector operations; vector performance", sponsororg = "IEEE; ACM", treatment = "P Practical; T Theoretical or Mathematical", } @InProceedings{Chen:1991:CAS, author = "Y.-C. Chen and A. V. Veidenbaum", title = "Comparison and analysis of software and directory coherence schemes", crossref = "IEEE:1991:PSA", pages = "818--829", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C6110P (Parallel programming); C6120 (File organisation); C6185 (Simulation techniques)", corpsource = "Center for Supercomputing Res. and Dev., Illinois Univ., Urbana, IL, USA", keywords = "buffer storage; cache coherence problem; digital simulation; directory coherence; false sharing; hit ratio; MIN- based large-scale multiprocessor system; multiprocessor interconnection networks; nontrivial cache line size; parallel programming; performance; performance evaluation; shared memory traffic; software; storage management; trace-driven simulation", sponsororg = "IEEE; ACM", treatment = "P Practical", } @InProceedings{Ahmad:1991:PPD, author = "I. Ahmad and A. Ghafor and K. 
Mehrotra", title = "Performance prediction of distributed load balancing on multicomputer systems", crossref = "IEEE:1991:PSA", pages = "830--839", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C1140C (Queueing theory); C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing)", corpsource = "Sch. of Comput. and Inf. Sci., Syracuse Univ., NY, USA", keywords = "analytical models; average execution queue length; central server open queuing network; local execution; multicomputer systems; multiprocessing systems; newly arrived task; performance evaluation; performance prediction; probability; queueing theory; queuing parameters; response time; sender-initiated distributed load balancing strategies; simulation models; statistical analysis", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical; X Experimental", } @InProceedings{Su:1991:EDE, author = "H.-M. Su and P.-C. Yew", title = "Efficient {Doacross} execution on distributed shared-memory multiprocessors", crossref = "IEEE:1991:PSA", pages = "842--853", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4240P (Parallel programming and algorithm theory); C6110P (Parallel programming); C6120 (File organisation); C6150C (Compilers, interpreters and other processors)", corpsource = "Center for Supercomput. Res. 
and Dev., Illinois Univ., Urbana, IL, USA", keywords = "buffer location; compile time; compiler algorithms; direct communication; distributed shared-memory multiprocessors; Doacross execution; Doacross loop; DSM architecture; message buffers; nearest shared memory; parallel algorithms; parallel programming; program compilers; programming theory; static message passing; storage management; UMA architecture; uniform memory access", sponsororg = "IEEE; ACM", treatment = "P Practical; T Theoretical or Mathematical", } @InProceedings{Granston:1991:DRA, author = "E. D. Granston and A. V. Veidenbaum", title = "Detecting redundant accesses to array data", crossref = "IEEE:1991:PSA", pages = "854--865", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4240P (Parallel programming and algorithm theory); C6110P (Parallel programming); C6120 (File organisation); C6150C (Compilers, interpreters and other processors)", corpsource = "Center for Supercomputing Res. and Dev., Illinois Univ., Urbana, IL, USA", keywords = "compile-time algorithm; conditionals; dependence analysis; flow analysis; flow equations; interval-analysis; parallel algorithms; parallel constructs; parallel programming; program compilers; programming theory; redundancy analysis; redundant global memory accesses; redundant reference; storage management; vector constructs", sponsororg = "IEEE; ACM", treatment = "P Practical; T Theoretical or Mathematical", } @InProceedings{Venugopal:1991:EPS, author = "S. Venugopal and V. K. Naik", title = "Effects of partitioning and scheduling sparse matrix factorization on communication and load balance", crossref = "IEEE:1991:PSA", pages = "866--875", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C4140 (Linear algebra); C4240P (Parallel programming and algorithm theory)", corpsource = "Dept. of Comput. 
Sci., Rutgers Univ., New Brunswick, NJ, USA", keywords = "communication; distributed memory systems; Harwell- Boeing data set; load balance; load imbalance; matrix algebra; parallel algorithms; partitioning; scheduling; scheduling sparse matrix factorization; wrap-mapped column assignment", sponsororg = "IEEE; ACM", treatment = "X Experimental", } @InProceedings{Myers:1991:MSR, author = "T. Myers and E. Williams", title = "Mass storage requirements in the intelligence community", crossref = "IEEE:1991:PSA", pages = "878--889", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C5320 (Digital storage); C6110 (Systems analysis and programming)", corpsource = "Dept. of Defense, Ft. Meade, MD, USA", keywords = "digital storage; intelligence community; mass storage systems; research and development; systems analysis", sponsororg = "IEEE; ACM", treatment = "G General Review", } @InProceedings{Bowen:1991:VMT, author = "N. S. Bowen and D. K. Pradhan", title = "A virtual memory translation mechanism to support checkpoint and rollback recovery", crossref = "IEEE:1991:PSA", pages = "890--899", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C5470 (Performance evaluation and testing); C6120 (File organisation)", corpsource = "IBM Thomas J. Watson Res. Center, Yorktown Heights, NY, USA", keywords = "address space; checkpoint interval size; checkpoint recovery; fault tolerant computing; rollback recovery; supercomputer applications; virtual memory translation; virtual storage", sponsororg = "IEEE; ACM", treatment = "T Theoretical or Mathematical; X Experimental", } @InProceedings{Annaratone:1991:KDM, author = "M. Annaratone and M. Fillo and M. Halbherr and R. Ruhl and Steiner and P. and M. 
Viredaz", title = "The {K2} distributed memory parallel processor: architecture, compiler and operating system", crossref = "IEEE:1991:PSA", pages = "900--909", year = "1991", bibdate = "Wed Apr 15 16:28:01 MDT 1998", acknowledgement = ack-nhfb, classification = "C5220P (Parallel architecture); C5440 (Multiprocessor systems and techniques); C6110P (Parallel programming); C6150C (Compilers, interpreters and other processors); C6150J (Operating systems); C6150N (Distributed systems)", corpsource = "Swiss Federal Inst. of Technol., Zurich, Switzerland", keywords = "architecture; K2 distributed memory parallel processor; multi tasking operating system; multi user operating system; multiprogramming; operating systems (computers); parallel architectures; parallel machines; parallel programming; parallelizing compiler; program compilers; time-sharing operating system; workbench machine", sponsororg = "IEEE; ACM", treatment = "P Practical", } %%% ==================================================================== %%% These entries must occur last because they are cross-referenced by %%% entries above. @Proceedings{IEEE:1991:PSA, editor = "{IEEE}", booktitle = "Proceedings, Supercomputing '91: Albuquerque, New Mexico, November 18--22, 1991", title = "Proceedings, Supercomputing '91: Albuquerque, New Mexico, November 18--22, 1991", publisher = pub-IEEE, address = pub-IEEE:adr, pages = "xxiii + 917", year = "1991", ISBN = "0-8186-9158-1 (IEEE case), 0-8186-2158-3 (IEEE paper), 0-8186-6158-5 (IEEE microfiche), 0-89791-459-7 (ACM)", ISBN-13 = "978-0-8186-9158-4 (IEEE case), 978-0-8186-2158-1 (IEEE paper), 978-0-8186-6158-7 (IEEE microfiche), 978-0-89791-459-8 (ACM)", LCCN = "QA76.5 .S894 1991", bibdate = "Fri Aug 30 08:01:51 MDT 1996", bibsource = "University of California MELVYL catalog.", note = "ACM order number 415913. IEEE Computer Society Press order number 2158. 
IEEE catalog number 91CH3058-5.", acknowledgement = ack-nhfb, classification = "C5440 (Multiprocessor systems and techniques); C5470 (Performance evaluation and testing); C6110P (Parallel programming)", keywords = "combinatorial algorithms; data dependence; distributed memory code generation; high school environment; latency tolerance; memory access; numerical algorithms; parallel processing; parallel programming; performance evaluation; performance tools; processor design; program analysis; storage hierarchy optimization; supercomputer benchmarks; supercomputer congresses; supercomputing; system issues", }