%%% -*-BibTeX-*-
%%% ====================================================================
%%% BibTeX-file{
%%% author = "Nelson H. F. Beebe",
%%% version = "1.04",
%%% date = "25 October 2010",
%%% time = "17:27:12 MDT",
%%% filename = "supercomputing91.bib",
%%% address = "University of Utah,
%%% Department of Mathematics, 110 LCB,
%%% 155 S 1400 E RM 233,
%%% Salt Lake City, UT 84112-0090,
%%% USA",
%%% telephone = "+1 801 581 5254",
%%% FAX = "+1 801 581 4148",
%%% URL = "http://www.math.utah.edu/~beebe",
%%% checksum = "13008 2282 10580 106056",
%%% email = "beebe at math.utah.edu, beebe at acm.org,
%%% beebe at ieee.org (Internet)",
%%% codetable = "ISO/ASCII",
%%% keywords = "bibliography, BibTeX, Supercomputing '91",
%%% license = "public domain",
%%% supported = "yes",
%%% docstring = "This is a complete bibliography of papers
%%% published in the proceedings of
%%% Supercomputing '91.
%%%
%%% The organizers of this conference series
%%% maintain a World-Wide Web site at
%%%
%%% http://www.supercomp.org/
%%%
%%% where pointers to Web pages for the
%%% conferences from 1994 to date may be found.
%%%
%%% At version 1.04, the year coverage looked
%%% like this:
%%%
%%% 1991 ( 92)
%%%
%%% InProceedings: 91
%%% Proceedings: 1
%%%
%%% Total entries: 92
%%%
%%% This bibliography was prepared from data
%%% collected from major library catalogs, from
%%% the IEEE INSPEC database, and from the TeX
%%% User Group bibliography archive.
%%%
%%% In this bibliography, entries are sorted in
%%% publication order, using ``bibsort
%%% -byvolume''.
%%%
%%% The checksum field above contains a CRC-16
%%% checksum as the first value, followed by the
%%% equivalent of the standard UNIX wc (word
%%% count) utility output of lines, words, and
%%% characters. This is produced by Robert
%%% Solovay's checksum utility.",
%%% }
%%% ====================================================================
%%% ====================================================================
%%% Acknowledgement abbreviations:
@String{ack-nhfb = "Nelson H. F. Beebe,
                    University of Utah,
                    Department of Mathematics, 110 LCB,
                    155 S 1400 E RM 233,
                    Salt Lake City, UT 84112-0090, USA,
                    Tel: +1 801 581 5254,
                    FAX: +1 801 581 4148,
                    e-mail: \path|beebe@math.utah.edu|,
                            \path|beebe@acm.org|,
                            \path|beebe@ieee.org| (Internet),
                    URL: \path|http://www.math.utah.edu/~beebe/|"}
%%% ====================================================================
%%% Publishers and their addresses:
@String{pub-IEEE                = "IEEE Computer Society Press"}
@String{pub-IEEE:adr            = "1109 Spring Street, Suite 300,
                                  Silver Spring, MD 20910, USA"}
%%% ====================================================================
%%% Bibliography entries.
@InProceedings{Pugh:1991:OTF,
  author =       "W. Pugh",
  title =        "The {Omega} test: a fast and practical integer
                 programming algorithm for dependence analysis",
  crossref =     "IEEE:1991:PSA",
  pages =        "4--13",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C1180 (Optimisation techniques); C4240 (Programming
                 and algorithm theory); C6150G (Diagnostic, testing,
                 debugging and evaluating systems)",
  corpsource =   "Dept. of Comput. Sci., Maryland Univ., College Park,
                 MD, USA",
  keywords =     "approximate algorithms; array references;
                 computational complexity; dependence analysis;
                 Fourier-Motzkin variable elimination; integer
                 programming; integer programming algorithm; Omega test;
                 polynomial time complexity; production compilers;
                 program testing; worst-case exponential time
                 complexity",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Loeliger:1991:PTT,
  author =       "J. Loeliger and R. Metzger and M. Seligman and S.
                 Stroud",
  title =        "Pointer target tracking --- an empirical study",
  crossref =     "IEEE:1991:PSA",
  pages =        "14--23",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6150C (Compilers, interpreters and other
                 processors)",
  keywords =     "C-series supercomputers; language-independent
                 interprocedural optimizer; pointer target tracking;
                 program compilers",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Mellor-Crummey:1991:ODD,
  author =       "J. Mellor-Crummey",
  title =        "On-the-fly detection of data races for programs with
                 nested fork-join parallelism",
  crossref =     "IEEE:1991:PSA",
  pages =        "24--33",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5640 (Protocols); C6110P (Parallel programming);
                 C6150G (Diagnostic, testing, debugging and evaluating
                 systems)",
  corpsource =   "Center for Res. on Parallel Comput., Rice Univ.,
                 Houston, TX, USA",
  keywords =     "data races for programs; debugging; dynamic nesting;
                 monitored program execution; nested fork-join
                 parallelism; on-the-fly detection; parallel constructs;
                 parallel programming; program debugging; program
                 testing; protocol; protocols; run-time detection;
                 shared-memory programs; worst-case run-time overhead",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Picano:1991:PCE,
  author =       "S. Picano and Brooks, III, E. D. and J. E. Hoag",
  title =        "Programming costs of explicit memory localization on a
                 large scale shared memory multiprocessor",
  crossref =     "IEEE:1991:PSA",
  pages =        "36--45",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques);
                 C6110P (Parallel programming); C6120 (File
                 organisation)",
  corpsource =   "Sch. of Electr. Eng., Purdue Univ., West Lafayette,
                 IN, USA",
  keywords =     "BBN TC2000; buffer storage; explicit memory
                 localization; large scale shared memory multiprocessor;
                 MIMD parallel computer; multiprocessing systems;
                 network simulation program; parallel programming;
                 performance gains; programming costs; software
                 controlled cache coherence mechanism; storage
                 management",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Shing:1991:CMD,
  author =       "H. Shing and L. M. Ni",
  title =        "A conflict-free memory design for multiprocessors",
  crossref =     "IEEE:1991:PSA",
  pages =        "46--55",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5310 (Storage system design); C5440 (Multiprocessor
                 systems and techniques); C6120 (File organisation)",
  corpsource =   "Dept. of Comput. Sci., Michigan State Univ., East
                 Lansing, MI, USA",
  keywords =     "conflict-free memory design; data consistency; file
                 organisation; hot spot problem; interconnection network
                 structure; low cost mechanism; low latency; memory
                 architecture; multiprocessing systems; multiprocessors;
                 process synchronization; shared memory organization;
                 synchronisation",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{deDinechin:1991:UFE,
  author =       "B. D. {de Dinechin}",
  title =        "A ultra fast {Euclidean} division algorithm for prime
                 memory systems",
  crossref =     "IEEE:1991:PSA",
  pages =        "56--65",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5230 (Digital arithmetic methods); C5310 (Storage
                 system design)",
  corpsource =   "CEA, Centre d'Etudes de Limeil-Valenton, Villeneuve
                 St. George, France",
  keywords =     "address mapping; address skewing; digital arithmetic;
                 hardware implementation; image processing memory
                 systems; memory architecture; multibank memory design;
                 nonlinear skewing schemes; prime memory systems;
                 supercomputer; two's complement binary arithmetic;
                 ultra fast Euclidean division algorithm",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Cohen:1991:HSS,
  author =       "M. Cohen and M. Foster and D. Kratzer and P. Malone
                 and A. Solem",
  title =        "A high school supercomputing challenge",
  crossref =     "IEEE:1991:PSA",
  pages =        "68--75",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques);
                 C7810C (Computer-aided instruction)",
  corpsource =   "Los Alamos Nat. Lab., NM, USA",
  keywords =     "computational science project; educational computing;
                 high school supercomputing challenge; high-performance
                 computers; parallel processing; science and computing
                 knowledge",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Sadananda:1991:CCA,
  author =       "R. Sadananda",
  title =        "Chaotic cardiac arrhythmias",
  crossref =     "IEEE:1991:PSA",
  pages =        "76--84",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A8730C (Electrical activity); C7330 (Biology and
                 medicine)",
  corpsource =   "Dept. of Biomed. Eng., Northwestern Univ., Evanston,
                 IL, USA",
  keywords =     "cardiology; chaotic cardiac arrhythmias; computer
                 simulation; coupled biological oscillators; digital
                 simulation; fibrillations; medical computing;
                 myocardial cells; nonlinear equations; phase locking;
                 phase response behavior; physiological models;
                 piecewise linear equations",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Hiranandani:1991:COF,
  author =       "S. Hiranandani and K. Kennedy and C.-W. Tseng",
  title =        "Compiler optimizations for {Fortran D} on {MIMD}
                 distributed-memory machines",
  crossref =     "IEEE:1991:PSA",
  pages =        "86--100",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques);
                 C6140D (High level languages); C6150C (Compilers,
                 interpreters and other processors)",
  corpsource =   "Dept. of Comput. Sci., Rice Univ., Houston, TX, USA",
  keywords =     "code generation strategy; communication costs;
                 compiler optimisation; data decomposition; data
                 dependence; FORTRAN; Fortran D; iPSC/860; load
                 imbalance; MIMD distributed-memory machines; node
                 programs; parallel machines; program compilers",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Koelbel:1991:CGR,
  author =       "C. Koelbel",
  title =        "Compile-time generation of regular communications
                 patterns",
  crossref =     "IEEE:1991:PSA",
  pages =        "101--110",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6150C (Compilers, interpreters and other
                 processors); C6150N (Distributed systems)",
  corpsource =   "Center for Res. on Parallel Comput., Rice Univ.,
                 Houston, TX, USA",
  keywords =     "block-distributed arrays; communication of nonlocal
                 values; compile time analysis; compile-time generation;
                 cyclicly-distributed arrays; distributed memory
                 machine; distributed processing; global name space;
                 Kali language; mapping; numerical algorithms; program
                 compilers; regular communications patterns; run-time
                 analysis",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Ramanujan:1991:TMI,
  author =       "J. Ramanujam and P. Sadayappan",
  title =        "Tiling multidimensional iteration spaces for nonshared
                 memory machines",
  crossref =     "IEEE:1991:PSA",
  pages =        "111--120",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6150C (Compilers,
                 interpreters and other processors)",
  corpsource =   "Dept. of Electr. and Comput. Eng., Louisiana State
                 Univ., Baton Rouge, LA, USA",
  keywords =     "deadlock-free tiles; loop iterations; multiply nested
                 loops; nested loops; nonshared memory machines;
                 parallel programming; partitioning; program compilers;
                 tiling multidimensional iteration spaces",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Kung:1991:NAA,
  author =       "H. T. Kung and J. Subhlok",
  title =        "A new approach for automatic parallelization of block
                 linear algebra computations",
  crossref =     "IEEE:1991:PSA",
  pages =        "122--129",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4140 (Linear algebra); C6110P (Parallel
                 programming)",
  corpsource =   "Sch. of Comput. Sci., Carnegie Mellon Univ.,
                 Pittsburgh, PA, USA",
  keywords =     "automatic generation; automatic parallelization; block
                 linear algebra computations; block routines; data
                 distribution scheme; fine-grain parallel
                 architectures; fully automatic system; highly parallel
                 systolic algorithms; iWarp; LAPACK; linear algebra;
                 parallel programming; parallel programs; performance
                 results; sequential block routine",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Markstein:1991:WFF,
  author =       "V. Markstein and P. Markstein and T. Nguyen and S.
                 Poole",
  title =        "Wide format floating-point math libraries",
  crossref =     "IEEE:1991:PSA",
  pages =        "130--138",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5230 (Digital arithmetic methods); C5470
                 (Performance evaluation and testing); C7310
                 (Mathematics)",
  corpsource =   "ISQUARE, Inc., Austin, TX, USA",
  keywords =     "128 bit; 64 bit; accuracy evaluations; Convex C-240;
                 Cray Y-MP; digital arithmetic; floating-point formats;
                 Hewlett--Packard 9000/720; IBM 3090E/VF; IBM
                 System/6000; math libraries; mathematics computing;
                 parallel processing; performance; performance
                 evaluation; transcendental functions; wide format
                 floating point math libraries",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Nicholas:1991:DCD,
  author =       "H. Nicholas and G. Giras and V. Hartonas-Garmhausen
                 and M. Kopko and C. Maher and A. Ropelewski",
  title =        "Distributing the comparison of {DNA} and protein
                 sequences across heterogeneous supercomputers",
  crossref =     "IEEE:1991:PSA",
  pages =        "139--146",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A8715 (Molecular biophysics); C7330 (Biology and
                 medicine)",
  corpsource =   "Pittsburgh Supercomputing Center, PA, USA",
  keywords =     "control program; Cray Y-MP; DNA; DNA sequences;
                 heterogeneous supercomputers; libraries; MaxSegs
                 algorithm; medical computing; protein sequences;
                 proteins; Thinking Machines CM-2 system; workstation",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Simmons:1991:PCT,
  author =       "M. L. Simmons and H. J. Wasserman and O. M. Lubeck and
                 C. Eoyang and R. Mendez and H. Harada and M. Ishiguro",
  title =        "A performance comparison of three supercomputers:
                 {Fujitsu VP-2600}, {NEC SX-3}, and {Cray Y-MP}",
  crossref =     "IEEE:1991:PSA",
  pages =        "150--157",
  year =         "1991",
  bibdate =      "Sat Oct 24 13:05:56 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques); C5470
                 (Performance evaluation and testing)",
  corpsource =   "Los Alamos Nat. Lab., NM, USA",
  keywords =     "Cray Y-MP; Fujitsu VP-2600; highly vectorizable
                 production-type codes; memory bandwidth; Mendez Fluid
                 dynamics codes; multiple vector pipelines; NEC SX-3;
                 parallel processing; performance comparison;
                 performance evaluation; second-generation
                 supercomputers; standard Los Alamos benchmark set;
                 supercomputers; vector register organization",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical; R Product Review",
}
@InProceedings{Bailey:1991:NPB,
  author =       "D. H. Bailey and E. Barszcz and J. T. Barton and D. S.
                 Browning and R. L. Carter and L. Dagum and R. A.
                 Fatoohi and P. O. Frederickson and T. A. Lasinski and
                 R. S. Schreiber and H. D. Simon and V. Venkatakrishnan
                 and S. K. Weeratunga",
  title =        "The {NAS} parallel benchmarks --- summary and
                 preliminary results",
  crossref =     "IEEE:1991:PSA",
  pages =        "158--165",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A4710 (General theory, simulation and other
                 computational methods); C5440 (Multiprocessor systems
                 and techniques); C5470 (Performance evaluation and
                 testing); C7460 (Aerospace engineering)",
  corpsource =   "NASA Ames Res. Center, Moffett Field, CA, USA",
  keywords =     "aerospace computing; CFD codes; computational
                 aerosciences applications; computer fluid dynamics;
                 data motions; flow simulation; highly parallel systems;
                 NAS parallel benchmarks; numerical aerodynamic
                 simulation; parallel kernels; parallel processing;
                 performance evaluation; supercomputers",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Bailey:1991:PRT,
  author =       "D. H. Bailey and P. O. Frederickson",
  title =        "Performance results for two of the {NAS} parallel
                 benchmarks",
  crossref =     "IEEE:1991:PSA",
  pages =        "166--173",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A4710 (General theory, simulation and other
                 computational methods); C1140G (Monte Carlo methods);
                 C4190 (Other numerical methods); C5440 (Multiprocessor
                 systems and techniques); C5470 (Performance evaluation
                 and testing); C7460 (Aerospace engineering)",
  corpsource =   "NASA Ames Res. Center, Moffett Field, CA, USA",
  keywords =     "aerospace computing; Connection Machine-2; Cray Y-MP;
                 fast Fourier transforms; flow simulation;
                 implementation schemes; Intel iPSC/860; Monte Carlo
                 methods; Monte Carlo statistical calculation; numerical
                 aerodynamic simulation; parallel benchmarks; parallel
                 computer systems; parallel processing; performance
                 evaluation; performance results; Poisson partial
                 differential equation solver; three-dimensional fast
                 Fourier transforms",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Baer:1991:EOP,
  author =       "J.-L. Baer and T.-F. Chen",
  title =        "An effective on-chip preloading scheme to reduce data
                 access penalty",
  crossref =     "IEEE:1991:PSA",
  pages =        "176--186",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5310 (Storage system design); C6120 (File
                 organisation)",
  corpsource =   "Dept. of Comput. Sci. and Eng., Washington Univ.,
                 Seattle, WA, USA",
  keywords =     "buffer storage; clock cycles; data access penalty
                 reduction; data cache misses; file organisation;
                 hardware support function; instruction stream;
                 look-ahead program counter; memory access models;
                 memory architecture; memory latency; on-chip data
                 cache; on-chip preloading scheme; operand references;
                 reference prediction table; trace-driven simulation",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Bird:1991:ULR,
  author =       "P. L. Bird and R. A. Uhlig",
  title =        "Using lookahead to reduce memory bank contention for
                 decoupled operand references",
  crossref =     "IEEE:1991:PSA",
  pages =        "187--196",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4240 (Programming and algorithm theory); C5310
                 (Storage system design); C6120 (File organisation)",
  corpsource =   "Adv. Comput. Res. Inst., Lyon, France",
  keywords =     "bank management hardware; complexity; computational
                 complexity; decoupled operand references; high
                 throughput memory designs; lookahead; memory
                 architecture; memory bank contention reduction; operand
                 references; simulation; storage management; storage
                 system control structure; table lookup",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Dubois:1991:DCE,
  author =       "M. Dubois and J.-C. Wang and L. A. Barroso and K. Lee
                 and Y.-S. Chen",
  title =        "Delayed consistency and its effects on the miss rate
                 of parallel programs",
  crossref =     "IEEE:1991:PSA",
  pages =        "197--206",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4240P (Parallel programming and algorithm theory);
                 C5640 (Protocols); C6110P (Parallel programming)",
  corpsource =   "Dept. of Electr. Eng. Syst., Univ. of Southern
                 California, Los Angeles, CA, USA",
  keywords =     "cache-based systems; complexity; computational
                 complexity; delayed consistency; delayed protocols;
                 execution-driven simulations; miss rate; parallel
                 algorithms; parallel programming; parallel programs;
                 performance comparison; protocols; weakly ordered
                 consistency model",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Hatcher:1991:ASP,
  author =       "P. J. Hatcher and M. J. Quinn and R. J. Anderson and
                 A. J. Lapadula and B. K. Seevers and A. F. Bennett",
  title =        "Architecture-independent scientific programming in
                 dataparallel {C}: three case studies",
  crossref =     "IEEE:1991:PSA",
  pages =        "208--217",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6140D (High level
                 languages); C6150C (Compilers, interpreters and other
                 processors); C7340 (Geophysics)",
  corpsource =   "Dept. of Comput. Sci., New Hampshire Univ., Durham,
                 NH, USA",
  keywords =     "architecture independent scientific programming; C
                 code; C language; compiled programs; dataparallel C;
                 geophysics computing; Intel iPSC/2; multicomputers;
                 multiprocessors; nCUBE 3200; ocean circulation model;
                 parallel programming; performance; program compilers;
                 Sequent Symmetry S81; shallow-water atmospheric model;
                 Sharks World model; SIMD programming language",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Hirayama:1991:SFP,
  author =       "H. Hirayama and M. Ikeda and N. Sagawa",
  title =        "Solution functions of {PDEQSOL} (partial differential
                 equation solver language) for fluid problems",
  crossref =     "IEEE:1991:PSA",
  pages =        "218--227",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C4170 (Differential equations); C4185 (Finite
                 element analysis); C6110P (Parallel programming); C6115
                 (Programming support); C7320 (Physics and Chemistry)",
  corpsource =   "Hitachi VLSI Eng. Ltd., Tokyo, Japan",
  keywords =     "benchmark; finite element analysis; finite element
                 method; fluid problems; Fortran 77 program; integrated
                 problem-solving environment; integrated software;
                 parallel programming; partial differential equation
                 solver language; partial differential equations;
                 performance evaluation; physics computing; problem
                 solving; programming environments; solution algorithms;
                 supercomputers; translator; vectorization ratios; very
                 high-level descriptions",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Sethian:1991:CTF,
  author =       "J. A. Sethian and J.-P. Brunet and A. Greenberg and J.
                 P. Mesirov",
  title =        "Computing turbulent flow in complex geometries on a
                 massively parallel processor",
  crossref =     "IEEE:1991:PSA",
  pages =        "230--241",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A4710 (General theory, simulation and other
                 computational methods); A4725 (Turbulent flows,
                 convection, and heat transfer); C5440 (Multiprocessor
                 systems and techniques); C7320 (Physics and
                 Chemistry)",
  corpsource =   "Dept. of Math., California Univ., Berkeley, CA, USA",
  keywords =     "adaptive creation; complex geometries; computational
                 element; Connection Machine CM-2; flow simulation;
                 Lagrangian schemes; massively parallel processor;
                 merger; parallel data structures; parallel elliptic
                 solvers; parallel N-body solvers; parallel processing;
                 physics computing; random vortex method; rollup;
                 turbulence; turbulent flow computing; vortex shedding",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Elton:1991:LBM,
  author =       "B. H. Elton",
  title =        "A lattice {Boltzmann} method for a two-dimensional
                 viscous {Burgers} equation: computational results",
  crossref =     "IEEE:1991:PSA",
  pages =        "242--252",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A5110 (Kinetic and transport theory); C4170
                 (Differential equations); C7320 (Physics and
                 Chemistry)",
  corpsource =   "Fujitsu America Inc., San Jose, CA, USA",
  keywords =     "Boltzmann equation; computational results;
                 conditionally monotone finite difference method;
                 difference equations; flow simulation; kinetic theory
                 of gases; l/sub 1/-norm; lattice Boltzmann method;
                 nonlinear advection-diffusion equation; physics
                 computing; two-dimensional viscous Burgers equation",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical; T Theoretical or Mathematical",
}
@InProceedings{Mechoso:1991:DCM,
  author =       "C. R. Mechoso and C.-C. Ma and J. D. Farrara and J. A.
                 Spahr and R. W. Moore",
  title =        "Distribution of a climate model across high-speed
                 networks",
  crossref =     "IEEE:1991:PSA",
  pages =        "253--260",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9260S (Climatology); A9385 (Instrumentation and
                 techniques for geophysical, hydrospheric and lower
                 atmosphere research); A9575P (Mathematical and computer
                 techniques); C7340 (Geophysics); C7350 (Astronomy and
                 astrophysics)",
  corpsource =   "Dept. of Atmos. Sci., Los Angeles Univ., CA, USA",
  keywords =     "astrophysics computing; atmospheric techniques;
                 climate model; climatology; coupled atmosphere-ocean
                 general circulation model; geographically separated
                 locations; geophysics computing; heterogeneous
                 computing environments; high-speed networks;
                 parallelism",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Cann:1991:RFD,
  author =       "D. Cann",
  title =        "Retire {FORTRAN}? {A} debate rekindled",
  crossref =     "IEEE:1991:PSA",
  pages =        "264--272",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6140D (High level
                 languages)",
  corpsource =   "Lawrence Livermore Nat. Lab., CA, USA",
  keywords =     "abstraction; Cray Sisal; FORTRAN; functional language;
                 parallel execution; parallel programming; performance;
                 programming language; scientific computing",
  sponsororg =   "IEEE; ACM",
  treatment =    "G General Review; P Practical",
}
@InProceedings{Lee:1991:OOP,
  author =       "J. K. Lee and D. Gannon",
  title =        "Object oriented parallel programming experiments and
                 results",
  crossref =     "IEEE:1991:PSA",
  pages =        "273--282",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110J (Object-oriented programming); C6110P
                 (Parallel programming); C6115 (Programming support)",
  corpsource =   "Dept. of Comput. Sci., Indiana Univ., Bloomington, IN,
                 USA",
  keywords =     "data distribution; distributed collection model;
                 massive parallelism; memory locality; object oriented
                 parallel programming; object-oriented programming;
                 parallel programming; PC++; performance; programming
                 environments",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Gursoy:1991:HLS,
  author =       "A. Gursoy and L. V. Kale",
  title =        "High level support for divide-and-conquer
                 parallelism",
  crossref =     "IEEE:1991:PSA",
  pages =        "283--292",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6140D (High level
                 languages)",
  corpsource =   "Dept. of Comput. Sci., Illinois Univ., Urbana, IL,
                 USA",
  keywords =     "C language; Chare Kernel parallel programming;
                 divide-and-conquer parallelism; dynamic load balancing;
                 high level languages; high level support; iPSC/2;
                 machine-independent execution; NCUBE/two; parallel
                 programming; Sequent symmetry; synchronisation;
                 synchronization; translator",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Ewing:1991:VPI,
  author =       "R. Ewing and P. O'Leary and J. Sochacki",
  title =        "Vector\slash parallel implementation of a porous media
                 flow code",
  crossref =     "IEEE:1991:PSA",
  pages =        "294--303",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A4710 (General theory, simulation and other
                 computational methods); A4755M (Flow through porous
                 media); C4240 (Programming and algorithm theory); C7340
                 (Geophysics)",
  corpsource =   "Inst. for Sci. Comput., Wyoming Univ., Laramie, WY,
                 USA",
  keywords =     "computational complexity; computational model; flow
                 simulation; flow through porous media; geophysics
                 computing; large-scale simulation; miscible fluids; oil
                 recovery processes; porous media flow code;
                 supercomputing; timings; viscous fingering",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Young:1991:HPV,
  author =       "L. C. Young and S. E. Zarantonello",
  title =        "High performance vector processing in reservoir
                 simulation",
  crossref =     "IEEE:1991:PSA",
  pages =        "304--315",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A4710 (General theory, simulation and other
                 computational methods); A4755M (Flow through porous
                 media); C4170 (Differential equations); C5440
                 (Multiprocessor systems and techniques); C7340
                 (Geophysics)",
  corpsource =   "Reservoir Simulation Research Corp., Tulsa, OK, USA",
  keywords =     "600 MFLOPS; black-oil problems; computational
                 performance; difference equations; finite-difference
                 formulation; flow simulation; flow through porous
                 media; Fujitsu VP2600/10 supercomputer; geophysics
                 computing; high performance vector processing; parallel
                 processing; reservoir simulation",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Myczkowski:1991:SMA,
  author =       "J. Myczkowski and G. Steele",
  title =        "Seismic modeling at {14 Gigaflops} on the {Connection
                 Machine}",
  crossref =     "IEEE:1991:PSA",
  pages =        "316--326",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "A9130 (Seismology); C4170 (Differential equations);
                 C5440 (Multiprocessor systems and techniques); C7340
                 (Geophysics)",
  corpsource =   "Thinking Machines Corp., Cambridge, MA, USA",
  keywords =     "14 GFLOPS; acoustic wave equation; CM-2 supercomputer;
                 Connection Machine; difference equations; finite
                 difference algorithm; floating point unit; geophysics
                 computing; instruction sequence; interprocessor grid
                 communication; massively parallel machine; memory
                 interface; parallel processing; seismic modelling code;
                 seismology; sponge boundary conditions; stencil
                 compiler",
  sponsororg =   "IEEE; ACM",
  treatment =    "A Application; P Practical",
}
@InProceedings{Dongarra:1991:GBP,
  author =       "J. J. Dongarra and A. Karp and K. Miura and H. D.
                 Simon",
  title =        "{Gordon Bell Prize} lectures (supercomputer
                 applications)",
  crossref =     "IEEE:1991:PSA",
  pages =        "328--337",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "128-node Intel iPSC/860; compiler speedup; Connection
                 Machine; electronic structure; floating point
                 processors; Fortran 77; Fortran 90; grid generation
                 program; parallel processing; partial differential
                 equation; price/performance award; scientific and
                 engineering problems; supercomputers",
  sponsororg =   "IEEE; ACM",
  treatment =    "G General Review; P Practical",
}
@InProceedings{Sabot:1991:CPE,
  author =       "G. Sabot and L. Tennies and A. Vasilevsky and R.
                 Shapiro",
  title =        "Compiler parallelization of an elliptic grid generator
                 for {1990 Gordon Bell Prize}",
  crossref =     "IEEE:1991:PSA",
  pages =        "338--346",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques);
                 C6150C (Compilers, interpreters and other processors)",
  corpsource =   "Thinking Machines Corp., Cambridge, MA, USA",
  keywords =     "1990 Gordon Bell Prize; application code;
                 automatically parallelizing compiler; compiler
                 parallelisation; Connection Machine Fortran 1.0
                 compiler; cycle counting analysis; elliptic grid
                 generator; FORTRAN; Fortran program; numerical
                 simulation; parallel processing; program compilers; Sun
                 workstation",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Beal:1991:GAP,
  author =       "D. Beal and C. Lambrinoudakis",
  title =        "{GPFP}: an array processing element for the next
                 generation of massively parallel supercomputer
                 architectures",
  crossref =     "IEEE:1991:PSA",
  pages =        "348--357",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  acknowledgement = ack-nhfb,
  classification = "B1265F (Microprocessors and microcomputers); B2570D
                 (CMOS integrated circuits); C5130 (Microprocessor
                 chips); C5220P (Parallel architecture); C5230 (Digital
                 arithmetic methods)",
  corpsource =   "Dept. of Comput. Sci., Queen Mary and Westfield Coll.,
                 London Univ., UK",
  keywords =     "1.6 micron; 2.5 GFLOPS; 50 MHz; 50-MHz clock; ALU;
                 arithmetic and logic unit; array processing element;
                 CMOS integrated circuits; CMOSIC; cost-effective extra
                 functionality; digital arithmetic; floating point
                 arithmetic; general purpose with floating point
                 support; GPFP; MasPar; massively parallel SIMD arrays;
                 massively parallel supercomputer architectures;
                 microprocessor chips; on-chip memory; parallel
                 architectures; processing element; VLSI",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
}
@InProceedings{Karmarkar:1991:NPA,
  author          = {N. Karmarkar},
  title           = {A new parallel architecture for sparse matrix
                     computation based on finite projective geometries},
  crossref        = {IEEE:1991:PSA},
  pages           = {358--369},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C4140 (Linear algebra); C5220P (Parallel
                     architecture)},
  corpsource      = {AT and T Bell Labs., Murray Hill, NJ, USA},
  keywords        = {data-routing; finite projective geometries; load
                     balancing; mathematical structure; matrix algebra;
                     memory-access conflicts; parallel architecture;
                     parallel architectures; parallel systems; pattern of
                     interconnection; sparse matrix computation},
  sponsororg      = {IEEE; ACM},
  treatment       = {A Application; P Practical},
}
@InProceedings{Jordan:1991:TMO,
  author          = {H. F. Jordan and V. P. Heuring},
  title           = {Time multiplexed optical computers},
  crossref        = {IEEE:1991:PSA},
  pages           = {370--378},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {B4125 (Fibre optics); B4180 (Optical logic devices
                     and optical computing techniques); C5270 (Optical
                     computing techniques)},
  corpsource      = {Dept. of Electr. and Comput. Eng., Colorado Univ.,
                     Boulder, CO, USA},
  keywords        = {architecture; bit serial; directional couplers;
                     interconnection; logic devices; optical counter;
                     optical fibers; optical fibres; optical information
                     processing; proof-of-principle experiment; temporal
                     latency; time division multiplexing; time multiplexed
                     optical computers},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
@InProceedings{Fiduccia:1991:UMN,
  author          = {C. M. Fiduccia and E. M. Jacobson},
  title           = {Universal multistage networks via linear
                     permutations},
  crossref        = {IEEE:1991:PSA},
  pages           = {380--389},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C1160 (Combinatorial mathematics); C4230M
                     (Multiprocessor interconnection)},
  corpsource      = {Supercomputing Res. Center, Bowie, MD, USA},
  keywords        = {de Bruijn graph; directed 2-graphs; directed graphs;
                     invertible linear operator; linear permutations;
                     multiprocessor interconnection networks; N/2 nodes;
                     shuffle-exchange network; universal multistage
                     networks},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; T Theoretical or Mathematical},
}
@InProceedings{Wei:1991:DAE,
  author          = {S. Wei and S. Levy},
  title           = {Design and analysis of efficient hierarchical
                     interconnection networks},
  crossref        = {IEEE:1991:PSA},
  pages           = {390--399},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C4230M (Multiprocessor interconnection); C5670
                     (Network performance)},
  corpsource      = {Dept. of Comput. Sci., Rutgers Univ., New Brunswick,
                     NJ, USA},
  keywords        = {average internode distance; design parameters;
                     diameter; fault tolerance capability; hierarchical
                     interconnection networks; intercluster traffic density;
                     interface nodes; message-passing architectures;
                     multiprocessor interconnection networks; performance
                     evaluation; performance measures},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
@InProceedings{Farrens:1991:ATS,
  author          = {M. Farrens and B. Wetmore and A. Woodruff},
  title           = {Alleviation of tree saturation in multistage
                     interconnection networks},
  crossref        = {IEEE:1991:PSA},
  pages           = {400--409},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C1160 (Combinatorial mathematics); C4230M
                     (Multiprocessor interconnection); C5670 (Network
                     performance)},
  corpsource      = {Div. of Comput. Sci., California Univ., Davis, CA,
                     USA},
  keywords        = {bleeding; feedback damping scheme; feedback threshold
                     value; hot spot contention; memory modules; memory
                     queue size; multiprocessor interconnection networks;
                     multistage interconnection networks; network
                     simulation; performance evaluation; system performance;
                     tree saturation alleviation; trees (mathematics)},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; T Theoretical or Mathematical},
}
@InProceedings{Cheng:1991:EAI,
  author          = {D. Y. Cheng and D. M. Pase},
  title           = {An evaluation of automatic and interactive parallel
                     programming tools},
  crossref        = {IEEE:1991:PSA},
  pages           = {412--423},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C5470 (Performance evaluation and testing); C6110P
                     (Parallel programming); C6115 (Programming support);
                     C7460 (Aerospace engineering)},
  corpsource      = {NASA Ames Res. Center, Moffett Field, CA, USA},
  keywords        = {aerospace computing; aerospace simulation; automatic
                     tools; benchmarks; code transformation; Cray Y-MP;
                     interactive parallel programming tools; interactive
                     systems; machine-specific optimizations; NAS; Numerical
                     Aerodynamics Simulation; parallel programming;
                     performance; performance degradation; performance
                     evaluation; software tools},
  sponsororg      = {IEEE; ACM},
  treatment       = {A Application; P Practical},
}
@InProceedings{Hall:1991:ITP,
  author          = {M. W. Hall and K. Kennedy and K. S. McKinley},
  title           = {Interprocedural transformations for parallel code
                     generation},
  crossref        = {IEEE:1991:PSA},
  pages           = {424--434},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6150C (Compilers,
                     interpreters and other processors); C6150G (Diagnostic,
                     testing, debugging and evaluating systems)},
  corpsource      = {Dept. of Comput. Sci., Rice Univ., Houston, TX, USA},
  keywords        = {compiler optimization; interprocedural
                     transformations; loop parallelization; machine model;
                     parallel code generation; parallel programming;
                     parallelism-enhancing transformations; Perfect
                     Benchmarks; performance evaluation; performance
                     improvements; procedure calls; program compilers;
                     scientific programs; shared-memory multiprocessor},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
%%% NOTE: corpsource uses the abbreviation `Nat. Lab.' (with a period after
%%% `Nat'), matching the other national-laboratory affiliations in this file.
@InProceedings{Beguelin:1991:GDT,
  author          = {A. Beguelin and J. J. Dongarra and G. A. Geist and R.
                     Manchek and V. S. Sunderam},
  title           = {Graphical development tools for network-based
                     concurrent supercomputing},
  crossref        = {IEEE:1991:PSA},
  pages           = {435--444},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6115 (Programming
                     support); C6180G (Graphical user interfaces)},
  corpsource      = {Oak Ridge Nat. Lab., TN, USA},
  keywords        = {application program; graphical development tools;
                     graphical user interfaces; HeNCE; heterogeneous network
                     computing environment; integrated graphical tools;
                     network-based concurrent supercomputing; parallel
                     programming; parallel programs; Parallel Virtual
                     Machine; process management and communication;
                     programming environments; PVM; software package;
                     X-window-based software environment},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
@InProceedings{Plimpton:1991:SAR,
  author          = {S. Plimpton and G. Mastin and D. Ghiglia},
  title           = {Synthetic aperture radar image processing on parallel
                     supercomputers},
  crossref        = {IEEE:1991:PSA},
  pages           = {446--452},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {B6140C (Optical information and image processing);
                     B6320 (Radar equipment, systems and applications);
                     C5260B (Computer vision and picture processing); C7410F
                     (Communications)},
  corpsource      = {Sandia Nat. Labs., Albuquerque, NM, USA},
  keywords        = {2-D FFTs; CM-2; computerised picture processing; fast
                     Fourier transforms; nCUBE 2 hypercube; parallel
                     processing; parallel supercomputers; performance data;
                     phase gradient autofocusing; polar reformatter; radar
                     applications; synthetic aperture radar image
                     processing; telecommunications computing; uncompensated
                     phase errors},
  sponsororg      = {IEEE; ACM},
  treatment       = {A Application; P Practical},
}
@InProceedings{Hotchkiss:1991:ASI,
  author          = {R. S. Hotchkiss and C. L. Wampler},
  title           = {The auditorialization of scientific information},
  crossref        = {IEEE:1991:PSA},
  pages           = {453--461},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {B6130 (Speech analysis and processing techniques);
                     B6140 (Signal processing and detection); C5260 (Digital
                     signal processing); C5585 (Speech recognition and
                     synthesis)},
  corpsource      = {Los Alamos Nat. Lab., NM, USA},
  keywords        = {auditorialization; computerised signal processing;
                     cryptography; encoding; encrypt; functional data;
                     mathematical functions; scientific information;
                     sequences of music; sound errors; speech analysis and
                     processing; speech recognition},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
%%% NOTE: corpsource is `Thinking Machines Corp.' (plural), the same
%%% spelling used by entry Sabot:1991:CPE for this company.
@InProceedings{Tamayo:1991:PAS,
  author          = {P. Tamayo and J. P. Mesirov and B. M. Boghosian},
  title           = {Parallel approaches to short range molecular dynamics
                     simulations},
  crossref        = {IEEE:1991:PSA},
  pages           = {462--470},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {A6120J (Computer simulation of static and dynamic
                     behaviour); C4240P (Parallel programming and algorithm
                     theory); C7320 (Physics and Chemistry)},
  corpsource      = {Thinking Machines Corp., Cambridge, MA, USA},
  keywords        = {coarse-grained cells; computational requirements;
                     Connection Machine CM-2; linked lists; molecular
                     dynamics method; parallel algorithms; parallel
                     machines; performance evaluation; physics computing;
                     short range molecular dynamics simulations; Verlet
                     neighbor lists},
  sponsororg      = {IEEE; ACM},
  treatment       = {A Application; P Practical},
}
%%% NOTE: the last author is the single person J. Juda.  The source data
%%% had split the name into the two bogus authors `Juda' and `J.', which
%%% BibTeX would have typeset as six authors instead of five.
@InProceedings{Friedell:1991:VBM,
  author          = {M. Friedell and M. LaPolla and S. Kochhar and S.
                     Sistare and J. Juda},
  title           = {Visualizing the behavior of massively parallel
                     programs},
  crossref        = {IEEE:1991:PSA},
  pages           = {472--480},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6115 (Programming
                     support); C6150G (Diagnostic, testing, debugging and
                     evaluating systems)},
  corpsource      = {Harvard Univ., Cambridge, MA, USA},
  keywords        = {behaviour visualization; computer-aided design system;
                     conceptual framework; Connection Machine; debugging;
                     integrated visualization environment; massively
                     parallel programs; parallel programming; program
                     debugging; program testing; programming environments;
                     prototype system; SIMD programs; user-interaction
                     paradigm},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
@InProceedings{Goldberg:1991:PDS,
  author          = {A. J. Goldberg and J. L. Hennessy},
  title           = {Performance debugging shared memory multiprocessor
                     programs with {MTOOL}},
  crossref        = {IEEE:1991:PSA},
  pages           = {481--490},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6115 (Programming
                     support); C6150G (Diagnostic, testing, debugging and
                     evaluating systems); C6180G (Graphical user
                     interfaces)},
  corpsource      = {Stanford Univ., CA, USA},
  keywords        = {graphical user interfaces; low overhead
                     instrumentation; MTOOL; parallel programming;
                     performance evaluation; performance losses; program
                     debugging; shared memory parallel programs; Silicon
                     Graphics multiprocessors; software tool; software
                     tools; synchronisation; synchronization bottlenecks;
                     time bottlenecks; window-based user interface},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
%%% NOTE: the corpsource city is spelled `Ithaca'; the source data had two
%%% letters transposed.
@InProceedings{Utter-Honig:1991:GAP,
  author          = {S. Utter-Honig and C. M. Pancake},
  title           = {Graphical animation of parallel {Fortran} programs},
  crossref        = {IEEE:1991:PSA},
  pages           = {491--500},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6130B (Graphics
                     techniques); C6150G (Diagnostic, testing, debugging and
                     evaluating systems)},
  corpsource      = {Cornell Nat. Supercomputer Facility, Cornell Univ.,
                     Ithaca, NY, USA},
  keywords        = {computer animation; FORTRAN; hierarchically organized
                     source code; lock/event synchronization; parallel
                     Fortran programs; parallel programming; performance
                     analysis; performance evaluation; PF-View; program
                     behavior; software tools; synchronisation; textural
                     trace information; tool; visualizing the behavior},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
@InProceedings{Chang:1991:SPP,
  author          = {Yao-Jen Chang and J.-L. C. Wu and Jingshown Wu},
  title           = {Scheduling parallel programs with non-uniform
                     parallelism profiles},
  crossref        = {IEEE:1991:PSA},
  pages           = {502--511},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6150J (Operating
                     systems)},
  corpsource      = {Dept. of Electr. Eng., Nat. Taiwan Univ., Taipei,
                     Taiwan},
  keywords        = {databases; job turnaround time; multiprocessing
                     systems; nonuniform parallelism profiles; operating
                     system; parallel algorithms; parallel programming;
                     parallel programs scheduling; parallelizing compilers;
                     performance evaluation; processor allocation;
                     scheduling; speedup; task graphs},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
%%% NOTE: the fourth author is the single person B. W. Wah.  The source
%%% data had split the name into the two bogus authors `Wah' and `B. W.',
%%% which BibTeX would have typeset as six authors instead of five.
@InProceedings{Ieumwananonthachai:1991:IMC,
  author          = {A. Ieumwananonthachai and A. N. Aizawa and S. R.
                     Schwartz and B. W. Wah and J. C. Yan},
  title           = {Intelligent mapping of communicating processes in
                     distributed computing systems},
  crossref        = {IEEE:1991:PSA},
  pages           = {512--521},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C1230 (Artificial intelligence); C4240 (Programming
                     and algorithm theory); C6150N (Distributed systems)},
  corpsource      = {Coord. Sci. Lab., Illinois Univ., Champaign, IL, USA},
  keywords        = {automatically designing heuristics; communicating
                     processes; computational complexity; distributed
                     computing systems; distributed processing; heuristic
                     programming; NP-hard; optimal routing of messages;
                     post-game analysis; real-time systems; simulations;
                     solution quality; statistical method; TEACHER 4.1},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical},
}
@InProceedings{Kodama:1991:LBF,
  author          = {Y. Kodama and S. Sakai and Y. Yamaguchi},
  title           = {Load balancing by function distribution on the {EM-4}
                     prototype},
  crossref        = {IEEE:1991:PSA},
  pages           = {522--531},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C5440 (Multiprocessor systems and techniques); C5470
                     (Performance evaluation and testing); C6150N
                     (Distributed systems)},
  corpsource      = {Electrotech. Lab., Ibaraki, Japan},
  keywords        = {allocation functions; divide-and-conquer program;
                     dynamic characteristics; EM-4; function distribution;
                     game tree program; load balancing methods;
                     local-minimum load; MLPE packets; parallel dataflow
                     machine; parallel processing; performance evaluation;
                     resource allocation},
  sponsororg      = {IEEE; ACM},
  treatment       = {X Experimental},
}
@InProceedings{Meindl:1991:GIG,
  author          = {J. D. Meindl},
  title           = {Gigascale integration ({GSI}) technology},
  crossref        = {IEEE:1991:PSA},
  pages           = {534--538},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {B1265 (Digital electronics); B2570 (Semiconductor
                     integrated circuits); C5120 (Logic and switching
                     circuits)},
  corpsource      = {Rensselaer Polytech. Inst., Troy, NY, USA},
  keywords        = {chip area; chip performance index; delays; gigascale
                     integration; integrated circuit technology;
                     macrovariables; minimum feature size; number of
                     transistors per minimum feature area; power-delay
                     product; reciprocal length versus delay; singular
                     metric; switching operations; technological
                     forecasting; transmission operations; VLSI},
  sponsororg      = {IEEE; ACM},
  treatment       = {G General Review},
}
@InProceedings{Willen:1991:EGP,
  author          = {D. E. Willen},
  title           = {Exploration geophysics, parallel computing and
                     reality},
  crossref        = {IEEE:1991:PSA},
  pages           = {540--??},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {A9130R (Explosion seismology); A9365 (Data
                     acquisition, processing and storage); A9385
                     (Instrumentation and techniques for geophysical,
                     hydrospheric and lower atmosphere research); C5440
                     (Multiprocessor systems and techniques); C7340
                     (Geophysics)},
  corpsource      = {EXXON Production Research Co., Houston, TX, USA},
  keywords        = {complex near surface; density effects; elastic
                     effects; exploration geophysics; geophysical
                     prospecting; geophysics computing; inverse problems;
                     layered Earth approximations; parallel processing;
                     seismic data; seismology; structured models; TeraFLOPS;
                     TFLOPS; traveltime calculations; wave propagation},
  sponsororg      = {IEEE; ACM},
  treatment       = {G General Review},
}
@InProceedings{Rutledge:1991:AIL,
  author          = {J. M. Rutledge and D. R. Jones and W. H. Chen and E.
                     Y. Chung},
  title           = {Application issues for large scale reservoir
                     simulation on massively parallel computers},
  crossref        = {IEEE:1991:PSA},
  pages           = {541--??},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {A9385 (Instrumentation and techniques for
                     geophysical, hydrospheric and lower atmosphere
                     research); C5440 (Multiprocessor systems and
                     techniques); C6150N (Distributed systems); C7340
                     (Geophysics); C7450 (Chemical engineering)},
  keywords        = {chemical engineering computing; computational speed;
                     distributed memory machines; geophysics computing;
                     indirect addressing; intensive computational needs;
                     large scale reservoir simulation; linear equation
                     solver; load balancing; massively parallel computers;
                     oil technology; parallel processing; petroleum
                     reservoir models; resource allocation; robustness;
                     shared memory computers; unit stride; vector
                     supercomputers},
  sponsororg      = {IEEE; ACM},
  treatment       = {G General Review},
}
@InProceedings{Kendall:1991:LSR,
  author          = {R. P. Kendall and J. R. Wallis and J. A. Foster and J.
                     S. Nolen},
  title           = {Large scale reservoir simulation in the concurrent
                     processing milieu},
  crossref        = {IEEE:1991:PSA},
  pages           = {542--??},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C7340 (Geophysics); C7450 (Chemical engineering)},
  keywords        = {chemical engineering computing; concurrent processing
                     milieu; fine granularity; geophysics computing;
                     numerical reservoir simulation; oil technology;
                     parallel processing; performance gains; simulation
                     technology},
  sponsororg      = {IEEE; ACM},
  treatment       = {G General Review},
}
@InProceedings{Smith:1991:VCC,
  author          = {L. L. Smith},
  title           = {Vectorizing {C} compilers: how good are they?},
  crossref        = {IEEE:1991:PSA},
  pages           = {544--553},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6140D (High level
                     languages); C6150C (Compilers, interpreters and other
                     processors)},
  corpsource      = {Supercomputing Res. Center, Bowie, MD, USA},
  keywords        = {automatic vectorization; C language; C loop kernels;
                     Convex Application Compiler; Convex cc compiler; Cray 2
                     scc compiler; Cray YMP scc compiler; parallel
                     programming; pipeline processing; program compilers;
                     program testing; vectorizing C compilers},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; X Experimental},
}
@InProceedings{Glen:1991:CMH,
  author          = {R. R. Glen and D. V. Pryor and J. M. Conroy and T.
                     Johnson},
  title           = {Characterizing memory hot spots in a shared memory
                     {MIMD} machine},
  crossref        = {IEEE:1991:PSA},
  pages           = {554--566},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C5220P (Parallel architecture); C5440
                     (Multiprocessor systems and techniques); C6150N
                     (Distributed systems)},
  corpsource      = {Supercomputing Res. Center, Bowie, MD, USA},
  keywords        = {bistability; critical section; first come/first serve
                     queuing mechanism; massively parallel MIMD computers;
                     memory hot spot; memory stride; multiprocessing
                     systems; pseudorandom interleaving; separate memory
                     accesses; shared memory locations; shared memory MIMD
                     machine; split transaction; storage management;
                     supercomputers; threads; throughput prediction},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; T Theoretical or Mathematical},
}
@InProceedings{Miller:1991:IOB,
  author          = {E. L. Miller and R. H. Katz},
  title           = {Input\slash output behavior of supercomputing
                     applications},
  crossref        = {IEEE:1991:PSA},
  pages           = {567--576},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C5440 (Multiprocessor systems and techniques);
                     C6150N (Distributed systems)},
  corpsource      = {Dept. of Electr. Eng. and Comput. Sci., California
                     Univ., Berkeley, CA, USA},
  keywords        = {access pattern; buffer storage; bursty I/O request
                     pattern; caching simulations; CPU utilization; Cray
                     computers; Cray Y-MP CPU; digital simulation; file
                     cache; file references; input-output programs;
                     parallel processing; read-ahead; solid-state disk;
                     storage management; supercomputer I/O traces;
                     write-behind},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; X Experimental},
}
%%% NOTE: the corpsource abbreviation is `Dept. of Comput. Sci.' (a period,
%%% not a comma, after `Comput'), as in the other entries of this file.
@InProceedings{Chronopoulos:1991:TEP,
  author          = {A. T. Chronopoulos},
  title           = {Towards efficient parallel implementation of the {CG}
                     method applied to a class of block tridiagonal linear
                     systems},
  crossref        = {IEEE:1991:PSA},
  pages           = {578--587},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C4140 (Linear algebra); C4170 (Differential
                     equations); C4240P (Parallel programming and algorithm
                     theory); C5220P (Parallel architecture)},
  corpsource      = {Dept. of Comput. Sci., Minnesota Univ., Minneapolis,
                     MN, USA},
  keywords        = {block tridiagonal linear systems; conjugate gradient
                     methods; CRAY-2; elliptic partial differential
                     equation; Hypercube parallel computers; memory
                     hierarchy; message passing private memory machines;
                     parallel algorithms; parallel architectures; parallel
                     machines; parameterized vector architecture; partial
                     differential equations; shared memory machines; vector
                     processors},
  sponsororg      = {IEEE; ACM},
  treatment       = {X Experimental},
}
@InProceedings{Pommerell:1991:PIL,
  author          = {C. Pommerell and W. Fichtner},
  title           = {{PILS}: an iterative linear solver package for
                     ill-conditioned systems},
  crossref        = {IEEE:1991:PSA},
  pages           = {588--599},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C4140 (Linear algebra); C7310 (Mathematics)},
  corpsource      = {Integrated Syst. Lab., ETH, Zurich, Switzerland},
  keywords        = {equation solution; ill-conditioned systems; iterative
                     linear solver package; linear algebra; linear
                     equations; mathematics computing; multidimensional
                     solution; ordering; partial differential equations;
                     PILS; preconditioning; production; software
                     implementation; software package; software packages},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; T Theoretical or Mathematical},
}
@InProceedings{Malard:1991:TPD,
  author          = {J. Malard},
  title           = {Threshold pivoting for dense {LU} factorization on
                     distributed memory multiprocessor},
  crossref        = {IEEE:1991:PSA},
  pages           = {600--607},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C4140 (Linear algebra); C4240P (Parallel programming
                     and algorithm theory)},
  corpsource      = {Sch. of Comput. Sci., McGill Univ., Montreal, Que.,
                     Canada},
  keywords        = {block column wrapping; dense LU factorization;
                     distributed memory multiprocessor; matrix algebra;
                     multicasts; parallel algorithms; parallel programming;
                     row wrapping},
  sponsororg      = {IEEE; ACM},
  treatment       = {X Experimental},
}
@InProceedings{Hummel:1991:FPR,
  author          = {S. F. Hummel and E. Schonberg and L. E. Flynn},
  title           = {Factoring: a practical and robust method for
                     scheduling parallel loops},
  crossref        = {IEEE:1991:PSA},
  pages           = {610--619},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6150C (Compilers,
                     interpreters and other processors)},
  corpsource      = {CRI, Ecole Nat. Sup{\'e}rieure des Mines de Paris,
                     Fontainebleau, France},
  keywords        = {factoring; guided self-scheduling; independent
                     iterations; optimal finishing time; parallel languages;
                     parallel programming; parallel-loop characteristics;
                     program compilers; PTRAN restructuring compiler;
                     resource allocation; RP3 runtime system; scheduling;
                     scheduling parallel loops; static chunking},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; X Experimental},
}
@InProceedings{Chen:1991:ESD,
  author          = {D.-K. Chen and P.-C. Yew},
  title           = {An empirical study on {DOACROSS} loops},
  crossref        = {IEEE:1991:PSA},
  pages           = {620--632},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C6110P (Parallel programming); C6150C (Compilers,
                     interpreters and other processors)},
  corpsource      = {Center for Supercomput. Res. and Dev., Illinois Univ.,
                     Urbana, IL, USA},
  keywords        = {concurrent DOACROSS loop execution; cross-iteration
                     dependences; digital simulation; execution-driven
                     simulation; KAP; MaxPar; optimizing compilers; parallel
                     machines; parallel programming; parallelizing compiler;
                     program compilers},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; X Experimental},
}
@InProceedings{Yang:1991:FSS,
  author          = {T. Yang and A. Gerasoulis},
  title           = {A fast static scheduling algorithm for {DAGs} on an
                     unbounded number of processors},
  crossref        = {IEEE:1991:PSA},
  pages           = {633--642},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C1160 (Combinatorial mathematics); C4240P (Parallel
                     programming and algorithm theory); C6110P (Parallel
                     programming); C6150N (Distributed systems)},
  corpsource      = {Dept. of Comput. Sci., Rutgers Univ., New Brunswick,
                     NJ, USA},
  keywords        = {coarse tree graphs; communication overhead; completely
                     connected processors; computational complexity; DAG;
                     DAGs; directed acyclic task graphs; directed graphs;
                     dominant sequences clustering; fork; heuristic
                     algorithm; join; parallel algorithms; parallel
                     programming; parallel time; scheduling; static
                     scheduling algorithm},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; T Theoretical or Mathematical},
}
%%% NOTE(review): the second author is believed to be R. G. Melhem
%%% (Pittsburgh Univ.); the source data spelled the surname `Melham'.
%%% Confirm against the printed proceedings.
@InProceedings{Qiao:1991:TOC,
  author          = {C. Qiao and R. G. Melhem},
  title           = {Time-division optical communications in multiprocessor
                     arrays},
  crossref        = {IEEE:1991:PSA},
  pages           = {644--653},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {B6150C (Switching theory); B6260 (Optical links and
                     equipment); C4230M (Multiprocessor interconnection);
                     C5440 (Multiprocessor systems and techniques); C6150N
                     (Distributed systems)},
  corpsource      = {Dept. of Comput. Sci., Pittsburgh Univ., PA, USA},
  keywords        = {clock distribution method; high communication
                     bandwidth; message pipelining; multiprocessing systems;
                     multiprocessor arrays; optical communication; optical
                     signal transmission; optical waveguides; predictable
                     propagation delays; synchronisation; synchronization;
                     time division multiplexing; time-division multiplexing;
                     unidirectional propagation},
  sponsororg      = {IEEE; ACM},
  treatment       = {T Theoretical or Mathematical},
}
@InProceedings{Felperin:1991:FRP,
  author          = {S. A. Felperin and L. Gravano and G. D. Pifarre and J.
                     C. L. Sanz},
  title           = {Fully-adaptive routing: packet switching performance
                     and wormhole algorithms},
  crossref        = {IEEE:1991:PSA},
  pages           = {654--663},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {B6150C (Switching theory); C4230M (Multiprocessor
                     interconnection); C5220P (Parallel architecture); C5470
                     (Performance evaluation and testing)},
  keywords        = {deadlock-free adaptive routing; fully adaptive minimal
                     worm-hole routing algorithm; hypercube; injection
                     models; latency; livelock-free adaptive routing; mesh;
                     packet switching; packet switching performance;
                     parallel architectures; performance evaluation;
                     saturation point; simulation study; telecommunication
                     traffic; throughput; traffic models; wormhole
                     algorithms},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; X Experimental},
}
@InProceedings{Kung:1991:NME,
  author          = {H. T. Kung and R. Sansom and S. Schlick and P.
                     Steenkiste and M. Arnould and F. J. Bitz and
                     F. Christianson and E. C. Cooper and
                     {\"O}. Menzilcio{\u{g}}lu and D. Ombres and B. Zill},
  title           = {Network-based multicomputers: an emerging parallel
                     architecture},
  crossref        = {IEEE:1991:PSA},
  pages           = {664--673},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {C5220P (Parallel architecture); C5440
                     (Multiprocessor systems and techniques); C5620
                     (Computer networks and techniques)},
  corpsource      = {Sch. of Comput. Sci., Carnegie Mellon Univ.,
                     Pittsburgh, PA, USA},
  keywords        = {computer networks; copy operations; high bandwidth;
                     high-speed crossbar switches; host interrupts;
                     host-network interface overhead; low latency;
                     multicomputer applications; multiprocessing systems;
                     Nectar; network-based multicomputers; parallel
                     architecture; parallel architectures; protocol;
                     system-specific interconnects},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; X Experimental},
}
@InProceedings{Chervin:1991:CMP,
  author          = {R. Chervin},
  title           = {Climate modeling with parallel vector supercomputers},
  crossref        = {IEEE:1991:PSA},
  pages           = {677--??},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {A9260B (General circulation); A9260S (Climatology);
                     A9365 (Data acquisition, processing and storage); C7340
                     (Geophysics)},
  corpsource      = {Nat. Center for Atmos. Res., Boulder, CO, USA},
  keywords        = {atmospheric movements; climate modeling; climatology;
                     global atmospheric models; global climate system; model
                     performance enhancement; National Center for
                     Atmospheric Research; NCAR; ocean models; parallel
                     processing; parallel vector supercomputers; performance
                     evaluation; reduced execution time},
  sponsororg      = {IEEE; ACM},
  treatment       = {G General Review},
}
@InProceedings{Dannevik:1991:CMM,
  author          = {W. Dannevik},
  title           = {Computing modeling in a {MIMD} environment},
  crossref        = {IEEE:1991:PSA},
  pages           = {678--??},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {A9210D (Dynamics of the deep ocean); A9210F
                     (Dynamics of the upper ocean); A9260B (General
                     circulation); A9260S (Climatology); A9365 (Data
                     acquisition, processing and storage); C6110P (Parallel
                     programming); C7340 (Geophysics)},
  corpsource      = {Lawrence Livermore Nat. Lab., CA, USA},
  keywords        = {1D domain decomposition; 2D decomposition; atmospheric
                     circulation model; atmospheric movements; BBN TC2000
                     MIMD system; climate model numerical algorithms;
                     climatology; data structure definition;
                     distributed-memory programming models; finite
                     difference models; general circulation models;
                     geophysics computing; load-balancing; message-passing
                     paradigms; MIMD environment; oceanography; parallel
                     efficiency; parallel processing; Semtner-Chervin ocean
                     circulation model; shared-memory programming model;
                     spatial resolution; time-advance algorithm selection},
  sponsororg      = {IEEE; ACM},
  treatment       = {P Practical; T Theoretical or Mathematical},
}
@InProceedings{Smith:1991:OMC,
  author          = {R. D. Smith and J. K. Dukowicz and R. C. Malone},
  title           = {Ocean modeling on the {Connection Machine}},
  crossref        = {IEEE:1991:PSA},
  pages           = {679--??},
  year            = {1991},
  bibdate         = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification  = {A9210D (Dynamics of the deep ocean); A9210F
                     (Dynamics of the upper ocean); A9260B (General
                     circulation); A9365 (Data acquisition, processing and
                     storage); C6110P (Parallel programming); C7340
                     (Geophysics)},
  corpsource      = {Los Alamos Nat. Lab., NM, USA},
  keywords        = {3D primitive equations; 4-processor XMP; coastal
                     topography; Connection Machine; data structure; DOE
                     CHAMMP program; geophysics computing; global ocean
                     model; longitude-depth slab; Los Alamos CM-2 Connection
                     Machine; ocean-bottom topography; oceanography;
                     parallel processing; Semtner-Chervin ocean model;
                     stratified fluid flow; surface-pressure formulation},
  sponsororg      = {IEEE; ACM},
  treatment       = {T Theoretical or Mathematical; X Experimental},
}
@inproceedings{Chiueh:1991:IMM,
  author = {T.-C. Chiueh},
  title = {An integrated memory management scheme for dynamic
    alias resolution},
  crossref = {IEEE:1991:PSA},
  pages = {682--691},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C5220P (Parallel architecture); C5440
    (Multiprocessor systems and techniques); C6150J
    (Operating systems); C6150N (Distributed systems)},
  corpsource = {Dept. of Electr. Eng. and Comput. Sci., California
    Univ., Berkeley, CA, USA},
  keywords = {indirect resolution; integrated memory management;
    machine cycle time; memory mapped register;
    multiprocessor configurations; on-chip data cache;
    pipeline depth; processor registers; storage
    allocation; storage management; tagged register},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical},
}
%%% Both authors are given in plain "Initials Surname" form so that BibTeX
%%% splits each name into its given and family parts (a brace group around
%%% "Surname, Initials" would be read as one indivisible surname).
%%% The first author's surname is spelled Corporaal; the citation key keeps
%%% its existing spelling so that existing citations continue to resolve.
@InProceedings{Corporal:1991:MFH,
author = "H. Corporaal and H. Mulder",
title = "{MOVE}: a framework for high-performance processor
design",
crossref = "IEEE:1991:PSA",
pages = "692--701",
year = "1991",
bibdate = "Wed Apr 15 16:28:01 MDT 1998",
acknowledgement = ack-nhfb,
classification = "C5220P (Parallel architecture)",
corpsource = "Dept. of Electr. Eng., Delft Univ. of Technol.,
Netherlands",
keywords = "configurable; data operations; data transport;
hardware organization; hardware utilization;
high-performance processors;
instruction-level-parallelism; MOVE; parallel
architectures; pipeline processing; pipelining;
scalable; short cycle implementations",
sponsororg = "IEEE; ACM",
treatment = "P Practical",
}
@inproceedings{Bird:1991:SPP,
  author = {P. L. Bird and U. F. Pleban},
  title = {A semantics-directed partitioning of a processor
    architecture},
  crossref = {IEEE:1991:PSA},
  pages = {702--709},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4210 (Formal logic); C4240 (Programming and
    algorithm theory); C5220P (Parallel architecture)},
  corpsource = {Adv. Comput. Res. Inst., Lyon, France},
  keywords = {action semantics; computer architecture; decoupled
    address generation; decoupled control activity;
    denotational semantics; formal languages; formal
    semantic model; MISD machine; parallel architectures;
    processor architecture; programming language semantics;
    programming theory; semantics partitioning;
    semantics-directed partitioning},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical},
}
@inproceedings{Zagha:1991:RSV,
  author = {M. Zagha and G. E. Blelloch},
  title = {Radix sort for vector multiprocessors},
  crossref = {IEEE:1991:PSA},
  pages = {712--721},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4240P (Parallel programming and algorithm theory);
    C6110P (Parallel programming); C6130 (Data handling
    techniques)},
  corpsource = {Sch. of Comput. Sci., Carnegie Mellon Univ.,
    Pittsburgh, PA, USA},
  keywords = {Cray computers; CRAY-Y-MP; data-parallel algorithm;
    parallel algorithms; pipeline processing; radix sort
    algorithm; sorting; vector multiprocessors},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical},
}
@inproceedings{Kanada:1991:MVP,
  author = {Y. Kanada},
  title = {A method of vector processing for shared symbolic
    data},
  crossref = {IEEE:1991:PSA},
  pages = {722--731},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4210 (Formal logic); C4240P (Parallel programming
    and algorithm theory); C6120 (File organisation)},
  corpsource = {Hitachi Ltd., Tokyo, Japan},
  keywords = {address calculation sorting; data structures; dynamic
    data structures; filtering-overwritten-label method;
    graphs; hash table; Hitachi S-810; lists; multiple
    processings; parallel algorithms; parallel programming;
    parallel rewriting; programming theory; rewriting
    systems; shared elements; shared symbolic data;
    symbolic processing algorithms; trees; vector
    processing},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical},
}
@inproceedings{Alnuweiri:1991:OBV,
  author = {H. M. Alnuweiri},
  title = {Optimal bounded-degree {VLSI} networks for sorting in
    a constant number of rounds},
  crossref = {IEEE:1991:PSA},
  pages = {732--739},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {B2570 (Semiconductor integrated circuits); C4230M
    (Multiprocessor interconnection); C4240P (Parallel
    programming and algorithm theory); C6130 (Data handling
    techniques)},
  corpsource = {Dept. of Electr. Eng., British Columbia Univ.,
    Vancouver, BC, Canada},
  keywords = {bounded-degree VLSI networks; computational
    complexity; enumeration-sort; I/O pins; index-mapping
    methodology; multiple chip networks; multiprocessor
    interconnection networks; optimal VLSI sorters;
    parallel programming; partitioning; programming theory;
    reduced-area shuffle networks; rotate-sort; sorting;
    VLSI},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical},
}
@inproceedings{Theobald:1991:EPA,
  author = {K. B. Theobald and G. R. Gao},
  title = {An efficient parallel algorithm for all pairs
    examination},
  crossref = {IEEE:1991:PSA},
  pages = {742--753},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C1110 (Algebra); C4140 (Linear algebra); C4240P
    (Parallel programming and algorithm theory)},
  corpsource = {Sch. of Comput. Sci., McGill Univ., Montreal, Que.,
    Canada},
  keywords = {all pairs examination; automorphic transformations;
    communication steps; computational complexity; group
    theory; linear feedback shift registers; matrix
    algebra; network traffic; parallel algorithm; parallel
    algorithms; permutation groups; processor time;
    run-time overhead},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical},
}
@inproceedings{Woo:1991:PPF,
  author = {M.-l. Woo and R. A. Renaut},
  title = {Parallel power-of-two {FFTs} on hypercubes},
  crossref = {IEEE:1991:PSA},
  pages = {754--763},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4190 (Other numerical methods); C4230M
    (Multiprocessor interconnection); C4240P (Parallel
    programming and algorithm theory)},
  corpsource = {Dept. of Math., Arizona State Univ., Tempe, AZ, USA},
  keywords = {computational complexity; distance one algorithm;
    distance two algorithm; fast Fourier transforms;
    hypercube architectures; hypercube networks;
    interprocessor communications; ordered power-of-two
    fast Fourier transforms; packet transmission; parallel
    algorithms; parallel power of two FFTs; time
    complexity},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical},
}
@inproceedings{Narayanan:1991:ARD,
  author = {P. J. Narayanan},
  title = {Analysis of replicated data algorithms on processor
    array architectures},
  crossref = {IEEE:1991:PSA},
  pages = {764--773},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C1250 (Pattern recognition); C4230M (Multiprocessor
    interconnection); C4240P (Parallel programming and
    algorithm theory)},
  corpsource = {Dept. of Comput. Sci., Maryland Univ., College Park,
    MD, USA},
  keywords = {3-D mesh; array interconnection networks; computerised
    picture processing; data parallelism; data replication;
    hypercube connected connection machine; image
    processing algorithms; multiprocessor interconnection
    networks; nonglobal architectures; operation
    parallelism; parallel algorithms; processor array
    architectures; replicated data algorithms},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical; X Experimental},
}
@inproceedings{Tzeng:1991:DHR,
  author = {N.-F. Tzeng},
  title = {Design of a highly reliable cube-connected cycles
    architecture},
  crossref = {IEEE:1991:PSA},
  pages = {776--785},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4230M (Multiprocessor interconnection); C5220P
    (Parallel architecture); C5470 (Performance evaluation
    and testing)},
  corpsource = {Center for Adv. Comput. Studies, Univ. of Southwestern
    Louisiana, Lafayette, LA, USA},
  keywords = {area overhead; cross connections; fault tolerant
    computing; fault tolerant cube connected cycles
    architecture; multiprocessor interconnection networks;
    parallel architectures; processing element;
    reconfiguration procedure; reliable cube-connected
    cycles architecture; XCCC layout},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical},
}
@inproceedings{Taylor:1991:TFA,
  author = {V. E. Taylor and A. Ranade and D. G. Messerschmitt},
  title = {Three-dimensional finite-element analyses:
    implications for computer architectures},
  crossref = {IEEE:1991:PSA},
  pages = {786--795},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4140 (Linear algebra); C4185 (Finite element
    analysis); C4240P (Parallel programming and algorithm
    theory); C5220P (Parallel architecture); C6110P
    (Parallel programming); C6120 (File organisation)},
  corpsource = {Dept. of Electr. Eng. and Comput. Sci., California
    Univ., Berkeley, CA, USA},
  keywords = {columns; computer architectures; data path design;
    data structure; data structures; finite element
    analysis; floating-point units; matrix algebra; memory
    bandwidth; parallel architectures; parallel
    programming; programming theory; rows; sparse matrices;
    sparsity pattern},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical; T Theoretical or Mathematical},
}
@inproceedings{Tomkins:1991:MPC,
  author = {J. L. Tomkins and J. P. VanDyke},
  title = {Massively parallel computing and the mid-course
    tracking problem},
  crossref = {IEEE:1991:PSA},
  pages = {796--804},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C6110P (Parallel programming); C7150 (Military)},
  corpsource = {Sandia Nat. Labs., Albuquerque, NM, USA},
  keywords = {Cray X-MP single processor; massively parallel MIMD
    computing; mid-course tracking problem; military
    computing; nCUBE/ten computer; parallel programming;
    real-time solution; real-time systems; SDI; strategic
    defence initiative; TRC code},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical},
}
@inproceedings{Bucher:1991:MMA,
  author = {I. Y. Bucher and M. L. Simmons},
  title = {Measurement of memory access contentions in multiple
    vector processor systems},
  crossref = {IEEE:1991:PSA},
  pages = {806--817},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C1140C (Queueing theory); C5440 (Multiprocessor
    systems and techniques); C5470 (Performance evaluation
    and testing); C6150C (Compilers, interpreters and other
    processors)},
  corpsource = {Los Alamos Nat. Lab., NM, USA},
  keywords = {active processors; CRAY X-MP; CRAY Y-MP; CRAY-2;
    dynamic memory; memory access conflicts; memory bank
    conflicts; mixed strides; multiple vector processor
    systems; parallel machines; performance evaluation;
    program compilers; queueing theory; queuing model;
    static memory; stride one; vector length; vector loop
    unrolling; vector operations; vector performance},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical; T Theoretical or Mathematical},
}
%%% In the keyword list the compound "MIN-based" is written as a single
%%% hyphenated word, with no space after the hyphen, so that it prints and
%%% searches as one term.
@InProceedings{Chen:1991:CAS,
author = "Y.-C. Chen and A. V. Veidenbaum",
title = "Comparison and analysis of software and directory
coherence schemes",
crossref = "IEEE:1991:PSA",
pages = "818--829",
year = "1991",
bibdate = "Wed Apr 15 16:28:01 MDT 1998",
acknowledgement = ack-nhfb,
classification = "C6110P (Parallel programming); C6120 (File
organisation); C6185 (Simulation techniques)",
corpsource = "Center for Supercomputing Res. and Dev., Illinois
Univ., Urbana, IL, USA",
keywords = "buffer storage; cache coherence problem; digital
simulation; directory coherence; false sharing; hit
ratio; MIN-based large-scale multiprocessor system;
multiprocessor interconnection networks; nontrivial
cache line size; parallel programming; performance;
performance evaluation; shared memory traffic;
software; storage management; trace-driven
simulation",
sponsororg = "IEEE; ACM",
treatment = "P Practical",
}
%%% The second author's surname is spelled Ghafoor (double "o").
@InProceedings{Ahmad:1991:PPD,
author = "I. Ahmad and A. Ghafoor and K. Mehrotra",
title = "Performance prediction of distributed load balancing
on multicomputer systems",
crossref = "IEEE:1991:PSA",
pages = "830--839",
year = "1991",
bibdate = "Wed Apr 15 16:28:01 MDT 1998",
acknowledgement = ack-nhfb,
classification = "C1140C (Queueing theory); C5440 (Multiprocessor
systems and techniques); C5470 (Performance evaluation
and testing)",
corpsource = "Sch. of Comput. and Inf. Sci., Syracuse Univ., NY,
USA",
keywords = "analytical models; average execution queue length;
central server open queuing network; local execution;
multicomputer systems; multiprocessing systems; newly
arrived task; performance evaluation; performance
prediction; probability; queueing theory; queuing
parameters; response time; sender-initiated distributed
load balancing strategies; simulation models;
statistical analysis",
sponsororg = "IEEE; ACM",
treatment = "T Theoretical or Mathematical; X Experimental",
}
@inproceedings{Su:1991:EDE,
  author = {H.-M. Su and P.-C. Yew},
  title = {Efficient {Doacross} execution on distributed
    shared-memory multiprocessors},
  crossref = {IEEE:1991:PSA},
  pages = {842--853},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4240P (Parallel programming and algorithm theory);
    C6110P (Parallel programming); C6120 (File
    organisation); C6150C (Compilers, interpreters and
    other processors)},
  corpsource = {Center for Supercomput. Res. and Dev., Illinois Univ.,
    Urbana, IL, USA},
  keywords = {buffer location; compile time; compiler algorithms;
    direct communication; distributed shared-memory
    multiprocessors; Doacross execution; Doacross loop; DSM
    architecture; message buffers; nearest shared memory;
    parallel algorithms; parallel programming; program
    compilers; programming theory; static message passing;
    storage management; UMA architecture; uniform memory
    access},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical; T Theoretical or Mathematical},
}
@inproceedings{Granston:1991:DRA,
  author = {E. D. Granston and A. V. Veidenbaum},
  title = {Detecting redundant accesses to array data},
  crossref = {IEEE:1991:PSA},
  pages = {854--865},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C4240P (Parallel programming and algorithm theory);
    C6110P (Parallel programming); C6120 (File
    organisation); C6150C (Compilers, interpreters and
    other processors)},
  corpsource = {Center for Supercomputing Res. and Dev., Illinois
    Univ., Urbana, IL, USA},
  keywords = {compile-time algorithm; conditionals; dependence
    analysis; flow analysis; flow equations;
    interval-analysis; parallel algorithms; parallel
    constructs; parallel programming; program compilers;
    programming theory; redundancy analysis; redundant
    global memory accesses; redundant reference; storage
    management; vector constructs},
  sponsororg = {IEEE; ACM},
  treatment = {P Practical; T Theoretical or Mathematical},
}
%%% The keyword "Harwell-Boeing" is kept whole on one line: BibTeX turns a
%%% line break inside a field value into a space, so breaking after the
%%% hyphen would yield "Harwell- Boeing".
@InProceedings{Venugopal:1991:EPS,
author = "S. Venugopal and V. K. Naik",
title = "Effects of partitioning and scheduling sparse matrix
factorization on communication and load balance",
crossref = "IEEE:1991:PSA",
pages = "866--875",
year = "1991",
bibdate = "Wed Apr 15 16:28:01 MDT 1998",
acknowledgement = ack-nhfb,
classification = "C4140 (Linear algebra); C4240P (Parallel programming
and algorithm theory)",
corpsource = "Dept. of Comput. Sci., Rutgers Univ., New Brunswick,
NJ, USA",
keywords = "communication; distributed memory systems;
Harwell-Boeing data set; load balance; load imbalance;
matrix algebra; parallel algorithms; partitioning;
scheduling; scheduling sparse matrix factorization;
wrap-mapped column assignment",
sponsororg = "IEEE; ACM",
treatment = "X Experimental",
}
@inproceedings{Myers:1991:MSR,
  author = {T. Myers and E. Williams},
  title = {Mass storage requirements in the intelligence
    community},
  crossref = {IEEE:1991:PSA},
  pages = {878--889},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C5320 (Digital storage); C6110 (Systems analysis and
    programming)},
  corpsource = {Dept. of Defense, Ft. Meade, MD, USA},
  keywords = {digital storage; intelligence community; mass storage
    systems; research and development; systems analysis},
  sponsororg = {IEEE; ACM},
  treatment = {G General Review},
}
@inproceedings{Bowen:1991:VMT,
  author = {N. S. Bowen and D. K. Pradhan},
  title = {A virtual memory translation mechanism to support
    checkpoint and rollback recovery},
  crossref = {IEEE:1991:PSA},
  pages = {890--899},
  year = {1991},
  bibdate = {Wed Apr 15 16:28:01 MDT 1998},
  acknowledgement = ack-nhfb,
  classification = {C5470 (Performance evaluation and testing); C6120
    (File organisation)},
  corpsource = {IBM Thomas J. Watson Res. Center, Yorktown Heights,
    NY, USA},
  keywords = {address space; checkpoint interval size; checkpoint
    recovery; fault tolerant computing; rollback recovery;
    supercomputer applications; virtual memory translation;
    virtual storage},
  sponsororg = {IEEE; ACM},
  treatment = {T Theoretical or Mathematical; X Experimental},
}
%%% Six authors, each written as "Initial Surname" and separated by the
%%% keyword "and"; a surname and its initial must never be split across an
%%% "and", or BibTeX will count them as two separate people.  The umlaut in
%%% the fourth author's surname is entered as a braced accent command.
@InProceedings{Annaratone:1991:KDM,
author = "M. Annaratone and M. Fillo and M. Halbherr and R.
R{\"u}hl and P. Steiner and M. Viredaz",
title = "The {K2} distributed memory parallel processor:
architecture, compiler and operating system",
crossref = "IEEE:1991:PSA",
pages = "900--909",
year = "1991",
bibdate = "Wed Apr 15 16:28:01 MDT 1998",
acknowledgement = ack-nhfb,
classification = "C5220P (Parallel architecture); C5440
(Multiprocessor systems and techniques); C6110P
(Parallel programming); C6150C (Compilers, interpreters
and other processors); C6150J (Operating systems);
C6150N (Distributed systems)",
corpsource = "Swiss Federal Inst. of Technol., Zurich, Switzerland",
keywords = "architecture; K2 distributed memory parallel
processor; multi tasking operating system; multi user
operating system; multiprogramming; operating systems
(computers); parallel architectures; parallel machines;
parallel programming; parallelizing compiler; program
compilers; time-sharing operating system; workbench
machine",
sponsororg = "IEEE; ACM",
treatment = "P Practical",
}
%%% ====================================================================
%%% These entries must occur last because they are cross-referenced by
%%% entries above.
@proceedings{IEEE:1991:PSA,
  editor = {{IEEE}},
  booktitle = {Proceedings, Supercomputing '91: Albuquerque, New
    Mexico, November 18--22, 1991},
  title = {Proceedings, Supercomputing '91: Albuquerque, New
    Mexico, November 18--22, 1991},
  publisher = pub-IEEE,
  address = pub-IEEE:adr,
  pages = {xxiii + 917},
  year = {1991},
  ISBN = {0-8186-9158-1 (IEEE case), 0-8186-2158-3 (IEEE paper),
    0-8186-6158-5 (IEEE microfiche), 0-89791-459-7 (ACM)},
  ISBN-13 = {978-0-8186-9158-4 (IEEE case), 978-0-8186-2158-1 (IEEE
    paper), 978-0-8186-6158-7 (IEEE microfiche),
    978-0-89791-459-8 (ACM)},
  LCCN = {QA76.5 .S894 1991},
  bibdate = {Fri Aug 30 08:01:51 MDT 1996},
  bibsource = {University of California MELVYL catalog.},
  note = {ACM order number 415913. IEEE Computer Society Press
    order number 2158. IEEE catalog number 91CH3058-5.},
  acknowledgement = ack-nhfb,
  classification = {C5440 (Multiprocessor systems and techniques); C5470
    (Performance evaluation and testing); C6110P (Parallel
    programming)},
  keywords = {combinatorial algorithms; data dependence; distributed
    memory code generation; high school environment;
    latency tolerance; memory access; numerical algorithms;
    parallel processing; parallel programming; performance
    evaluation; performance tools; processor design;
    program analysis; storage hierarchy optimization;
    supercomputer benchmarks; supercomputer congresses;
    supercomputing; system issues},
}