%%%     address-1       = "Computer Science Department
%%%                        University of Tennessee
%%%                        Knoxville, TN 37996-1301
%%%                        USA
%%%                        and
%%%                        PO Box 2008, Building 6012
%%%                        Mathematical Science Section
%%%                        Oak Ridge National Laboratory
%%%                        Oak Ridge, TN  37821-6367
%%%                        USA",
%%%     address-2       =  "University of Utah
%%%                        Department of Mathematics, 110 LCB
%%%                        155 S 1400 E RM 233
%%%                        Salt Lake City, UT 84112-0090
%%%                        USA",
%%%     address-3       =  "Center for High Performance Computing
%%%                        University of Utah
%%%                        Salt Lake City, UT 84112
%%%                        USA",
%%%     telephone-1     = "+1 423 974-8295 (UTK), +1 423 574-3148 (ORNL)",
%%%     telephone-2     = "+1 801 581 5254",
%%%     telephone-3     = "+1 801 581 3173",
%%%     FAX-1           = "+1 423 974-8296 (UTK)",
%%%     FAX-3           = "+1 801 585 5366",
%%%     URL-1           = "",
%%%     URL-2           = "",
%%%     email-1         = "dongarra at (Internet),
%%%                        dongarra at (Internet)",
%%%     email-2         = "beebe at, beebe at,
%%%                        beebe at (Internet)",
%%%     email-3         = "stefano at (Internet)",
%%%     docstring       = "This is a (still incomplete) bibliography
%%%                        of the publications of Jack J. Dongarra.
%%%                        On 29 March 2022, ACM announced that the 2021
%%%                        Alan M. Turing Award is given to Jack
%%%                        Dongarra for ``Pioneering Concepts and
%%%                        Methods Which Resulted in World-Changing
%%%                        Computations''.
%%%                        At version 1.296, the year coverage looked
%%%                        like this:
%%%                             1976 (   1)    1993 (  35)    2010 (  29)
%%%                             1977 (   1)    1994 (  42)    2011 (  33)
%%%                             1978 (   2)    1995 (  47)    2012 (  23)
%%%                             1979 (   2)    1996 (  56)    2013 (  24)
%%%                             1980 (   2)    1997 (  61)    2014 (  12)
%%%                             1981 (   1)    1998 (  40)    2015 (  18)
%%%                             1982 (   2)    1999 (  34)    2016 (  12)
%%%                             1983 (   6)    2000 (  27)    2017 (  12)
%%%                             1984 (  26)    2001 (  53)    2018 (  20)
%%%                             1985 (  13)    2002 (  47)    2019 (  16)
%%%                             1986 (  19)    2003 (  47)    2020 (  12)
%%%                             1987 (  26)    2004 (  31)    2021 (   5)
%%%                             1988 (  21)    2005 (  24)    2022 (  12)
%%%                             1989 (  26)    2006 (  20)    2023 (   5)
%%%                             1990 (  26)    2007 (  29)    2024 (   6)
%%%                             1991 (  40)    2008 (  32)
%%%                             1992 (  40)    2009 (  26)
%%%                             19xx (   1)
%%%                             Article:        463
%%%                             Book:            36
%%%                             InBook:           1
%%%                             InCollection:    28
%%%                             InProceedings:  185
%%%                             Manual:           3
%%%                             Misc:             9
%%%                             PhdThesis:        1
%%%                             Proceedings:    184
%%%                             TechReport:     232
%%%                             Unpublished:      3
%%%                             Total entries: 1145
%%%                        In 2014, Jack Dongarra received the ACM-IEEE
%%%                        Computer Society Ken Kennedy award (announced
%%%                        on page 18 of the September 2014 issue of
%%%                        Communications of the ACM).
%%%                        This file is available as part of the BibNet
%%%                        Project.  The master copy is available for
%%%                        public access on ftp.math.utah.edu in the
%%%                        directory tree /pub/bibnet/authors.  It is
%%%                        mirrored to netlib.bell-labs.com in the
%%%                        directory tree /netlib/bibnet/authors, from
%%%                        which it is available via anonymous ftp and
%%%                        the Netlib service.
%%%                        This bibliography was collected from
%%%                        multiple sources:
%%%                        * the authors' own files;
%%%                        * Jack Dongarra's publications page at
%%%                        * the TeX User Group bibliography
%%%                          collection on ftp.math.utah.edu in
%%%                          /pub/tex/bib;
%%%                        * the very large Computer Science
%%%                          bibliography collection on ftp.ira.uka.de
%%%                          in /pub/bibliography, to which many people
%%%                          have contributed;
%%%                        * the ACM Computing Archive CD ROM,
%%%                          covering literature of the 1980s;
%%%                        * the IEEE Inspec CD ROMs for 1989--1996,
%%%                          and the IEEE Inspec database (1979--1996);
%%%                        * Internet library catalogs, including
%%%                          University of California MELVYL, Stanford
%%%                          University RLIN, Library of Congress,
%%%                          OCLC;
%%%                        * the Compendex database;
%%%                        * the OCLC Contents1st and Article1st
%%%                          databases; and
%%%                        * the AMS MathSciNet database.
%%%                        BibTeX citation tags are uniformly chosen
%%%                        as name:year:abbrev, where name is the
%%%                        family name of the first author or editor,
%%%                        year is a 4-digit number, and abbrev is a
%%%                        3-letter condensation of important title
%%%                        words. Citation tags were automatically
%%%                        generated by software developed for the
%%%                        BibNet Project.
%%%                        In this bibliography, entries are sorted
%%%                        first by ascending year, and within each
%%%                        year, alphabetically by author or editor,
%%%                        and then, if necessary, by the 3-letter
%%%                        abbreviation at the end of the BibTeX
%%%                        citation tag, using the bibsort -byyear
%%%                        utility.  Cross-referenced proceedings
%%%                        entries appear at the end, because of a
%%%                        restriction in the current BibTeX.
%%%                        The checksum field above contains a CRC-16
%%%                        checksum as the first value, followed by the
%%%                        equivalent of the standard UNIX wc (word
%%%                        count) utility output of lines, words, and
%%%                        characters.  This is produced by Robert
%%%                        Solovay's checksum utility.",
%%%  }
%%% Acknowledgement abbreviations:
@String{ack-nhfb = "Nelson H. F. Beebe,
                    University of Utah,
                    Department of Mathematics, 110 LCB,
                    155 S 1400 E RM 233,
                    Salt Lake City, UT 84112-0090, USA,
                    Tel: +1 801 581 5254,
                    e-mail: \path|[email protected]|,
                            \path|[email protected]|,
                            \path|[email protected]| (Internet),
                    URL: \path||"}

@String{ack-nj =   "Norbert Juffa,
                  2445 Mission College Blvd.
                  Santa Clara, CA 95054
                  email: \path=[email protected]="}

%%% ====================================================================
%%% Institutional abbreviations:
@String{inst-ANL                = "Argonne National Laboratory"}
@String{inst-ANL:adr            = "9700 South Cass Avenue, Argonne, IL
                                  60439-4801, USA"}

@String{inst-ANL-AM             = "Applied Mathematics Division, Argonne
                                  National Laboratory"}
@String{inst-ANL-AM:adr         = "9700 South Cass Avenue, Argonne, IL
                                  60439-4801, USA"}

@String{inst-ANL-MCS            = "Mathematics and Computer Science
                                  Division, Argonne National Laboratory"}
@String{inst-ANL-MCS:adr        = "9700 South Cass Avenue, Argonne, IL
                                  60439-4801, USA"}

@String{inst-ATT-BELL           = "AT\&T Bell Laboratories"}
@String{inst-ATT-BELL:adr       = "Murray Hill, NJ, USA"}

@String{inst-CS-U-Tenn          = "Department of Computer Science, University of
                                  Tennessee"}
@String{inst-CS-U-Tenn:adr      = "Knoxville, TN, USA"}

@String{inst-HARWELL            = "{AERE Harwell} Laboratory"}
@String{inst-HARWELL:adr        = "Chilton, Oxon, England"}

@String{inst-INRIA              = "INRIA (Institut National de Recherche en
                                  Informatique et en Automatique)"}
@String{inst-INRIA:adr          = "Rocquencourt, France"}

@String{inst-MSS-ORNL           = "Mathematical Sciences Section, Oak Ridge
                                  National Laboratory"}
@String{inst-MSS-ORNL:adr       = "Oak Ridge, TN, USA"}

@String{inst-ORNL               = "Oak Ridge National Laboratory"}
@String{inst-ORNL:adr           = "Oak Ridge, TN, USA"}

@String{inst-UIUC-CSRD          = "University of Illinois at Urbana-Champaign,
                                  Center for Supercomputing Research and
                                  Development"}
@String{inst-UIUC-CSRD:adr      = "Urbana, IL 61801, USA"}

@String{inst-UTK                = "University of Tennessee, Knoxville"}
@String{inst-UTK:adr            = "Knoxville, TN 37996, USA"}

@String{inst-UTK-CS             = "Department of Computer Science,
                                  University of Tennessee, Knoxville"}
@String{inst-UTK-CS:adr         = "Knoxville, TN 37996, USA"}

%%% ====================================================================
%%% Journal abbreviations:
@String{j-ACTA-NUMERICA         = "Acta Numerica"}

@String{j-AMER-MATH-MONTHLY     = "American Mathematical Monthly"}

@String{j-ANN-HIST-COMPUT       = "Annals of the History of Computing"}

@String{j-APPL-ALGEBRA-ENG-COMMUN-COMPUT = "Applicable algebra in engineering,
                                  communication and computing"}

@String{j-APPL-MATH-COMP        = "Applied Mathematics and Computation"}

@String{j-APPL-MATH-COMP-SCI    = "Applied Mathematics and Computer Science"}

@String{j-APPL-NUM-MATH         = "Applied Numerical Mathematics: Transactions
                                  of IMACS"}

@String{j-BULL-AMS              = "Bulletin of the American Mathematical
                                  Society"}

@String{j-CACM                  = "Communications of the ACM"}

@String{j-CCPE                  = "Concurrency and Computation: Prac\-tice and
                                  Experience"}

@String{j-COMP-ARCH-NEWS        = "ACM SIGARCH Computer Architecture News"}

@String{j-COMP-COMM             = "Computer Communications"}

@String{j-COMP-J                = "The Computer Journal"}

@String{j-COMPUT-MATH-APPL      = "Computers and Mathematics with Applications"}

@String{j-COMP-PHYS-COMM        = "Computer Physics Communications"}

@String{j-COMPUT-PHYS           = "Computers in Physics"}

@String{j-COMPUT-SCI-ENG        = "Computing in Science and Engineering"}

@String{j-COMPUTER              = "Computer"}

@String{j-CPE                   = "Concurrency: practice and experience"}

@String{j-CRAY-CHANNELS         = "CRAY Channels"}

@String{j-D-LIB-MAGAZINE        = "D-Lib magazine: the magazine of the Digital
                                  Library Forum"}

@String{j-FUT-GEN-COMP-SYS      = "Future Generation Computer Systems"}

@String{j-IBM-JRD               = "IBM Journal of Research and Development"}

@String{j-IEEE-ANN-HIST-COMPUT  = "IEEE Annals of the History of Computing"}

@String{j-IEEE-COMPUT-SCI-ENG   = "IEEE Computational Science \& Engineering"}

@String{j-IEEE-PAR-DIST-TECH    = "IEEE parallel and distributed
                                  technology: systems and applications"}

@String{j-IEEE-POT              = "IEEE Potentials"}

@String{j-IEEE-SOFTWARE         = "IEEE Software"}

@String{j-IEEE-SPECTRUM         = "IEEE Spectrum"}

@String{j-IEEE-TRANS-COMPUT     = "IEEE Transactions on Computers"}

@String{j-IEEE-TRANS-PAR-DIST-SYS = "IEEE Transactions on Parallel and
                                    Distributed Systems"}

@String{j-IJHPCA                = "The International Journal of High Performance
                                  Computing Applications"}

@String{j-IJSA                  = "International Journal of Supercomputer
                                  Applications"}

@String{j-IJSAHPC               = "The International Journal of
                                  Supercomputer Applications and High
                                  Performance Computing"}

@String{j-INT-J-FOUND-COMP-SCI  = "International Journal of Foundations of
                                  Computer Science"}

@String{j-INT-J-PARALLEL-PROG   = "International Journal of Parallel
                                  Programming"}

@String{j-J-COMPUT-APPL-MATH    = "Journal of Computational and Applied
                                  Mathematics"}

@String{j-J-COMPUT-PHYS         = "Journal of Computational Physics"}

@String{j-J-COMPUT-SCI          = "Journal of Computational Science"}

@String{j-J-DIGITAL-INFO        = "Journal of Digital Information"}

@String{j-J-INFO-SCI-ENG        = "Journal of Information Science and Engineering"}

@String{j-J-GRID-COMP           = "Journal of Grid Computing"}

@String{j-J-PAR-DIST-COMP       = "Journal of Parallel and Distributed
                                  Computing"}

@String{j-J-SUPERCOMPUTING      = "The Journal of Supercomputing"}

@String{j-LECT-NOTES-COMP-SCI   = "Lecture Notes in Computer Science"}

@String{j-LINEAR-ALGEBRA-APPL   = "Linear Algebra and its Applications"}

@String{j-MATH-COMPUT           = "Mathematics of Computation"}

@String{j-NATL-SCI-REV          = "National Science Review"}

@String{j-NUMER-ALGORITHMS      = "Numerical Algorithms"}

@String{j-NUM-LIN-ALG-APPL      = "Numerical Linear Algebra with Applications"}

@String{j-PARALLEL-COMPUTING    = "Parallel Computing"}

@String{j-PARALLEL-DIST-COMP-PRACT = "Parallel and Distributed Computing
                                  Practices"}

@String{j-PARALLEL-PROCESS-LETT = "Parallel Processing Letters"}

@String{j-PHILOS-TRANS-R-SOC-LOND-SER-A = "Philosophical transactions of the
                                  Royal Society of London Series A"}

@String{j-PROC-IEEE             = "Proceedings of the IEEE"}

@String{j-PROC-R-SOC-LOND-SER-A = "Proceedings of the Royal Society of London.
                                  Series A"}

@String{j-PROC-SPIE             = "Proceedings of the SPIE --- The
                                  International Society for Optical
                                  Engineering"}

@String{j-SCI-COMPUT            = "Scientific Computing"}

@String{j-SCI-PROG              = "Scientific Programming"}

@String{j-SIAM-J-MAT-ANA-APPL   = "SIAM Journal on Matrix Analysis and
                                  Applications"}

@String{j-SIAM-J-NUMER-ANAL     = "SIAM Journal on Numerical Analysis"}

@String{j-SIAM-J-SCI-COMP       = "SIAM Journal on Scientific Computing"}

@String{j-SIAM-J-SCI-STAT-COMP  = "SIAM Journal on Scientific and
                                  Statistical Computing"}

@String{j-SIAM-NEWS             = "SIAM News"}

@String{j-SIAM-REVIEW           = "SIAM Review"}

@String{j-SIGMETRICS            = "ACM SIGMETRICS Performance Evaluation Review"}

@String{j-SIGNUM                = "ACM SIGNUM Newsletter"}

@String{j-SIGPLAN               = "ACM SIG{\-}PLAN Notices"}

@String{j-SIGSOFT               = "ACM SIGSOFT Software Engineering Notes"}

@String{j-SIMULATION            = "Simulation"}

@String{j-SPE                   = "Soft{\-}ware\emdash Prac{\-}tice
                                  and Experience"}

@String{j-SUPERCOMPUTER         = "Supercomputer"}

@String{j-SUPERCOMPUTING-REVIEW = "Supercomputing Review"}

@String{j-SUPERFRI              = "Supercomputing Frontiers and Innovations"}

@String{j-TECHNIQUE-SCI-INFORMATIQUES = "Technique et Science Informatiques"}

@String{j-TOMS                  = "ACM Transactions on Mathematical
                                  Software"}

@String{j-TOPC                  = "ACM Transactions on Parallel Computing
                                  (TOPC)"}

%%% ====================================================================
%%% Publishers and their addresses:
@String{pub-ACADEMIC            = "Academic Press"}
@String{pub-ACADEMIC:adr        = "New York, NY, USA"}

@String{pub-ACM                 = "ACM Press"}
@String{pub-ACM:adr             = "New York, NY 10036, USA"}

@String{pub-ASME                = "American Society of Mechanical Engineers"}
@String{pub-ASME:adr            = "345 E. 47th St., New York, NY 10017, USA"}

@String{pub-AW                  = "Ad{\-d}i{\-s}on-Wes{\-l}ey"}
@String{pub-AW:adr              = "Reading, MA, USA"}

@String{pub-CHAPMAN-HALL        = "Chapman and Hall, Ltd."}
@String{pub-CHAPMAN-HALL:adr    = "London, UK"}

@String{pub-CHAPMAN-HALL-CRC    = "Chapman and Hall/CRC"}
@String{pub-CHAPMAN-HALL-CRC:adr = "Boca Raton, FL, USA"}

@String{pub-CLARENDON           = "Clarendon Press"}
@String{pub-CLARENDON:adr       = "Oxford, UK"}

@String{pub-CNRI                = "Corporation for National Research
                                  Initiatives"}
@String{pub-CNRI:adr            = "Reston, VA, USA"}

@String{pub-CRC                 = "CRC Press"}
@String{pub-CRC:adr             = "2000 N.W. Corporate Blvd., Boca Raton,
                                  FL 33431-9868, USA"}

@String{pub-DEKKER              = "Marcel Dekker"}
@String{pub-DEKKER:adr          = "New York, NY, USA"}

@String{pub-EH                  = "Ellis Horwood"}
@String{pub-EH:adr              = "New York, NY, USA"}

@String{pub-ELSEVIER            = "Elsevier"}
@String{pub-ELSEVIER:adr        = "Amsterdam, The Netherlands"}

@String{pub-IEE                 = "IEE"}
@String{pub-IEE:adr             = "London, UK"}

@String{pub-IEEE                = "IEEE Computer Society Press"}
@String{pub-IEEE:adr            = "1109 Spring Street, Suite 300, Silver
                                  Spring, MD
                                  20910, USA"}

@String{pub-KLUWER              = "Kluwer Academic Publishers Group"}
@String{pub-KLUWER:adr          = "Norwell, MA, USA, and Dordrecht,
                                  The Netherlands"}

@String{pub-LONGMAN             = "Longman Scientific and Technical"}
@String{pub-LONGMAN:adr         = "Harlow, Essex, UK"}

@String{pub-MARCEL-DEKKER       = "Marcel Dekker"}
@String{pub-MARCEL-DEKKER:adr   = "New York, NY, USA"}

@String{pub-MIT                 = "MIT Press"}
@String{pub-MIT:adr             = "Cambridge, MA, USA"}

@String{pub-MORGAN-KAUFMANN     = "Morgan Kaufmann Publishers"}
@String{pub-MORGAN-KAUFMANN:adr = "San Francisco, CA, USA"}

@String{pub-NH                  = "North-Hol{\-}land"}
@String{pub-NH:adr              = "Amsterdam, The Netherlands"}

@String{pub-ORA                 = "O'Reilly \& Associates, Inc."}
@String{pub-ORA:adr             = "103a Morris Street,
                                  Sebastopol, CA 95472,
                                  Tel: +1 707 829 0515,
                                  90 Sherman Street,
                                  Cambridge, MA 02140,
                                  Tel: +1 617 354 5800"}

@String{pub-OXFORD              = "Oxford University Press"}
@String{pub-OXFORD:adr          = "Walton Street, Oxford OX2 6DP, UK"}

@String{pub-PH                  = "Pren{\-}tice-Hall"}
@String{pub-PH:adr              = "Englewood Cliffs, NJ 07632, USA"}

@String{pub-SIAM                = "Society for Industrial and Applied
                                  Mathematics"}
@String{pub-SIAM:adr            = "Philadelphia, PA, USA"}

@String{pub-SV                  = "Spring{\-}er-Ver{\-}lag"}
@String{pub-SV:adr              = "Berlin, Germany~/ Heidelberg, Germany~/
                                  London, UK~/ etc."}

@String{pub-WESTERN-PERIODICALS = "Western Periodicals Co."}
@String{pub-WESTERN-PERIODICALS:adr = "North Hollywood, CA"}

@String{pub-WILEY               = "Wiley"}
@String{pub-WILEY:adr           = "New York, NY, USA"}

@String{pub-WORLD-SCI           = "World Scientific Publishing Co."}
@String{pub-WORLD-SCI:adr       = "Singapore; Philadelphia, PA, USA; River
                                  Edge, NJ, USA"}

%%% Series abbreviations:
@String{ser-LNAI                = "Lecture Notes in Artificial Intelligence"}

@String{ser-LNCS                = "Lecture Notes in Computer Science"}

@String{type-CSDTR              = "Computer Science Dept. Technical Report"}

@String{type-MCSDTM             = "Mathematics and Computer Science
                                  Division Technical Memo"}

@String{type-MCSDTR             = "Mathematics and Computer Science Division
                                  Technical Report"}

@String{type-TM                 = "Technical Memorandum"}

@String{type-TR                 = "Technical Report"}

  author =       "B. T. Smith and J. M. Boyle and J. J. Dongarra and B.
                 S. Garbow and Y. Ikebe and V. C. Klema and C. B.
                 Moler",
  title =        "Matrix Eigensystem Routines: {EISPACK} Guide",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "vii + 551",
  year =         "1976",
  CODEN =        "LNCSD9",
  ISBN =         "0-387-07546-1",
  ISBN-13 =      "978-0-387-07546-4",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA193 .M371 1976",
  MRclass =      "65F15 (65-04)",
  MRnumber =     "58 13662a",
  bibdate =      "Thu Dec 19 15:02:06 1996",
  bibsource =    "",
  note =         "See also \cite{Garbow:1977:MER}.",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "EISPACK",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "B. S. Garbow and J. M. Boyle and J. J. Dongarra and C.
                 B. Moler",
  title =        "Matrix Eigensystem Routines: {EISPACK} Guide
                 Extension",
  volume =       "51",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "viii + 343",
  year =         "1977",
  ISBN =         "0-387-08254-9, 3-540-08254-9",
  ISBN-13 =      "978-0-387-08254-7, 978-3-540-08254-5",
  LCCN =         "QA193 .M381, QA267.A1,L43 no. 51",
  MRclass =      "65F15 (65-04)",
  MRnumber =     "58 13662b",
  bibdate =      "Mon Jan 15 10:36:06 1996",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  annote =       "Es wird das Eispack-Programmsystem zur Loesung von
                 Eigenwertproblemen beschrieben. Ferner werden Hinweise
                 zur Behandlung verschiedener Matrixtypen mit diesem
                 System gegeben. Ausserdem werden noch
                 Laufzeitabschaetzungen angegeben.",
  descriptor =   "Eigensystem, Eispack, Eigenvektor, Eigenwert",
  keywords =     "book, nla, eig, eispack, software",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "Some {LINPACK} Timings on the {CRAY-1}",
  crossref =     "Buzbee:1978:PLW",
  pages =        "58--75",
  year =         "1978",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and J. R. Bunch and C. B. Moler and G.
                 W. Stewart",
  title =        "{LINPACK} Users' Guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "320",
  year =         "1979",
  DOI =          "",
  ISBN =         "0-89871-172-X (paperback)",
  ISBN-13 =      "978-0-89871-172-1 (paperback)",
  LCCN =         "QA76.73 .L22 L5 1979; QA184 .L56 1982; QA214 .L56",
  bibdate =      "Mon Dec 13 15:18:20 1993",
  bibsource =    "",
  abstract =     "The authors of this carefully structured guide are the
                 principal developers of LINPACK, a unique package of
                 Fortran subroutines for analyzing and solving various
                 systems of simultaneous linear algebraic equations and
                 linear least squares problems. This guide supports both
                 the casual user of LINPACK who simply requires a
                 library subroutine, and the specialist who wishes to
                 modify or extend the code to handle special problems.
                 It is also recommended for classroom work.",
  acknowledgement = ack-nhfb,
  GWS-number =   "B2",
  keywords =     "book, Cholesky decomposition, cond, downd, linpack,
                 lud, lud, math, nla, qrd, qrd, soft, software, survey,
                 svd, svd, upd, updating",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "LINPACK (Computer system); Equations, Simultaneous;
                 Data processing; Matrices; Data processing.; LINPACK
                 (Computer system); LINPACK (Syst{\`e}me d'ordinateur);
                 {\'E}quations simultan{\'e}es; Informatique",
  tableofcontents = "General matrices \\
                 Band matrices \\
                 Positive definite matrices \\
                 Positive definite band matrices \\
                 Symmetric indefinite matrices \\
                 Triangular matrices \\
                 Tridiagonal matrices \\
                 The Cholesky decomposition \\
                 The $QR$ decomposition \\
                 Updating $QR$ and Cholesky decompositions \\
                 The singular value decomposition \\
                 References \\
                 Basic linear algebra subprograms \\
                 Timing data \\
                 Program listings \\
                 BLA listings",
  xxauthor =     "J. J. Dongarra and C. B. Moler and J. R. Bunch and G.
                 W. Stewart",

  author =       "J. J. Dongarra and A. R. Hinds",
  title =        "Unrolling Loops in {FORTRAN}",
  journal =      j-SPE,
  volume =       "9",
  number =       "3",
  pages =        "219--226",
  month =        mar,
  year =         "1979",
  CODEN =        "SPEXBL",
  DOI =          "",
  ISSN =         "0038-0644 (print), 1097-024X (electronic)",
  ISSN-L =       "0038-0644",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6140D (High level languages)",
  corpsource =   "Argonne Nat. Lab., Argonne, IL, USA",
  fjournal =     "Software---Practice and Experience",
  journal-URL =  "",
  keywords =     "compilers; FORTRAN; short program loops; unrolling",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. J. Dongarra",
  title =        "Improving the Accuracy of Computed Matrix
                 Eigenvalues",
  type =         "{Ph.D.} thesis",
  school =       "Department of Computer Science, University of New
                 Mexico",
  address =      "Albuquerque, NM, USA",
  year =         "1980",
  bibdate =      "Wed Jan 14 05:30:39 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  advisor =      "Cleve B. Moler",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and C. B. Moler and J. H. Wilkinson",
  title =        "Improving the Accuracy of Computed Eigenvalues and
                 Eigenvectors",
  type =         "Technical Report",
  number =       "ANL-81-43",
  institution =  inst-ANL-AM,
  address =      inst-ANL-AM:adr,
  year =         "1981",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Published as
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "{Algorithm 589}: {SICEDR}: {A FORTRAN} Subroutine for
                 Improving the Accuracy of Computed Matrix Eigenvalues",
  journal =      j-TOMS,
  volume =       "8",
  number =       "4",
  pages =        "371--375",
  month =        dec,
  year =         "1982",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "B0290H (Linear algebra); C4140 (Linear algebra); C7310
                 (Mathematics computing)",
  corpsource =   "Argonne Nat. Lab., Argonne, IL, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "algorithms, matrix eigensystems, iterative method;
                 eigensystems improvement; eigenvalues and
                 eigenfunctions; eigenvector; FORTRAN subroutine;
                 improvement; iterative; iterative method; matrix
                 eigenvalues; numerical methods; Schur decomposition
                 technique; SICEDR; subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; T Theoretical or Mathematical",

  author =       "J. J. Dongarra and J. R. Gabriel and J. H. Wilkinson",
  title =        "The Eigenvalue Problem for {Hermitian} Matrices with
                 Time Reversal Symmetry",
  type =         "Technical Memorandum",
  number =       "3",
  institution =  inst-ANL-MCS,
  address =      inst-ANL-MCS:adr,
  year =         "1982",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Published as \cite{Dongarra:1984:EPH} where D. D.
                 Koelling is also an author.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and R. Hiromoto",
  title =        "A Collection of Parallel Linear Equations Routines for
                 the {Denelcor HEP}",
  type =         "??",
  number =       "ANL/MCS-TM-15",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        sep,
  year =         "1983",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and C. B. Moler and J. H. Wilkinson",
  title =        "Improving the Accuracy of Computed Eigenvalues and
                 Eigenvectors",
  journal =      j-SIAM-J-NUMER-ANAL,
  volume =       "20",
  number =       "1",
  pages =        "23--45",
  month =        feb,
  year =         "1983",
  CODEN =        "SJNAEQ",
  DOI =          "",
  ISSN =         "0036-1429 (print), 1095-7170 (electronic)",
  ISSN-L =       "0036-1429",
  MRclass =      "65F15",
  MRnumber =     "84c:65063",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "B0290B (Error analysis in numerical methods); B0290H
                 (Linear algebra); C4110 (Error analysis in numerical
                 methods); C4140 (Linear algebra)",
  corpsource =   "Argonne Nat. Lab., Argonne, IL, USA",
  fjournal =     "SIAM Journal on Numerical Analysis",
  journal-URL =  "",
  keywords =     "accuracy; computed eigenvalues; computed eigenvectors;
                 convergence of numerical methods; eigenfunctions;
                 eigenvalues and; EISPACK; error analysis; extended;
                 matrix algebra; matrix eigenvalues; matrix
                 eigenvectors; Newton's method; nla, eig, iterative
                 refinement; numerical; numerical accuracy; numerically
                 stable implementation; precision arithmetic; residuals;
                 standard; subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "M. Lotkin",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra",
  title =        "Improving the Accuracy of Computed Singular Values",
  journal =      j-SIAM-J-SCI-STAT-COMP,
  volume =       "4",
  number =       "4",
  pages =        "712--719",
  month =        dec,
  year =         "1983",
  CODEN =        "SIJCD4",
  DOI =          "",
  ISSN =         "0196-5204",
  MRclass =      "65F10",
  MRnumber =     "85a:65054",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "B0290F (Interpolation and function approximation);
                 C4130 (Interpolation and function approximation)",
  corpsource =   "Math. and Computer Sci. Div., Argonne Nat. Lab.,
                 Argonne, IL, USA",
  fjournal =     "SIAM Journal on Scientific and Statistical Computing",
  journal-URL =  "",
  keywords =     "accuracy; computations; computed singular values;
                 eigenvalue; eigenvalues and eigenfunctions; extended
                 precision; iterative improvement; iterative methods;
                 linear; linear systems; Newton's method; nla, svd,
                 iterative refinement; singular vectors; systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "Beny Neta",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra and C. B. Moler and J. H. Wilkinson",
  title =        "Improving the Accuracy of Computed Eigenvalues and
                 Eigenvectors",
  journal =      j-SIGNUM,
  volume =       "20",
  pages =        "23--45",
  year =         "1983",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of various computers using standard linear
                 equations software in a {FORTRAN} environment",
  journal =      j-COMP-ARCH-NEWS,
  volume =       "11",
  number =       "5",
  pages =        "22--27",
  month =        dec,
  year =         "1983",
  CODEN =        "CANED2",
  ISSN =         "0163-5964 (ACM), 0884-7495 (IEEE)",
  ISSN-L =       "0163-5964",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5420 (Mainframes and minicomputers); C7310
                 (Mathematics computing)",
  corpsource =   "Math. and Computer Sci. Div., Argonne Nat. Lab.,
                 Argonne, IL, USA",
  fjournal =     "ACM SIGARCH Computer Architecture News",
  journal-URL =  "",
  keywords =     "68000 based systems; Apollo; benchmarking; computer
                 testing; Cray X-MP; dense systems of linear equations;
                 environment; FORTRAN; linear algebra; LINPACK software;
                 solving; standard linear equations software; SUN;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "X Experimental",

  author =       "J. J. Dongarra",
  title =        "Redesigning Linear Algebra Algorithms",
  journal =      "Bull. Dir. Etud. Rech. C (France), Bulletin de la
                 Direction des Etudes et Recherches, Serie C",
  volume =       "C",
  number =       "1",
  pages =        "51--60 (or 51--59??)",
  month =        "????",
  year =         "1983",
  CODEN =        "EDBCAA",
  ISSN =         "0013-4511",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C4240 (Programming and
                 algorithm theory); C5420 (Mainframes and
                 minicomputers)",
  conflocation = "Paris, France; 17-18 March 1983",
  conftitle =    "1/sup er/ Colloque International sur les Methodes
                 Vectorielles et Paralleles en Calcul Scientifique (1st
                 International Colloquium on Vectorial and Parallel
                 Methods in Scientific Calculations)",
  keywords =     "algebra; algorithm theory; FORTRAN; large-scale vector
                 computers; linear algebra algorithms; parallel
                 processing; portable environment; sequential computers;
                 standard algorithms; supercomputers",
  language =     "French; English",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "Steven S. Chen and Jack J. Dongarra and Christopher C.
                 Hsiung",
  title =        "Multiprocessing Linear Algebra Algorithms on the {Cray
                 X-MP-2}: Experiences with Small Granularity",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "1",
  number =       "1",
  pages =        "22--31",
  month =        aug,
  year =         "1984",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Fri Aug 23 12:59:02 MDT 1996",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "This paper reviews the CRAY X-MP-2 general-purpose
                 multiprocessor system and discusses how it can be used
                 effectively to solve problems that have small
                 granularity. An implementation is described for linear
                 algebra algorithms that solve systems of linear
                 equations when the matrix is general and when the
                 matrix is symmetric and positive definite.",
  acknowledgement = ack-nhfb,
  affiliation =  "CRAY Research Inc, Chippewa Falls, WI, USA",
  affiliationaddress = "CRAY Research Inc, Chippewa Falls, WI, USA",
  classification = "722; 723; 921",
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  journalabr =   "J Parallel Distrib Comput",
  keywords =     "COMPUTER PROGRAMMING --- Algorithms; COMPUTER SYSTEMS,
                 MATHEMATICAL TECHNIQUES --- Linear Algebra;
                 Multiprocessing; nla, prll; SMALL GRANULARITY",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Robert E. Hiromoto",
  title =        "A collection of parallel linear equations routines for
                 the {Denelcor HEP}",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "1",
  number =       "2",
  pages =        "133--142",
  month =        dec,
  year =         "1984",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "The implementation and performance results for a few
                 standard linear algebra routines on the Denelcor HEP
                 computer are described. The algorithms used here are
                 based on high-level modules that facilitate portability
                 and perform efficiently in a wide range of
                 environments. The modules are chosen to be of a large
                 enough computational granularity so that reasonably
                 optimum performance may be insured. The design of
                 algorithms with such fundamental modules in mind will
                 also facilitate their replacement by others more suited
                 to gain the desired performance on a particular
                 computer architecture.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Mathematics \& Computer Science Div,
                 Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Mathematics \& Computer
                 Science Div, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics
                 computing)",
  classification = "723; 921",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "Algorithms; ASSEMBLY LANGUAGE PROGRAMMING;
                 computational granularity; COMPUTER PROGRAMMING;
                 PROCESSOR; high-level; linear algebra; linear algebra
                 routines; listings; MATHEMATICAL TECHNIQUES --- Linear
                 Algebra; modules; nla, prll, linear system, lud;
                 PARALLEL COMPUTERS; parallel linear equations routines;
                 parallel processing; PERFORMANCE ANALYSIS; performance
                 results; portability",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical; X
                 Experimental",

  author =       "Jack J. Dongarra",
  booktitle =    "Proceedings of the 23rd {IEEE} Conference on Decision
                 \& Control, December 12--14, 1984, Las Vegas Hilton,
                 Las Vegas, Nevada",
  title =        "Designing Algorithms in Linear Algebra for Different
                 Computer Architectures",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "661--661",
  year =         "1984",
  CODEN =        "PCDCDZ",
  DOI =          "",
  ISSN =         "0191-2216",
  bibdate =      "Fri Aug 23 12:59:02 MDT 1996",
  bibsource =    "Compendex database;
  note =         "Three volumes. IEEE catalog number 84CH2093-3.",
  abstract =     "Implementations and performance are discussed of a few
                 standard algorithms from linear algebra on
                 high-performance computers, such as the CRAY 1, CRAY
                 X-MP, Fujitsu VP-200, Hitachi S-810\slash 20 and
                 Denelcor HEP, based on the use of high-level modules.
                 High-level modularity facilitates portability and aids
                 in attaining performance efficiency on a wide variety
                 of environments spanning scalar, vector, and certain
                 parallel computers.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C1110 (Algebra); C4140 (Linear algebra); C7310
                 (Mathematics computing)",
  classification = "723; 921",
  conference =   "Proceedings of the 23rd IEEE Conference on Decision
                 and Control.",
  conflocation = "Las Vegas, NV, USA; 12-14 Dec. 1984",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  journalabr =   "Proceedings of the IEEE Conference on Decision and
                 Control Including The Symposium on Adaptive Processes
  keywords =     "ABSTRACT ONLY; algorithm design; Algorithms; CAD;
                 SOFTWARE --- Portability; CRAY 1; CRAY X-MP; Denelcor
                 HEP; Fujitsu VP-200; HIGH-LEVEL MODULARITY;
                 HIGH-PERFORMANCE COMPUTERS; Hitachi S-810/20; linear
                 algebra; MATHEMATICAL TECHNIQUES --- Linear Algebra;
                 mathematics computing; modules; parallel computers;
                 PERFORMANCE EFFICIENCY; vector",
  meetingaddress = "Las Vegas, NV, USA",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "IEEE Control Systems Soc, New York, NY, USA; SIAM,
                 Philadelphia, PA, USA; Operations Research Soc of
                 America, Baltimore, MD, USA",
  sponsororg =   "IEEE",
  treatment =    "T Theoretical or Mathematical",
  xxISBN =       "none",

  author =       "J. Dongarra and E. Grosse",
  title =        "Distribution of Mathematical Software via Electronic
                 Mail",
  type =         "Technical Report",
  number =       "MCS-TM-48",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  year =         "1984",
  bibdate =      "Tue Oct 9 11:25:29 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and J. R. Gabriel and D. D. Koelling
                 and J. H. Wilkinson",
  title =        "The eigenvalue problem for {Hermitian} matrices with
                 time reversal symmetry",
  journal =      j-LINEAR-ALGEBRA-APPL,
  volume =       "60",
  number =       "????",
  pages =        "27--42",
  month =        aug,
  year =         "1984",
  CODEN =        "LAAPAW",
  DOI =          "",
  ISSN =         "0024-3795 (print), 1873-1856 (electronic)",
  ISSN-L =       "0024-3795",
  MRclass =      "65F15 (81G55)",
  MRnumber =     "MR749173 (85j:65013)",
  MRreviewer =   "Cs. J. Heged{\H{u}}s",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "A0260 (Numerical approximation and analysis); A0270
                 (Computational techniques); A0365F (Algebraic methods
                 in quantum theory); A3115 (General mathematical and
                 computational developments for atoms and molecules);
                 A3130J (Radiative and relativistic effects (atoms and
  corpsource =   "Maths. and Comput. Sci., Argonne Nat. Lab., IL, USA",
  fjournal =     "Linear Algebra and its Applications",
  journal-URL =  "",
  keywords =     "algebra; atomic structure; computational method;
                 eigensystem; eigenvalue problem; eigenvalues and
                 eigenfunctions; electronic; heavy atoms; Hermitian
                 matrices; inversion; matrix; molecular electronic
                 states; molecules; quantum mechanics; quantum theory;
                 relativistic corrections; relativistic kinematics;
                 relativistic mechanics; solids; structure; symmetry;
                 time reversal",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "Cs. J. Heged{\H{u}}s",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra and C. B. Moler",
  title =        "{EISPACK} --- {A} Package for Solving Matrix
                 Eigenvalue Problems",
  crossref =     "Cowell:1984:SDM",
  pages =        "68--87",
  year =         "1984",
  bibdate =      "Fri Aug 23 12:59:02 MDT 1996",
  bibsource =    "Compendex database;
  abstract =     "EISPACK is a collection of Fortran subroutines that
                 compute the eigenvalues and eigenvectors of matrices
                 and matrix systems. The package can determine the
                 eigensystem of complex general, complex Hermitian, real
                 general, real symmetric, real symmetric band, real
                 symmetric tridiagonal, and special real tridiagonal
                 matrices, and generalized real and generalized real
                 symmetric matrix systems. The subroutines are based
                 mainly on Algol procedures published in the Handbook
                 series of Springer-Verlag by Wilkinson and Reinsch
                 (1971) and the QZ algorithm of Moler and Stewart
                 (1973). The algorithms have been adapted to Fortran and
                 thoroughly tested on a wide range of different
                 computers. The software has been certified and is
                 supported by the developers.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Mathematics \& Computer Science Div,
                 Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Mathematics \& Computer
                 Science Div, Argonne, IL, USA",
  classification = "723",
  journalabr =   "Sources and Dev of Math Software",
                 Subroutines; COMPUTER PROGRAMMING LANGUAGES ---
                 SUBROUTINES; MATHEMATICAL TECHNIQUES --- Eigenvalues
                 and Eigenfunctions; Modular Construction; SYMMETRIC
                 MATRIX SYSTEMS",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and F. G. Gustavson and A. Karp",
  title =        "Implementing Linear Algebra Algorithms for Dense
                 Matrices on a Vector Pipeline Machine",
  journal =      j-SIAM-REVIEW,
  volume =       "26",
  number =       "1",
  pages =        "91--112",
  month =        jan,
  year =         "1984",
  CODEN =        "SIREAD",
  DOI =          "",
  ISSN =         "0036-1445 (print), 1095-7200 (electronic)",
  ISSN-L =       "0036-1445",
  MRclass =      "65F10 (65F30)",
  MRnumber =     "85c:65032",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra)",
  corpsource =   "Argonne Nat. Lab., Argonne, IL, USA",
  fjournal =     "SIAM Review",
  journal-URL =  "",
  keywords =     "computer architecture; dense matrices; instruction
                 execution; linear algebra; matrix-matrix
                 multiplication; matrix-vector multiplication; nla,
                 vect; pipeline processing; pipelined; vector pipeline
                 machine; vector processing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. Dongarra",
  title =        "Increasing the Performance of Mathematical Software
                 through High-Level Modularity",
  crossref =     "Glowinski:1984:CMA",
  pages =        "239--248",
  year =         "1984",
  MRclass =      "65F99 (65W05)",
  MRnumber =     "86k:65033",
  bibdate =      "Mon Jan 15 10:23:21 1996",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and G. W. Stewart",
  title =        "{LINPACK} --- {A} Package for Solving Linear Systems",
  crossref =     "Cowell:1984:SDM",
  pages =        "20--48",
  year =         "1984",
  bibdate =      "Fri Aug 23 12:59:02 MDT 1996",
  bibsource =    "Compendex database;
  abstract =     "LINPACK is a collection of Fortran subroutines that
                 analyze and solve linear equations and linear least
                 squares problems. The package solves linear systems
                 whose matrices are general, banded, symmetric
                 indefinite, symmetric positive definite, triangular,
                 and tridiagonal. In addition, the package computes the
                 $ Q R $ and singular value decompositions of
                 rectangular matrices and applies them to least squares
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Mathematics \& Computer Science Div,
                 Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Mathematics \& Computer
                 Science Div, Argonne, IL, USA",
  classification = "723; 731; 921",
  journalabr =   "Sources and Dev of Math Software",
                 Subroutines; COMPUTER PROGRAMMING LANGUAGES ---
                 FORTRAN; COMPUTER SOFTWARE --- Modular Construction;
                 MATHEMATICAL TECHNIQUES --- Linear Algebra;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and S. Chen and S. Hsiung",
  title =        "Multiprocessing Linear Algebra Algorithms on the {CRAY
                 X-MP2}: Experiences with Small Granularity",
  number =       "MCS-TM-24",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  pages =        "????",
  month =        feb,
  year =         "1984",
  bibdate =      "Tue Oct 9 11:20:07 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and E. Lusk and R. Overbeek and B. Smith
                 and D. Sorensen",
  title =        "New Directions in Software for Advanced Computer
                 Architectures",
  number =       "MCS-TM-32",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  pages =        "????",
  month =        aug,
  year =         "1984",
  bibdate =      "Tue Oct 9 11:21:20 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performances Compar{\'e}es de 80 Ordinateurs sur des
                 Programmes {Fortran}",
  volume =       "3",
  number =       "5",
  pages =        "355--360",
  year =         "1984",
  CODEN =        "TTSIDJ",
  ISSN =         "0752-4072, 0264-7419",
  ISSN-L =       "0752-4072",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Technique et science informatiques : TSI",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and J. DuCroz and S. Hammarling and R.
                 Hanson",
  title =        "A Proposal for an Extended Set of {Fortran Basic
                 Linear Algebra Subprograms}",
  type =         type-MCSDTM,
  number =       "MCS-TM-41",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        dec,
  year =         "1984",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and D. Sorensen",
  title =        "A Parallel Linear Algebra Library for the {Denelcor
                 HEP}",
  type =         "Technical Report",
  number =       "ANL/MCS/TM-33",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        "??",
  year =         "1984",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of Various Computers Using Standard linear
                 equations software in a {Fortran} Environment",
  type =         type-TM,
  number =       "23",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  pages =        "8",
  year =         "1984",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  descriptors =  "Computer performance; LINPACK; linear equation;
  keywords =     "nla, lud, performance, fortran",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",
  journal =      j-SIGNUM,
  volume =       "19",
  number =       "1",
  pages =        "23--26",
  month =        jan,
  year =         "1984",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C0310H (Equipment and software evaluation methods);
                 C7310 (Mathematics computing)",
  corpsource =   "Mathematics and Computer Sci. Div., Argonne Nat. Lab.,
                 Argonne, IL, USA",
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  keywords =     "68000 based systems; Apollo; computer selection and
                 evaluation; computer systems; computing; Cray X-; dense
                 systems; FORTRAN environment; LINPACK software; MP;
                 natural sciences; nla, lud, performance, fortran;
                 standard linear equations software; SUN",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. J. Dongarra",
  title =        "Performance of various computers using standard linear
                 equations software in a {FORTRAN} environment",
  volume =       "3",
  number =       "5",
  pages =        "317--320",
  year =         "1984",
  CODEN =        "TTSIDJ, TTSIEK",
  ISSN =         "0752-4072, 0264-7419",
  ISSN-L =       "0752-4072",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5470 (Performance evaluation and testing)",
  corpsource =   "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Technique et science informatiques : TSI",
  keywords =     "Apple III; benchmarks; computer testing; Cray X-MP;
                 ELXSI; equations software; execution timings; FORTRAN
                 environment; Fujitsu VP-200; LINPACK library; NAS 9060;
                 performance evaluation; Ridge 32; standard linear;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  source =       "Technique et Science Informatiques",
  treatment =    "P Practical",
  xxpages =      "355--360",

  author =       "Jack J. Dongarra and Stanley C. Eisenstat",
  title =        "Squeezing the Most out of an Algorithm in {CRAY
                 FORTRAN}",
  journal =      j-TOMS,
  volume =       "10",
  number =       "3",
  pages =        "219--230",
  month =        sep,
  year =         "1984",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65F99",
  MRnumber =     "791 988",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "A technique is described for achieving supervector
                 performance on a CRAY-1 in a purely FORTRAN environment
                 (i.e., without resorting to assembler language). The
                 technique can be applied to a wide variety of
                 algorithms in linear algebra, and is beneficial in
                 other architectural settings.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics
                 computing)",
  classification = "723; 921",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  journalabr =   "ACM Trans Math Software",
  keywords =     "Algorithms; algorithms; architectural; COMPUTER
                 PROGRAMMING; CRAY-1; environment; FORTRAN; linear
                 algebra; LINEAR ALGEBRA, nla, cray, vect, fortran;
                 MATHEMATICAL TECHNIQUES --- Linear Algebra; numerical
                 analysis; parallel processing; settings; supervector
                 performance; VECTOR PROCESSING; vector processing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. Dongarra and L. Kaufman and S. Hammarling",
  title =        "Squeezing the Most out of Eigenvalue Solvers on High
                 Performance Computers",
  number =       "MCS-TM-46",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  year =         "1984",
  bibdate =      "Tue Oct 9 11:24:40 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and A. Sameh",
  title =        "On Some Parallel Banded System Solvers",
  type =         "Technical Report",
  number =       "ANL/MCS-TM-27",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        "??",
  year =         "1984",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Ahmed H. Sameh",
  title =        "On Some Parallel Banded System Solvers",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "1",
  number =       "3--4",
  pages =        "223--235",
  month =        dec,
  year =         "1984",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "Algorithms are described for solving narrow banded
                 systems and the Helmholtz difference equations that are
                 suitable for multiprocessing systems. The organization
                 of the algorithms highlights the large grain
                 parallelism inherent in the problems.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Mathematics \& Computer Science Div,
                 Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Mathematics \& Computer
                 Science Div, Argonne, IL, USA",
  classcodes =   "C4290 (Other computer theory)",
  classification = "722; 723",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "banded systems; computation theory; computer
                 programming --- algorithms; computer systems, digital;
                 equations; Helmholtz difference; Helmholtz difference
                 equations; large grain parallelism; multiprocessing
                 systems; parallel banded system solvers; parallel
                 processing; partitioning",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. J. Dongarra and J. R. Gabriel and D. D. Koelling
                 and J. H. Wilkinson",
  title =        "Solving the Secular Equation Including Spin Orbit
                 Coupling for Systems with Inversion and Time-Reversal
                 Symmetry",
  journal =      j-J-COMPUT-PHYS,
  volume =       "54",
  number =       "2",
  pages =        "278--288",
  month =        may,
  year =         "1984",
  CODEN =        "JCTPAH",
  DOI =          "",
  ISSN =         "0021-9991 (print), 1090-2716 (electronic)",
  ISSN-L =       "0021-9991",
  bibdate =      "Sun Jan 1 15:59:19 MST 2012",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "A0230 (Function theory, analysis); A0250 (Probability
                 theory, stochastic processes, and statistics); A0365C
                 (Formalism in quantum theory)",
  corpsource =   "Math. and Computer Sci. Div., Argonne Nat. Lab.,
                 Argonne, IL, USA",
  fjournal =     "Journal of Computational Physics",
  journal-URL =  "",
  keywords =     "computational method; eigenvalues; eigenvalues and
                 eigenfunctions; eigenvectors; inversion symmetry;
                 numerical methods; quantum; quantum mechanics; secular
                 equation; spin orbit coupling; spin-orbit interactions;
                 symmetry; T invariance; theory; time reversal",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "P. Messina and B. Smith and J. Dongarra",
  title =        "Proceedings from the {Argonne} Workshop on Programming
                 the Next Generation of Supercomputers",
  type =         "Technical Report",
  number =       "MCS-TM-34",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  year =         "1984",
  bibdate =      "Tue Oct 9 11:24:12 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and B. T. Smith and D. Sorensen",
  title =        "Algorithm Design for Different Computer
                 Architectures",
  journal =      j-IEEE-SOFTWARE,
  volume =       "2",
  number =       "4",
  pages =        "79--80",
  month =        jul,
  year =         "1985",
  CODEN =        "IESOEG",
  ISSN =         "0740-7459 (print), 0740-7459 (electronic)",
  ISSN-L =       "0740-7459",
  bibdate =      "Tue Feb 26 09:53:36 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Book Review: {{\booktitle{A New Approach to Scientific
                 Computation}} (Ulrich W. Kulisch and Willard L.
                 Miranker, eds.)}",
  journal =      j-SIAM-REVIEW,
  volume =       "27",
  number =       "2",
  pages =        "267--268",
  month =        "????",
  year =         "1985",
  CODEN =        "SIREAD",
  DOI =          "",
  ISSN =         "0036-1445 (print), 1095-7200 (electronic)",
  ISSN-L =       "0036-1445",
  bibdate =      "Sat Mar 29 09:53:55 MDT 2014",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Review",
  journal-URL =  "",
  onlinedate =   "June 1985",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and A. Hinds",
  title =        "Comparison of the {CRAY X-MP-4}, the {Fujitsu VP-200},
                 and the {Hitachi S-810/20}: An {Argonne} perspective",
  type =         type-TR,
  number =       "ANL-8579",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        oct,
  year =         "1985",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and E. Grosse",
  title =        "Distribution of mathematical software via electronic
                 mail",
  journal =      j-SIGNUM,
  volume =       "20",
  number =       "3",
  pages =        "45--47",
  month =        jul,
  year =         "1985",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "B6210G (Electronic mail); C0310F (Software development
                 management); C7310 (Mathematics computing)",
  corpsource =   "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  keywords =     "algorithms; Arpanet/CSNET; design; electronic mail;
                 library catalog; mathematics; netlib@anl-mcs; network;
                 public domain mathematical software; research!netlib;
                 software packages; UNIX",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "H.4.3 Information Systems, INFORMATION SYSTEMS
                 APPLICATIONS, Communications Applications, Electronic
                 mail",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "A Fast Algorithm for the Symmetric Eigenvalue
                 Problem",
  crossref =     "Hwang:1985:PSC",
  pages =        "338--342",
  year =         "1985",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  note =         "IEEE catalog number 85CH2146-9.",
  acknowledgement = ack-nhfb,
  classcodes =   "B0200 (Engineering mathematics and mathematical
                 techniques); B0290H (Linear algebra); C1100
                 (Mathematical techniques); C4140 (Linear algebra)",
  conflocation = "Urbana, IL, USA; 4-6 June 1985",
  corpsource =   "Dept. of Math. and Comput. Sci., Argonne Nat. Lab.,
                 IL, USA",
  keywords =     "algorithm; computers; eigenvalues and eigenfunctions;
                 numerical; parallel; parallel algorithms; parallel
                 processing; rank-one tearing; symmetric eigenvalue
                 problem; tridiagonal problem",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; Univ. Illinois",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. Dongarra and T. Hewitt",
  title =        "Implementing Dense Linear Algebra Algorithms Using
                 Multitasking on the {CRAY X-MP-4}",
  type =         "Technical Report",
  number =       "MCS-TM-55",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        aug,
  year =         "1985",
  bibdate =      "Tue Oct 9 11:26:47 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and A. H. Sameh and D. C. Sorensen",
  booktitle =    "Proceedings of the Eighteenth Hawaii International
                 Conference on System Science, Honolulu, {HI}, {USA,
                 2--4} January 1985",
  title =        "Implementation of Some Concurrent Algorithms for
                 Matrix Factorization",
  publisher =    pub-WESTERN-PERIODICALS,
  address =      pub-WESTERN-PERIODICALS:adr,
  pages =        "39--46",
  year =         "1985",
  CODEN =        "PHISD7",
  ISBN =         "????",
  ISBN-13 =      "????",
  ISSN =         "0073-1129",
  LCCN =         "????",
  bibdate =      "Fri Aug 23 12:59:02 MDT 1996",
  bibsource =    "Compendex database",
  abstract =     "This paper discusses implementations of various forms
                 of the QR factorization on the Denelcor HEP. The
                 motivation for examining these implementations was to
                 investigate performance issues that we might expect to
                 face in developing mathematical software for linear
                 algebra problems on emerging parallel architectures.
                 The Denelcor HEP is particularly well suited for such a
                 study because it offers the possibility of very fine
                 grain parallelism through low overhead synchronization
                 primitives. We point out certain synchronization
                 problems that arise within the more lightly coupled
                 variations of the algorithm and offer a comparison of
                 the performance of these variations.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Mathematics \& Computer Science Div,
                 Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Mathematics \& Computer
                 Science Div, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C4240 (Programming and
                 algorithm theory)",
  classification = "722; 723; 921",
  conference =   "Proceedings of the Eighteenth Hawaii International
                 Conference on System Sciences 1985. Volume 2: Software.
                 Proceedings of the Hawaii International Conference on
                 System Science 18th, Distributed by Western Periodicals
  conflocation = "Honolulu, HI, USA; 2-4 Jan. 1985",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "algorithm theory; Algorithms; architectures; COMPUTER
                 PROGRAMMING; CONCURRENT ALGORITHMS; concurrent
                 algorithms; DENELCOR HEP; Denelcor HEP; factorization;
                 linear algebra; LINEAR ALGEBRA PROBLEMS; mathematical
                 software; MATHEMATICAL TECHNIQUES --- Matrix Algebra;
                 matrix algebra; MATRIX FACTORIZATION; matrix
                 factorization; parallel; PARALLEL ARCHITECTURES;
                 parallel processing; performance issues; Q R; QR
                 FACTORIZATION; synchronization problems",
  meetingaddress = "Honolulu, HI, USA North Hollywood, CA, USA",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "Univ of Hawaii, Honolulu, HI, USA; Univ of
                 Southwestern Louisiana, Lafayette, LA, USA; ACM, New
                 York, NY, USA; IEEE Computer Soc, Los Alamitos, CA,
                 USA",
  sponsororg =   "Univ. Hawaii; Univ. Southwestern Louisiana; ACM; IEEE;
                 Community Health Comput.; Cray Res.; IBM; Plenum",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra and J. {Du Croz} and S. Hammarling and
                 R. J. Hanson",
  title =        "A proposal for an extended set of {FORTRAN} Basic
                 Linear Algebra Subprograms",
  journal =      j-SIGNUM,
  volume =       "20",
  number =       "1",
  pages =        "2--18",
  month =        jan,
  year =         "1985",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics
                 computing)",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  keywords =     "algorithms; Basic Linear Algebra Subprograms; BLAS;
                 FORTRAN; high; languages; linear algebra; matrix;
                 performance computers; portable implementations; vector
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "G.1.6 Mathematics of Computing, NUMERICAL ANALYSIS,
                 Optimization, Linear programming \\ D.3.2 Software,
                 PROGRAMMING LANGUAGES, Language Classifications,
                 FORTRAN 77 \\ G.1.3 Mathematics of Computing, NUMERICAL
                 ANALYSIS, Numerical Linear Algebra, Matrix inversion
                 D.2.5 Software, SOFTWARE ENGINEERING, Testing and
                 Debugging, Diagnostics",
  treatment =    "P Practical",

  author =       "J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",
  type =         "??",
  number =       "MCS-TM-23",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        "??",
  year =         "1985",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of various computers using standard linear
                 equations software in a {FORTRAN} environment",
  journal =      j-COMP-ARCH-NEWS,
  volume =       "13",
  number =       "1",
  pages =        "3--11",
  month =        mar,
  year =         "1985",
  CODEN =        "CANED2",
  ISSN =         "0163-5964 (ACM), 0884-7495 (IEEE)",
  ISSN-L =       "0163-5964",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C5470 (Performance evaluation
                 and testing); C7310 (Mathematics computing)",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "ACM SIGARCH Computer Architecture News",
  journal-URL =  "",
  keywords =     "68000 based; Apollo workstations; Cray X-MP; dense
                 systems; evaluation; FORTRAN environment; IBM PCs;
                 linear algebra; linear equations; LINPACK; performance;
                 performance comparison; performance evaluation;
                 software; Sun Workstations; systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "X Experimental",

  author =       "J. J. Dongarra and A. H. Sameh and D. C. Sorensen",
  title =        "Some Implementations of the {$ Q R $}-Factorization on
                 an {MIMD}-Machine",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  month =        oct,
  year =         "1985",
  CODEN =        "PACOEJ",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. L. Martin and R. Baron and R. Rashid and E. Siegel
                 and A. Tevanian and M. Young and P. C. Patton and J. R.
                 Gurd and J. Sargeant and K. Arvind and A. Gottlieb and
                 G. C. Fox and P. A. Rigsbee and W. K. Giloi and T. Hoag
                 and J. C. Browne and J. J. Dongarra and B. T. Smith and
                 D. C. Sorensen",
  title =        "Special Section --- International Parallel Processing
                 Projects --- a Software Perspective",
  journal =      j-IEEE-SOFTWARE,
  volume =       "2",
  number =       "4",
  pages =        "65--80",
  month =        jul,
  year =         "1985",
  CODEN =        "IESOEG",
  DOI =          "",
  ISSN =         "0740-7459 (print), 1937-4194 (electronic)",
  ISSN-L =       "0740-7459",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Alan Hinds",
  title =        "Comparison of the {CRAY X-MP-4}, {Fujitsu VP-200}, and
                 {Hitachi S-810\slash 20}",
  journal =      j-SIMULATION,
  volume =       "47",
  number =       "3",
  pages =        "93--107",
  month =        sep,
  year =         "1986",
  CODEN =        "SIMUA2",
  DOI =          "",
  ISSN =         "0037-5497 (print), 1741-3133 (electronic)",
  ISSN-L =       "0037-5497",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  abstract =     "A set of programs, gathered from major Argonne
                 computer users, was run on the current generation of
                 supercomputers: the CRAY X-MP-4 is a consistently
                 strong performer over a wide range of problems. The
                 Fujitsu and Hitachi computers excel on highly
                 vectorized programs and offer an attractive opportunity
                 to sites with IBM-compatible computers.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C5440 (Multiprocessor systems and techniques); C5470
                 (Performance evaluation and testing)",
  classification = "722; 723",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  fjournal =     "Simulation",
  journal-URL =  "",
  journalabr =   "Simulation",
  keywords =     "concurrent; constant stride; contiguous element; CRAY
                 X-MP; CRAY X-MP-4; execution; Fujitsu VP; FUJITSU
                 VP-200; high-performance; HITACHI S-810/20; Hitachi
                 S/810; independent functional units; index vector;
                 indirect address; mainframes; parallel machines;
                 Performance; performance evaluation; pipeline
                 processing; pipeline techniques; programs; register
                 format; register-to-; SUPERCOMPUTERS; supercomputers;
                 VECTOR COMPUTER; vector processors; vectorized",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; R Product Review",

  author =       "J. J. Dongarra and D. C. (Danny C.) Sorensen",
  title =        "A fully parallel algorithm for the symmetric
                 eigenvalue problem",
  type =         "Technical Report",
  number =       "CSRD-542",
  institution =  inst-UIUC-CSRD,
  address =      inst-UIUC-CSRD:adr,
  pages =        "22",
  year =         "1986",
  bibdate =      "Mon Jul 07 11:50:59 1997",
  bibsource =    "",
  note =         "Also available as Argonne Report MCS-TM-62.",
  acknowledgement = ack-nhfb,
  annote =       "Work was supported in part by the Applied Mathematical
                 Sciences Sub-program of the Office of Energy Research,
                 U.S. Department of Energy.",
  keywords =     "Eigenvalues; Parallel processing (Electronic
                 computers)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "How do the `Mini-Supers' Stack Up?",
  journal =      j-COMPUTER,
  volume =       "19",
  number =       "3",
  pages =        "93, 100",
  month =        mar,
  year =         "1986",
  CODEN =        "CPTRB4",
  ISSN =         "0018-9162 (print), 1558-0814 (electronic)",
  ISSN-L =       "0018-9162",
  bibdate =      "Tue Feb 26 09:51:54 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computer",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "High performance computers and algorithms from linear
                 algebra",
  crossref =     "Cullum:1986:LSE",
  pages =        "15--36",
  year =         "1986",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6100 (Software techniques and systems)",
  conflocation = "Oberlech, Austria; 8-12 July 1985",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "algorithms; architectures; ease of use; linear
                 algebra; parallel programming; portability;
                 programming; robustness; software development process;
                 software portability; structured",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IBM World Trade Corp",
  treatment =    "G General Review; T Theoretical or Mathematical",

  author =       "Jack J. Dongarra and Tom Hewitt",
  title =        "Implementing Dense Linear Algebra Algorithms Using
                 Multitasking on the {CRAY X-MP-4} (or, {Approaching}
                 the Gigaflop)",
  journal =      j-SIAM-J-SCI-STAT-COMP,
  volume =       "7",
  number =       "1",
  pages =        "347--350",
  month =        jan,
  year =         "1986",
  CODEN =        "SIJCD4",
  DOI =          "",
  ISSN =         "0196-5204",
  MRclass =      "65W05 (65Fxx)",
  MRnumber =     "87c:65170",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics
                 computing)",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "SIAM Journal on Scientific and Statistical Computing",
  journal-URL =  "",
  keywords =     "Cholesky decomposition; Cray X-MP-4; dense linear
                 algebra algorithms; L U decomposition; linear algebra;
                 multiprogramming; multitasking; nla, prll, vect;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "X Experimental",

  author =       "J. J. Dongarra and A. H. Sameh and D. C. Sorensen",
  title =        "Implementation of Some Concurrent Algorithms for
                 Matrix Factorization",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "3",
  number =       "1",
  pages =        "25--34",
  month =        mar,
  year =         "1986",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  URL =          "",
  abstract =     "Three parallel algorithms for computing the
                 QR-factorization of a matrix are presented. The
                 discussion is primarily concerned with implementation
                 of these algorithms on a computer that supports tightly
                 coupled parallel processes sharing a large common
                 memory. The three algorithms are a Householder method
                 based upon high-level modules, a Windowed Householder
                 method that avoids fork-join synchronization, and a
                 Pipelined Givens method that is a variant of the
                 data-flow type algorithms offering large enough
                 granularity to mask synchronization costs. Numerical
                 experiments were conducted on the Denelcor HEP
                 computer. The computational results indicate that the
                 Pipelined Givens method is preferred and that this is
                 primarily due to the number of array references
                 required by the various algorithms.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C5470 (Performance evaluation
                 and testing)",
  classification = "722; 723; 921",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "Algorithms; algorithms; array references; COMPUTER
                 PROGRAMMING; COMPUTER SYSTEMS, DIGITAL --- Parallel
                 Processing; CONCURRENT ALGORITHMS; concurrent
                 algorithms; data-flow type; DENELCOR HEP; Denelcor HEP
                 computer; high-level modules; Householder method; large
                 common memory; MATHEMATICAL TECHNIQUES --- Matrix
                 Algebra; matrix algebra; MATRIX FACTORIZATION; matrix
                 factorization; nla, prll, lud, qrd; parallel; parallel
                 processing; performance analysis; performance
                 evaluation; pipelined Givens method; processes;
                 QR-factorization; synchronisation cost masking; tightly
                 coupled parallel; windowed",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical; X Experimental",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "Linear Algebra on High-Performance Computers",
  crossref =     "Feilmeier:1986:PCP",
  pages =        "3--32",
  year =         "1986",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "Linear Algebra on High Performance Computers",
  journal =      j-APPL-MATH-COMP,
  volume =       "20",
  number =       "1--2",
  pages =        "57--88",
  month =        sep,
  year =         "1986",
  CODEN =        "AMHCBQ",
  ISSN =         "0096-3003 (print), 1873-5649 (electronic)",
  ISSN-L =       "0096-3003",
  MRclass =      "65Fxx (65W05)",
  MRnumber =     "87i:65034",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C6110 (Systems analysis and
                 programming); C7310 (Mathematics)",
  conflocation = "Houghton, MI, USA; 5-8 Aug. 1985",
  conftitle =    "Workshop on Applications of Supercomputers",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Applied Mathematics and Computation",
  journal-URL =  "",
  keywords =     "advanced computer architectures; algebra; algorithm
                 restructuring; banded systems; high; linear algebra;
                 modules; nla; numerical analysis; numerical linear;
                 numerical software; parallel; parallel computers;
                 performance; performance computers; processing;
                 programming; QR factorization; software portability;
                 sparse; symmetric eigenvalue problems;
                 transportability; vect; vector computers",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "Performance and library issues for mathematical
                 software on high performance computers",
  crossref =     "Wouk:1986:NCE",
  pages =        "112--135",
  year =         "1986",
  MRclass =      "65W05",
  MRnumber =     "849 385",
  bibdate =      "Mon Jan 15 10:41:35 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and I. Duff",
  title =        "Performance of Vector Computers for Direct and
                 Indirect Addressing in {Fortran}",
  type =         "Harwell Report",
  institution =  inst-HARWELL,
  address =      inst-HARWELL:adr,
  month =        "??",
  year =         "1986",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and L. Johnsson",
  title =        "Solving Banded Systems on a Parallel Processor",
  type =         "Technical Report",
  number =       "MCS-TM-85",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        nov,
  year =         "1986",
  bibdate =      "Tue Oct 9 11:30:35 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  keywords =     "CRAY X-MP-4",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "A survey of high performance computers",
  crossref =     "Bell:1986:DPC",
  pages =        "8--11",
  year =         "1986",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  note =         "IEEE catalog number 86CH2285-.",
  abstract =     "Computers that are based on advanced architecture
                 design and have the capability for high performance
                 cover a price range from \$50,000 to \$20,000,000, and
                 there is a wide range in their performance as well.
                 However, all hope to provide performance close to that
                 of the leading-edge supercomputers at a fraction of
                 their multimillion-dollar price tag. The difficulty of
                 classifying these machines is pointed out. A list of
                 machines that are available or scheduled to appear in
                 1986 is presented. Data on the various machines are
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, IL, USA",
  affiliationaddress = "Argonne Natl Lab, IL, USA",
  classcodes =   "C5420 (Mainframes and minicomputers)",
  classification = "722; 723",
  conference =   "Digest of Papers --- COMPCON Spring 86: Thirty-First
                 IEEE Computer Society International Conference.",
  conflocation = "San Francisco, CA, USA; 3-6 March 1986",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  journalabr =   "Proceedings - IEEE Computer Society International
                 Conference 31st.",
  keywords =     "1986; advanced; architecture design; classification;
                 Parallel Processing; high performance computers;
                 mainframes; parallel processing; SUPERCOMPUTERS;
  meetingaddress = "San Francisco, CA, USA",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "IEEE Computer Soc, Los Alamitos, CA, USA",
  sponsororg =   "IEEE",
  treatment =    "G General Review",

  author =       "Jack J. Dongarra and Linda Kaufman and Sven
                 Hammarling",
  title =        "Squeezing the Most Out of Eigenvalue Solvers on High
                 Performance Computers",
  journal =      j-LINEAR-ALGEBRA-APPL,
  volume =       "77",
  number =       "??",
  pages =        "113--136",
  month =        "??",
  year =         "1986",
  CODEN =        "LAAPAW",
  DOI =          "",
  ISSN =         "0024-3795 (print), 1873-1856 (electronic)",
  ISSN-L =       "0024-3795",
  MRclass =      "65F15 (65-04 65W05)",
  MRnumber =     "837 861",
  bibdate =      "Thu Dec 19 14:33:37 1996",
  bibsource =    "",
  note =         "Special volume on parallel computing.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Linear Algebra and its Applications",
  journal-URL =  "",
  keywords =     "nla, eig, vect",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and D. Sorensen",
  title =        "{SCHEDULE}: Tools for Developing and Analyzing
                 Parallel {Fortran} Programs",
  type =         "Technical Report",
  number =       "ANL-MCS-TM-86",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        nov,
  year =         "1986",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and J. DuCroz and S. Hammarling and R.
                 Hanson",
  title =        "An Update Notice on the Extended {BLAS}",
  journal =      j-SIGNUM,
  volume =       "21",
  number =       "4",
  pages =        "2--4",
  year =         "1986",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Wed Aug 17 02:24:34 1994",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Greg Astfalk and Jack Dongarra and Eric Grosse",
  title =        "Finding Public Domain Mathematical Software",
  type =         "Numerical Analysis Manuscript",
  number =       "87-5",
  institution =  inst-ATT-BELL,
  address =      inst-ATT-BELL:adr,
  year =         "1987",
  bibdate =      "Mon Jul 11 13:32:00 MDT 1994",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Chatelin and J. Dongarra and I. Duff",
  title =        "Special Volume in Memory of {James H. Wilkinson}",
  journal =      j-LINEAR-ALGEBRA-APPL,
  volume =       "88/89",
  pages =        "??--??",
  year =         "1987",
  CODEN =        "LAAPAW",
  ISSN =         "0024-3795 (print), 1873-1856 (electronic)",
  ISSN-L =       "0024-3795",
  bibdate =      "Mon Jan 02 09:49:28 2006",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Linear Algebra and its Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James Demmel and Jack Dongarra and Jeremy {Du Croz}
                 and Anne Greenbaum and Sven Hammarling and Danny
                 Sorensen",
  title =        "Prospectus for the Development of a Linear Algebra
                 Library for High-Performance Computers",
  type =         "LAPACK Working Note" # " and " # type-MCSDTR,
  number =       "01 and ANL/MCS-TM-97",
  institution =  inst-ANL-MCS,
  address =      inst-ANL-MCS:adr,
  month =        sep,
  year =         "1987",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "ANL, MCS-TM-97, September 1987, and LAPACK Working
                 Note \#1.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and I. Duff",
  title =        "Advanced Architecture Computers",
  type =         "Technical Report",
  number =       "ANL-MCS-TM-57 (Revision 1)",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        oct,
  year =         "1987",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and E. L. Lusk",
  editor =       "Ahmed K. Noor",
  booktitle =    "Parallel computations and their impact on mechanics /
                 presented at the Winter Annual Meeting of the American
                 Society of Mechanical Engineers, Boston, Massachusetts,
                 December 13-18, 1987",
  title =        "{Advanced Computing Research Facility} and Algorithm
                 Design for Different Computers",
  volume =       "86",
  publisher =    pub-ASME,
  address =      pub-ASME:adr,
  bookpages =    "xii + 402",
  pages =        "49--53",
  year =         "1987",
  CODEN =        "AMDVAS",
  ISSN =         "0160-8835",
  LCCN =         "QA76.6 .A43 1987",
  bibdate =      "Fri Aug 23 12:59:02 MDT 1996",
  bibsource =    "Compendex database",
  series =       "AMD (Series)",
  abstract =     "Argonne National Laboratory has established an
                 Advanced Computing Research Facility where researchers
                 can experiment with innovative machines and develop
                 programming tools for advanced-architecture computers.
                 Argonne scientists are using new approaches to write
                 software that operates on different high-performance
                 computers with minimal rewriting. These approaches
                 include restructuring of algorithms and design of a
                 monitors\slash macros technique for synchronizing
                 multiple processes. Additionally, scientists are
                 developing new algorithms that take advantage of the
                 special properties of parallel computers. Argonne
                 researchers have also implemented a parallel Warren
                 Abstract Machine for logic programming that will be
                 used to develop extremely high-performance automated
                 reasoning systems.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classification = "722; 723",
  conference =   "Parallel Computations and Their Impact on Mechanics.
                 Presented at the Winter Annual Meeting of the American
                 Society of Mechanical Engineers.",
  journalabr =   "AMD (Symposia Series) (American Society of Mechanical
                 Engineers, Applied Mechanics Division)",
  keywords =     "ARCHITECTURE; COMPUTER PROGRAMMING --- Algorithms;
                 --- Parallel Processing; PARALLEL COMPUTERS; Research;
                 WARREN ABSTRACT MACHINE",
  meetingaddress = "Boston, MA, USA",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "ASME, Applied Mechanics Div, New York, NY, USA; ASME,
                 Pressure Vessels \& Piping Div, New York, NY, USA;
                 ASME, Computer Engineering Div, New York, NY, USA",
  xxISBN =       "none",

  author =       "Jack Dongarra and Sven Hammarling and Danny Sorensen",
  title =        "Block Reduction of Matrices to Condensed Forms for
                 Eigenvalue Computations",
  type =         "LAPACK Working Note",
  number =       "02",
  institution =  inst-ANL-MCS,
  address =      inst-ANL-MCS:adr,
  month =        sep,
  year =         "1987",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "ANL, MCS-TM-99, September 1987.",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "nla, block algorithm, eig",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxtitle =      "Block Reduction of Matrices to Condensed form for
                 Eigenvalue Computations",

  author =       "Jack Dongarra and Joanne L. Martin and Jack Worlton",
  title =        "Computer Benchmarking: Paths and Pitfalls",
  journal =      j-IEEE-SPECTRUM,
  volume =       "24",
  number =       "7",
  pages =        "38--43",
  month =        jul,
  year =         "1987",
  CODEN =        "IEESAM",
  ISSN =         "0018-9235 (print), 1939-9340 (electronic)",
  ISSN-L =       "0018-9235",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  URL =          "",
  abstract =     "Benchmarking, running a set of well-known programs on
                 a machine to compare its performance with that of
                 others, is explained, and the problems involved in its
                 use are outlined. Suggestions for avoiding the pitfalls
                 of benchmarking are provided. The need to take into
                 account user-friendliness is highlighted. A
                 hierarchical approach to evaluation is described.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, IL, USA",
  affiliationaddress = "Argonne Natl Lab, IL, USA",
  classcodes =   "C5470 (Performance evaluation and testing); C6150G
                 (Diagnostic, testing, debugging and evaluating
                 systems)",
  classification = "721; 722; 723",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  fjournal =     "IEEE Spectrum",
  journal-URL =  "",
  journalabr =   "IEEE Spectrum",
  keywords =     "BENCHMARKING; COMPUTER ARCHITECTURE --- Testing;
                 COMPUTER BENCHMARKING; computer benchmarking; COMPUTER
                 EQUIPMENT --- Testing; computer testing; COMPUTERS,
                 DIGITAL; evaluation; hierarchical; Performance;
                 performance evaluation; user-friendliness",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack J. Dongarra and Eric Grosse",
  title =        "Distribution of Mathematical Software via Electronic
                 Mail",
  journal =      j-CACM,
  volume =       "30",
  number =       "5",
  pages =        "403--407",
  month =        may,
  year =         "1987",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  URL =          "",
  abstract =     "A large collection of public-domain mathematical
                 software is now available via electronic mail. Messages
                 sent to `netlib@anl-mcs' (on the Arpanet\slash CSNET)
                 or to `research|netlib' (on the UNIX network) wake up a
                 server that distributes items from the collection. The
                 one-line message `send index' causes a library catalog
                 to be sent by return mail.",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics)",
  classification = "716; 718; 722; 723",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Communications of the ACM",
  journal-URL =  "",
  journalabr =   "Commun ACM",
  keywords =     "algorithms; ARPANET; community; COMPUTER SOFTWARE;
                 documentation; ELECTRONIC MAIL; electronic mail;
                 LIBRARY CATALOG; library catalog; MATHEMATICAL
                 PROGRAMMING; MATHEMATICAL SOFTWARE; mathematical
                 software; mathematics computing; MESSAGES SENT;
                 public-domain; scientific computing; telesoftware",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "G.4 Mathematics of Computing, MATHEMATICAL SOFTWARE
                 H.4.3 Information Systems, INFORMATION SYSTEMS
                 APPLICATIONS, Communications Applications, Electronic
                 mail \\ C.2.3 Computer Systems Organization,
                 COMPUTER-COMMUNICATION NETWORKS, Network Operations \\
                 G.1.0 Mathematics of Computing, NUMERICAL ANALYSIS,
                 General, Numerical algorithms \\ H.3.0 Information
                 Systems, INFORMATION STORAGE AND RETRIEVAL, General \\
                 K.6.3 Computing Milieux, MANAGEMENT OF COMPUTING AND
                 INFORMATION SYSTEMS, Software Management \\ C.2.3
                 Computer Systems Organization, COMPUTER-COMMUNICATION
                 NETWORKS, Network Operations, Public networks",
  treatment =    "P Practical",

  editor =       "J. J. Dongarra",
  title =        "Experimental Parallel Computing Architectures",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xiii + 303",
  year =         "1987",
  ISBN =         "0-444-70234-2",
  ISBN-13 =      "978-0-444-70234-0",
  LCCN =         "QA76.5 .E985 1987",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and J. {Du Croz} and S. Hammarling and
                 R. J. Hanson",
  title =        "An Extended Set of {Fortran Basic Linear Algebra
                 Subprograms}: Model Implementation and Test Programs",
  type =         "Technical Report",
  number =       "MCS-TM-81",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        jan,
  year =         "1987",
  bibdate =      "Tue Oct 9 11:35:16 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "A Fully Parallel Algorithm for the Symmetric
                 Eigenvalue Problem",
  journal =      j-SIAM-J-SCI-STAT-COMP,
  volume =       "8",
  number =       "2",
  pages =        "S139--S154",
  month =        mar,
  year =         "1987",
  CODEN =        "SIJCD4",
  DOI =          "",
  ISSN =         "0196-5204",
  MRclass =      "65F15 (65W05)",
  MRnumber =     "88f:65054",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra)",
  conflocation = "Norfolk, VA, USA; 18-21 Nov. 1985",
  conftitle =    "Second Conference on Parallel Processing for
                 Scientific Computing",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "SIAM Journal on Scientific and Statistical Computing",
  journal-URL =  "",
  keywords =     "algorithms; computation time, accuracy; Cuppen;
                 deflation technique; divide-and-conquer scheme;
                 eigenvalues and eigenfunctions; fully parallel
                 algorithm; matrix algebra; nla, eig, symmetric matrix,
                 prll; numerical properties; parallel; performance;
                 robust root finding technique; round off error;
                 speedup; symmetric eigenvalue problem; symmetric
                 tridiagonal matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "Michel Cosnard",
  sponsororg =   "SIAM; NSF; Air Force Office Sci. Res",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "On the implementation of a fully parallel algorithm
                 for the symmetric eigenvalue problem",
  journal =      j-PROC-SPIE,
  volume =       "696",
  pages =        "45--53",
  year =         "1987",
  CODEN =        "PSISDG",
  ISSN =         "0277-786X (print), 1996-756X (electronic)",
  ISSN-L =       "0277-786X",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "B0290H (Linear algebra); B6140 (Signal processing and
                 detection); C1260 (Information theory); C4140 (Linear
                 algebra)",
  conflocation = "San Diego, CA, USA; 19-20 Aug. 1986",
  conftitle =    "Advanced Algorithms and Architectures for Signal
                 Processing",
  corpsource =   "Div. of Math., Argonne Nat. Lab., IL, USA",
  fjournal =     "Proceedings of the SPIE --- The International Society
                 for Optical Engineering",
  keywords =     "active parallel processes; divide and conquer scheme;
                 eigenvalues and eigenfunctions; fully parallel
                 algorithm; matrix algebra; processing; roundoff error;
                 sensitivity; serial mode; signal; symmetric eigenvalue
                 problem; tridiagonal matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "SPIE",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "A look at the evolution of mathematical software for
                 dense matrix problems over the past fifteen years",
  crossref =     "Anonymous:1987:ISS",
  pages =        "203--216",
  month =        "",
  year =         "1987",
  bibdate =      "Mon Sep 9 14:56:14 MDT 1996",
  bibsource =    "",
  abstract =     "Looks at the evolution which has taken place in the
                 design of mathematical software for dense matrix
                 problems. The paper also examines the problems facing
                 implementation of such algorithms on a large number of
                 processors. The main emphasis is on algorithms for
                 solving linear algebra problems where the software
                 developed would reside in a library on high-performance
                 computers.",
  acknowledgement = ack-nhfb,
  affiliation =  "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra)",
  classification = "C4140 (Linear algebra); C7310 (Mathematics)",
  conflocation = "Paris, France; 2-6 Feb. 1987",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "Algorithms; algorithms; Dense matrix problems; dense
                 matrix problems; Library; library; Linear algebra
                 problems; linear algebra problems; Mathematical
                 software; mathematical software; mathematics computing;
                 matrix algebra",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Mathematics computing; Matrix algebra",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "A Portable Environment for Developing Parallel
                 {FORTRAN} Programs",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "5",
  number =       "1--2",
  pages =        "175--186",
  month =        jul,
  year =         "1987",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  URL =          "",
  abstract =     "We present an attempt at a short term solution to the
                 transportability problem. The motivation for developing
                 the package has been to extend capabilities beyond loop
                 based parallelism and to provide a convenient machine
                 independent user interface. A package called SCHEDULE
                 is described which provides a standard user interface
                 to several shared memory parallel machines. A user
                 writes standard FORTRAN code and calls SCHEDULE
                 routines which express and enforce the large grain data
                 dependencies of his parallel algorithm. Machine
                 dependencies are internal to SCHEDULE and change from
                 one machine to another but the users code remains
                 essentially the same across all such machines. The
                 semantics and usage of SCHEDULE are described and
                 several examples of parallel algorithms which have been
                 implemented using SCHEDULE are presented.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4240 (Programming and algorithm theory); C6115
                 (Programming support)",
  classification = "723",
  conference =   "Proceedings of the International Conference on Vector
                 and Parallel Computing.",
  conflocation = "Loen, Norway; 2-6 June 1986",
  conftitle =    "International Conference on Vector and Parallel
                 Computing - Issues in Applied Research and
                 Development",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Computing",
  keywords =     "commercially produced parallel computers; COMPUTER
                 LANGUAGES --- Fortran; COMPUTER SYSTEMS, DIGITAL ---
                 Parallel Processing; cs, prll; FORTRAN; FORTRAN
                 PROGRAMS; interface; mathematical software; parallel
                 algorithms; parallel FORTRAN programs; PARALLEL
                 PROGRAMMING; parallel programming; portable
                 environment; PORTABLE SOFTWARE; programming
                 environments; SCHEDULE; SCHEDULE SOFTWARE PACKAGE;
                 SHARED-MEMORY MULTIPROCESSORS; software portability;
                 transportability problem; transportable; user",
  meetingaddress = "Loen, Norw",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "Chr. Michelsens Inst, Norw",
  sponsororg =   "IBM Norway; R. Norwegian Council Sci. and Ind. Res.;
                 AMDAHL; FPS; CRAY",
  treatment =    "P Practical",

  author =       "Jack Dongarra and Jeremy {Du Croz} and Iain Duff and
                 Sven Hammarling",
  title =        "A proposal for a set of {Level 3} basic linear algebra
                 subprograms",
  journal =      j-SIGNUM,
  volume =       "22",
  number =       "3",
  pages =        "2--14",
  month =        jul,
  year =         "1987",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics)",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  keywords =     "algorithms; blas; hierarchical memory;
                 high-performance computers; Level 3 basic linear
                 algebra subprograms; Level 3 BLAS; mathematics
                 computing; matrix algebra; matrix-matrix operations;
                 memory hierarchy; nla; parallel processing capability;
                 prll; software; subroutines; theory",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "F.2.1 Theory of Computation, ANALYSIS OF ALGORITHMS
                 AND PROBLEM COMPLEXITY, Numerical Algorithms and
                 Problems, Computations on matrices \\ G.2.m Mathematics
                 of Computing, DISCRETE MATHEMATICS, Miscellaneous",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. J. Dongarra",
  editor =       "Walter J. Karplus",
  booktitle =    "Multiprocessors and array processors: proceedings of
                 the Third Conference on Multiprocessors and Array
                 Processors: 14--16 January 1987, San Diego,
                 California",
  title =        "Performance of various computers using standard linear
                 equations software in a {Fortran} environment",
  publisher =    "Society for Computer Simulation",
  address =      "San Diego, CA, USA",
  bookpages =    "xii + 321",
  pages =        "15--32",
  year =         "1987",
  ISSN =         "0735-9276",
  LCCN =         "QA76.5 .C61923",
  bibdate =      "Tue Feb 26 05:52:45 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5470 (Performance evaluation and testing)",
  conflocation = "San Diego, CA, USA; 14-16 Jan. 1987",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "68000 based systems; Apollo; computer performance;
                 CRAY X-MP; FORTRAN; Fortran environment; IBM PC's;
                 linear equations; LINPACK software; performance
                 evaluation; software packages; standard linear
                 equations software; SUN Workstations",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",
  xxISBN =       "none",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",
  journal =      j-SIMULATION,
  volume =       "49",
  number =       "2",
  pages =        "51--62",
  month =        aug,
  year =         "1987",
  CODEN =        "SIMUA2",
  DOI =          "",
  ISSN =         "0037-5497 (print), 1741-3133 (electronic)",
  ISSN-L =       "0037-5497",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  abstract =     "This note compares the performance of different
                 computer systems while solving dense systems of linear
                 equations using the LINPACK software in a Fortran
                 environment. About 100 computers, ranging from a CRAY
                 X-MP to the 68000-based systems such as the Apollo and
                 SUN Workstations to IBM PC's, are compared.",
  acknowledgement = ack-nhfb,
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C5470 (Performance evaluation
                 and testing); C7310 (Mathematics)",
  classification = "722; 723; 921",
  corpsource =   "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Simulation",
  journal-URL =  "",
  journalabr =   "Simulation",
  keywords =     "68000-based; Apollo; COMPUTER PROGRAMMING LANGUAGES
                 floating point arithmetic operations; FORTRAN
                 environment; IBM PC; linear algebra; LINPACK programs;
                 --- Linear Algebra; microcomputers; minicomputers;
                 minisupercomputers; Performance; performance
                 evaluation; standard linear equations software; SUN
                 Workstations; supercomputers; systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "X Experimental",

  author =       "Jack J. Dongarra and Lennart Johnsson",
  title =        "Solving Banded Systems on a Parallel Processor",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "5",
  number =       "1--2",
  pages =        "219--246",
  month =        jul,
  year =         "1987",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65W05 (65F05)",
  MRnumber =     "898 045",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  note =         "Proceedings of the international conference on vector
                 and parallel computing---issues in applied research and
                 development (Loen, 1986).",
  URL =          "",
  abstract =     "In this paper we examine ways of solving dense, banded
                 systems on different parallel processors. We start with
                 some considerations for processors with vector
                 instructions, then discuss various algorithms for the
                 solution of large, dense, banded systems on a parallel
                 processor. We analyze the behavior of the parallel
                 algorithms on distributed-storage architectures
                 configured as rings, two-dimensional meshes with
                 end-around connections (tori), boolean n-cube
                 configured architectures, and bus-based and
                 switch-based machines with shared storage. We also
                 present measurements for two bus-based architectures
                 with shared storage, namely, the Alliant FX/8 and the
                 Sequent Balance 21000.",
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4240 (Programming and algorithm theory); C5440
                 (Multiprocessor systems and techniques)",
  classification = "722; 723; 921",
  conference =   "Proceedings of the International Conference on Vector
                 and Parallel Computing.",
  conflocation = "Loen, Norway; 2-6 June 1986",
  conftitle =    "International Conference on Vector and Parallel
                 Computing - Issues in Applied Research and
                 Development",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Computing",
  keywords =     "ALLIANT FX/8; Alliant FX/8; banded systems; boolean
                 n-cube configured architectures; COMPUTER PROGRAMMING
                 --- Algorithms; COMPUTER SYSTEMS, DIGITAL; DENSE BANDED
                 distributed-storage architectures; end-around
                 connections; machines; MATHEMATICAL TECHNIQUES ---
                 Linear Algebra; PARALLEL ALGORITHMS; parallel
                 algorithms; Parallel Processing; parallel processing;
                 parallel processor; rings; SEQUENT BALANCE 21000;
                 Sequent Balance 21000; switch-based; two-dimensional
                 meshes; vector instructions",
  meetingaddress = "Loen, Norw",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "Chr. Michelsens Inst, Norw",
  sponsororg =   "IBM Norway; R. Norwegian Council Sci. and Ind. Res.;
                 AMDAHL; FPS; CRAY",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "{Schedule: A} Tool for Developing and Analyzing
                 Parallel {Fortran} Programs",
  crossref =     "Jamieson:1987:CPA",
  volume =       "5 (??)",
  pages =        "363--394 (??)",
  year =         "1987",
  bibdate =      "Mon Jan 15 10:51:03 1996",
  bibsource =    "",
  keywords =     "email, data sharing, implementation",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "{SCHEDULE} Users Guide",
  number =       "ANL-MCS-TM-76",
  organization = inst-ANL,
  address =      inst-ANL:adr,
  pages =        "????",
  month =        jun,
  year =         "1987",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Workshop on the {Level 3 BLAS}",
  type =         "Technical Report",
  number =       "MCS-TM-89",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  pages =        "????",
  month =        mar,
  year =         "1987",
  bibdate =      "Tue Oct 9 11:34:27 2007",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Gene H. Golub and Miki Neumann and James W. Demmel and
                 Paul Saylor and James M. Boyle and Iain Duff and Jack
                 Dongarra",
  title =        "{James Wilkinson} (1919--1986)",
  journal =      j-ANN-HIST-COMPUT,
  volume =       "9",
  number =       "2",
  pages =        "205--210",
  month =        apr # "\slash " # jun,
  year =         "1987",
  CODEN =        "AHCOE5",
  ISSN =         "0164-1239",
  bibdate =      "Sat Jul 14 18:11:40 2001",
  bibsource =    "",
  note =         "From the introduction: ``A series of lightly edited
                 extracts from messages that were sent over various
                 computer networks during the period October 5,
                 1986--February 13, 1987''.",
  fjournal =     "Annals of the History of Computing",
  journal-URL =  "",
  keywords =     "obituary",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "C. Bischof and J. Demmel and J. Dongarra and J. {Du
                 Croz} and A. Greenbaum and S. Hammarling and D.
                 Sorensen",
  title =        "{LAPACK} Provisional Contents",
  type =         type-MCSDTR,
  number =       "ANL-88-38",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        sep,
  year =         "1988",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "(LAPACK Working Note \#5)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "C. Bischof and J. Demmel and J. Dongarra and J. {Du
                 Croz} and A. Greenbaum and S. Hammarling and D.
                 Sorensen",
  title =        "Provisional Contents",
  type =         "LAPACK Working Note",
  number =       "05",
  institution =  inst-ANL-MCS,
  address =      inst-ANL-MCS:adr,
  month =        sep,
  year =         "1988",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "ANL, MCS-TM-38, September 1988.",
  URL =          "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "O. Brewer and J. Dongarra and D. Sorensen",
  title =        "Tools to Aid in the Analysis of Memory Access Patterns
                 for {FORTRAN} Programs",
  type =         "LAPACK Working Note",
  number =       "06",
  institution =  inst-ANL-MCS,
  address =      inst-ANL-MCS:adr,
  month =        jun,
  year =         "1988",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "ANL, MCS-TM-120 (or ANL-MCS-TM-119??), June 1988.",
  URL =          "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Orlie Brewer and Jack Dongarra and Danny Sorensen",
  title =        "Tools to aid in the analysis of memory access patterns
                 for {FORTRAN} programs",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "9",
  number =       "1",
  pages =        "25--35",
  month =        dec,
  year =         "1988",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database",
  URL =          "",
  abstract =     "In order to improve the performance of algorithms
                 implemented on high-performance computers, we must
                 consider not only the total number of memory
                 references, but also the pattern of memory references.
                 We would like our algorithms to observe the principle
                 of locality of reference, so that the data can be
                 effectively utilized. This paper describes a set of
                 tools that can be used as an aid in the analysis of
                 memory access patterns of FORTRAN programs.",
  affiliation =  "Argonne",
  affiliationaddress = "Argonne, IL, USA",
  classcodes =   "C6115 (Programming support); C6110 (Systems analysis
                 and programming)",
  classification = "723",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "Computer Programming Languages--FORTRAN; Computer
                 Software; Data Storage, Digital; FORTRAN Programs;
                 FORTRAN programs; Linear Algebra; Memory Access
                 Patterns; memory access patterns analysis; Parallel
                 Processing Computers; parallel programming; Software
                 Engineering; software tools; Visualization Tools",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "D. Callahan and J. Dongarra and D. Levine",
  title =        "Vectorizing Compilers: a Test Suite and Results",
  type =         type-TM,
  number =       "109",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        mar,
  year =         "1988",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "To appear: {\it Proceedings of the Supercomputing '88
                 Conference}.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "David Callahan and Jack Dongarra and David Levine",
  title =        "Vectorizing compilers: a test suite and results",
  crossref =     "IEEE:1988:PSN",
  volume =       "1",
  pages =        "98--105",
  year =         "1988",
  bibdate =      "Thu Apr 16 07:55:03 MDT 1998",
  bibsource =    "Compendex database",
  abstract =     "A collection of 100 Fortran loops used to test the
                 effectiveness of an automatic vectorizing compiler is
                 described. The results of compiling these loops using
                 commercially available, vectorizing Fortran compilers
                 on a variety of supercomputers, minisupercomputers, and
                 mainframes are presented. The testing methodology and
                 loop scoring are explored.",
  affiliation =  "Dept. of Comput. Sci., Rice Univ., Houston, TX, USA",
  classification = "723; C6150C (Compilers, interpreters and other
                 processors); C6150G (Diagnostic, testing, debugging and
                 evaluating systems)",
  conference =   "Proceedings: Supercomputing '88",
  conferenceyear = "1988",
  corpsource =   "Dept. of Comput. Sci., Rice Univ., Houston, TX, USA",
  keywords =     "Automatic vectorizing compiler; automatic vectorizing
                 compiler; Computer Operating Systems; Computer
                 Programming Languages--FORTRAN; Computer Systems,
                 Digital--Parallel Processing; Fortran Compilers;
                 Fortran loops; Fortran Loops; Fortran loops; Loop
                 scoring; loop scoring; Mainframes; mainframes;
                 Minisupercomputers; minisupercomputers; Program
                 Compilers; program compilers; program testing;
                 Supercomputers; supercomputers; Test suite; test suite;
                 Testing methodology; testing methodology; Vectorizing
                 Compilers; Vectorizing Fortran compilers; vectorizing
                 Fortran compilers",
  meetingabr =   "Proc Supercomputing 88",
  meetingaddress = "Orlando, FL, USA",
  meetingdate =  "Nov 14--18 1988",
  meetingdate2 = "1988 Nov 14--18",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "IEEE Computer Soc, Los Alamitos, CA, USA; ACM,
                 SIGARCH, New York, NY, USA",
  sponsororg =   "IEEE; ACM",
  thesaurus =    "Program compilers; Program testing",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "Algorithm design for high-performance computers",
  crossref =     "Paul:1988:PSC",
  pages =        "83--97",
  year =         "1988",
  bibdate =      "Wed Sep 22 15:43:54 2010",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Jeremy {Du Croz} and Sven
                 Hammarling and Richard J. Hanson",
  title =        "{Algorithm 656}: An Extended Set of {Basic Linear
                 Algebra Subprograms}: Model Implementation and Test
                 Programs",
  journal =      j-TOMS,
  volume =       "14",
  number =       "1",
  pages =        "18--32",
  month =        mar,
  year =         "1988",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          ";
  abstract =     "This paper describes a model implementation and test
                 software for the Level 2 Basic Linear Algebra
                 Subprograms (Level 2 BLAS). Level 2 BLAS are targeted
                 at matrix-vector operations with the aim of providing
                 more efficient, but portable, implementations of
                 algorithms on high-performance computers. The model
                 implementation provides a portable set of FORTRAN 77
                 Level 2 BLAS for machines where specialized
                 implementations do not exist or are not required. The
                 test software aims to verify that specialized
                 implementations meet the specification of Level 2 BLAS
                 and that implementations are correctly installed.",
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics)",
  classification = "723; 921",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "algorithms; basic linear algebra subprograms; computer
                 programming; computer programming languages ---
                 fortran; FORTRAN 77; Level 2 Basic Linear Algebra
                 Subprograms; Level 2 BLAS; mathematical software;
                 mathematical techniques --- Linear Algebra; mathematics
                 computing; matrix algebra; matrix-vector operations;
                 model implementation; nla, blas, vect, software;
                 program testing; Subroutines; test programs; theory;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "G.1.3 Mathematics of Computing, NUMERICAL ANALYSIS,
                 Numerical Linear Algebra \\ G.4 Mathematics of
                 Computing, MATHEMATICAL SOFTWARE, Algorithm analysis",
  treatment =    "P Practical",

  author =       "Jack J. Dongarra and Jeremy {Du Croz} and Sven
                 Hammarling and Richard J. Hanson",
  title =        "Corrigenda: ``{An} Extended Set of {FORTRAN Basic
                 Linear Algebra Subprograms}''",
  journal =      j-TOMS,
  volume =       "14",
  number =       "4",
  pages =        "399--399",
  month =        dec,
  year =         "1988",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Nov 19 13:03:54 1994",
  bibsource =    "",
  note =         "See \cite{Dongarra:1988:ESF}.",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Jeremy {Du Croz} and Sven
                 Hammarling and Richard J. Hanson",
  title =        "An Extended Set of {FORTRAN Basic Linear Algebra
                 Subprograms}",
  journal =      j-TOMS,
  volume =       "14",
  number =       "1",
  pages =        "1--17",
  month =        mar,
  year =         "1988",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  note =         "See also \cite{Dongarra:1988:CES}.",
  URL =          ";
  abstract =     "This paper describes an extension to the set of Basic
                 Linear Algebra Subprograms (BLAS). The extensions are
                 targeted at matrix-vector operations that should
                 provide for efficient and portable implementations of
                 algorithms for high-performance computers. The
                 discussion covers naming conventions, argument
                 conventions, and storage conventions.",
  affiliation =  "Argonne Natl Lab, Argonne, IL, USA",
  affiliationaddress = "Argonne Natl Lab, Argonne, IL, USA",
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics)",
  classification = "723; 921",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "algorithms; Basic Linear Algebra Subprograms; basic
                 linear algebra subprograms; BLAS; computer programming;
                 computer programming languages --- fortran; FORTRAN
                 programs; mathematical software; mathematical
                 techniques --- Linear Algebra; mathematics computing;
                 matrix algebra; matrix-vector; operations;
                 standardization; Subroutines; vectors",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  review =       "ACM CR 8812-0940",
  subject =      "{\bf G.4}: Mathematics of Computing, MATHEMATICAL
                 SOFTWARE, Portability. {\bf G.1.3}: Mathematics of
                 Computing, NUMERICAL ANALYSIS, Numerical Linear
  treatment =    "P Practical",

  author =       "J. J. Dongarra and D. C. Sorensen",
  title =        "A look at the evolution of mathematical software for
                 dense matrix problems over the past fifteen years",
  crossref =     "Schultz:1988:NAM",
  pages =        "29--36",
  year =         "1988",
  MRclass =      "65V05",
  MRnumber =     "950 701",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  booktitle =    "Evaluating Supercomputers: Strategies for Exploiting,
                 Evaluating and Benchmarking Computers with Advanced
  title =        "The {LINPACK} Benchmark: an explanation",
  publisher =    "Unicom Seminars",
  address =      "Uxbridge, UK",
  bookpages =    "xv + 183",
  pages =        "150--167",
  month =        "????",
  year =         "1988",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  classcodes =   "C4140 (Linear algebra); C5470 (Performance evaluation
                 and testing)",
  conflocation = "London, UK; 1-3 June 1988",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "data types; FORTRAN; history; linear equations;
                 LINPACK Benchmark; LINPACK package; matrix algebra;
                 performance evaluation; subroutines; well-structured
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",
  xxnote =       "Check: was this republished as

  author =       "J. J. Dongarra",
  title =        "The {LINPACK} benchmark: an explanation",
  crossref =     "Houstis:1988:SIC",
  pages =        "456--474",
  year =         "1988",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  abstract =     "Clears up some of the confusion and mystery
                 surrounding the LINPACK Benchmark. The author examines
                 what is measured and describes how to interpret the
                 results of the programs. Performance is a complex
                 issue, dependent on a variety of diverse quantities
                 including the algorithm, the problem size, and the
                 implementation. The LINPACK Benchmark provides three
                 separate benchmarks that can be used to evaluate
                 computer performance on a dense system of linear
                 equations: the first for 100*100 matrix, the second for
                 a 300*300 matrix, and the third for a 1000*1000 matrix.
                 The third benchmark, in particular, is dependent on the
                 algorithm chosen by the manufacturer.",
  affiliation =  "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  classcodes =   "C4140 (Linear algebra); C5470 (Performance evaluation
                 and testing); C7310 (Mathematics)",
  classification = "C4140 (Linear algebra); C5470 (Performance
                 evaluation and testing); C7310 (Mathematics)",
  conflocation = "Athens, Greece; 8-12 June 1987",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "Computer performance; computer performance; computer
                 testing; dense; Dense system of linear equations;
                 linear algebra; LINPACK Benchmark; performance
                 evaluation; Problem size; problem size; system of
                 linear equations",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Comput. Technol. Inst. Greece",
  thesaurus =    "Computer testing; Linear algebra; Performance
                 evaluation",
  treatment =    "P Practical; X Experimental",

  author =       "Jack J. Dongarra and Danny C. Sorensen and Kathryn
                 Connolly and Jim Patterson",
  title =        "Programming methodology and performance issues for
                 advanced computer architectures",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "8",
  number =       "1--3",
  pages =        "41--58",
  month =        oct,
  year =         "1988",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "This paper describes some recent attempts to construct
                 transportable numerical software for high-performance
                 computers. Restructuring algorithms in terms of simple
                 linear algebra modules is reviewed. We also present a
                 programming methodology that is useful for constructing
                 new parallel algorithms which require sophisticated
                 synchronization at a large grain level. We describe the
                 SCHEDULE package which provides an environment for
                 developing and analyzing explicitly parallel programs
                 in FORTRAN which are portable. This package now
                 includes a preprocessor to achieve complete portability
                 of user level code and also a graphics post processor
                 for performance analysis and debugging. We discuss
                 details of porting both the SCHEDULE package and user
                 code. Examples from linear algebra, and partial
                 differential equations are used to illustrate the
                 utility of this approach.",
  affiliation =  "Argonne",
  affiliationaddress = "Argonne, IL, USA",
  classcodes =   "C5220 (Computer architecture); C6110 (Systems analysis
                 and programming)",
  classification = "723",
  conference =   "Proceedings of the International Conference on Vector
                 and Parallel Processors in Computational Science III",
  conflocation = "Liverpool, UK; 25-28 Aug. 1987",
  conftitle =    "International Conference on Vector and Parallel
                 Processors in Computational Science III",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "advanced computer architectures; Algorithms;
                 algorithms restructuring vector computers; Computer
                 Programming; Computer Programming Languages--FORTRAN;
                 Computer Software Schedule; Computer Systems,
                 Digital--Parallel Processing; computers; debugging;
                 floating-point operations; FORTRAN; graphics post;
                 issues; linear algebra modules; Numerical Software;
                 numerical software; parallel; Parallel Algorithms;
                 parallel algorithms; parallel architectures; Parallel
                 Programs; parallel programs; partial differential
                 equations; performance; performance evaluation;
                 Portable Software; processor; programming; SCHEDULE
                 package; transportable",
  meetingaddress = "Liverpool, Engl",
  meetingdate =  "Aug 25--28 1987",
  meetingdate2 = "08/25--28/87",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "US Army European Research Office, USA",
  sponsororg =   "US Army Eur. Res. Office",
  treatment =    "P Practical",

  author =       "J. J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",
  type =         "Technical Report",
  number =       "MCS-TM-23",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  pages =        "????",
  month =        jan,
  year =         "1988",
  bibdate =      "Tue Oct 9 11:33:34 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of various computers using standard linear
                 equations software in a {Fortran} environment",
  journal =      j-COMP-ARCH-NEWS,
  volume =       "16",
  number =       "1",
  pages =        "47--69",
  month =        mar,
  year =         "1988",
  CODEN =        "CANED2",
  ISSN =         "0163-5964 (ACM), 0884-7495 (IEEE)",
  ISSN-L =       "0163-5964",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  classcodes =   "C5470 (Performance evaluation and testing); C7310
                 (Mathematics)",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "ACM SIGARCH Computer Architecture News",
  journal-URL =  "",
  keywords =     "68000 based systems; Apollo; computer systems; CRAY
                 X-MP; dense systems; Fortran environment; IBM PCs;
                 LINPACK; mathematics computing; packages; performance;
                 performance evaluation; software; standard linear
                 equations software; SUN; Workstations",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; X Experimental",

  author =       "J. J. Dongarra and J. {Du Croz} and I. S. Duff and S.
                 Hammarling",
  title =        "A Set of Level 3 {Basic Linear Algebra Subprograms}",
  type =         "??",
  number =       "ANL-MCS-TM-88",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        "??",
  year =         "1988",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and J. Dongarra",
  title =        "Installing and Testing the Initial Release of {LAPACK}
                 --- {Unix} and Non-{Unix} Versions",
  type =         "LAPACK Working Note",
  number =       "10",
  institution =  inst-ANL-MCS,
  address =      inst-ANL-MCS:adr,
  month =        may,
  year =         "1989",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "ANL, MCS-TM-130, May 1989.",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and Z. Bai and C. Bischof and J. Demmel
                 and J. Dongarra and J. DuCroz and A. Greenbaum and S.
                 Hammarling and A. McKenney and D. Sorensen",
  title =        "{LAPACK}: a Portable Linear Algebra Library for
                 High-Performance Computers",
  type =         "??",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        "??",
  year =         "1989",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and J. Dongarra",
  title =        "Results from the Initial Release of {LAPACK}",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "16 and CS-89-89",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1989",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "UT-CS-89-89, November 1989. (Replaced by LAWN 41 or
                 81!!). LAPACK Working Note \#16",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "C. H. Bischof and J. J. Dongarra",
  title =        "A Linear Algebra Library for High-Performance
                 Computers",
  crossref =     "Carey:1989:PSM",
  pages =        "45--56",
  year =         "1989",
  bibdate =      "Tue Oct 09 10:54:35 2007",
  bibsource =    "",
  note =         "Preprint MCS-P105-0989, Mathematics and Computer,
                 September 1989.",
  abstract =     "Argonne, the Courant Institute, and NAG are developing
                 a transportable linear algebra library in Fortran 77.
                 The library (called LAPACK) will provide routines for
                 solving systems of simultaneous linear equations,
                 least-squares solutions of overdetermined systems of
                 equations, and eigenvalue problems. The new library
                 will be based on the successful EISPACK and LINPACK
                 libraries. It will be designed to be efficient and
                 transportable across a wide range of computing
                 environments, with special emphasis on modern
                 high-performance computers. The new library will be
                 distributed over a system similar to netlib, at no or
                 minimal cost.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxtitle =      "A project for developing a linear algebra library for
                 high-performance computers",

  author =       "O. Brewer and J. Dongarra and D. Sorensen",
  editor =       "Stanley Y. W. Su and George J. Knafl",
  booktitle =    "Proceedings: the thirteenth annual International
                 Computer Software \& Applications Conference",
  title =        "A graphics tool to aid in the generation of parallel
                 {FORTRAN} programs",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  bookpages =    "xx + 793",
  pages =        "89--93",
  year =         "1989",
  ISBN =         "0-8186-1964-3",
  ISBN-13 =      "978-0-8186-1964-9",
  LCCN =         "QA76.6.C6295 1989",
  bibdate =      "Tue Feb 26 06:00:30 2002",
  bibsource =    "",
  note =         "Computer Society order number 1964. IEEE catalog
                 number 89CH2743-3.",
  classcodes =   "C6115 (Programming support); C6130B (Graphics
                 techniques); C6110 (Systems analysis and programming)",
  conflocation = "Orlando, FL, USA; 20-22 Sept. 1989",
  corpsource =   "Argonne Nat. Lab., IL, USA",
  keywords =     "BUILD; computer graphics; execution graph; FORTRAN;
                 graphics tool; package; parallel FORTRAN programs;
                 parallel programming; SCHEDULE; software; tools",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE",
  treatment =    "P Practical",

  author =       "O. Brewer and J. Dongarra and D. Levine and D.
                 Sorensen",
  title =        "Graphics tools for developing high-performance
                 algorithms",
  crossref =     "Evans:1989:PCM",
  pages =        "39--50",
  year =         "1989",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  abstract =     "This paper discusses two tools that aid in the
                 development of parallel algorithms for high-performance
                 computers. The authors describe the SCHEDULE package
                 which provides an environment for developing and
                 analyzing new parallel algorithms in Fortran that
                 require sophisticated synchronization at a large-grain
                 level. This package provides portability of a user's
                 code and also has a graphics postprocessor for
                 performance analysis and debugging. The authors also
                 discuss a graphics tool useful for studying memory
                 access patterns of algorithms.",
  affiliation =  "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  classcodes =   "C6130B (Graphics techniques); C6115 (Programming
                 support); C4240 (Programming and algorithm theory)",
  classification = "C4240 (Programming and algorithm theory); C6115
                 (Programming support); C6130B (Graphics techniques)",
  conflocation = "Verona, Italy; 28-30 Sept. 1988",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "algorithms; computer graphics; Debugging; debugging;
                 evaluation; Fortran; Graphics tools; graphics tools;
                 High-performance algorithms; high-performance
                 algorithms; Large-grain level; large-grain level;
                 Memory access patterns; memory access patterns;
                 parallel; Parallel algorithms; parallel algorithms;
                 performance; Performance analysis; performance
                 analysis; Portability; portability; SCHEDULE package;
                 software tools; Synchronization; synchronization",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Univ. Verona; Univ. Calabria; et al",
  thesaurus =    "Computer graphics; Parallel algorithms; Performance
                 evaluation; Software tools",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. Browne and J. Dongarra and A. Karp and K. Kennedy
                 and D. Kuck",
  title =        "1988 {Gordon Bell Prize}",
  journal =      j-IEEE-SOFTWARE,
  volume =       "6",
  number =       "3",
  pages =        "78--85",
  month =        may,
  year =         "1989",
  CODEN =        "IESOEG",
  DOI =          "",
  ISSN =         "0740-7459 (print), 0740-7459 (electronic)",
  ISSN-L =       "0740-7459",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  abstract =     "The Gordon Bell Prize recognizes outstanding
                 achievement in all applications of supercomputers to
                 scientific and engineering problems. A description is
                 given of the winning entry and two honorable mentions.
                 The winning entry, from the raw-performance category,
                 was submitted by Phuong Vu, C. Ashcraft, R. Grimes, J.
                 Lewis and B. Peyton. They presented the solution of a
                 static-structures problem that ran at just over 1 Gflop
                 (billions of floating-point operations) on an
                 eight-processor Cray Y-MP. One honorable mention, in
                 the price/performance category, came from R. Pelz, who
                 used a 1024-processor N-Cube multicomputer to solve a
                 fluid-flow problem using a spectral method with a
                 speedup of about 800. Marina Chen, Young-Il Choo,
                 Jungke Li, and J. Wu received an honorable mention for
                 an entry in which a Crystal Compiler automatically
                 parallelized a financial modeling application.",
  affiliation =  "Dept. of Comput. Sci., Texas Univ., Austin, TX, USA",
  classcodes =   "C5440 (Multiprocessor systems and techniques)",
  classification = "C5440 (Multiprocessor systems and techniques)",
  corpsource =   "Dept. of Comput. Sci., Texas Univ., Austin, TX, USA",
  fjournal =     "IEEE Software",
  journal-URL =  "",
  keywords =     "application; Cray Y-MP; Crystal Compiler; Engineering
                 problems; engineering problems; financial modeling;
                 Financial modeling application; Fluid-flow problem;
                 fluid-flow problem; N-Cube multicomputer; parallel
                 processing; Scientific problems; scientific problems;
                 Static-structures problem; static-structures problem;
                 Supercomputers; supercomputers",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Parallel processing",
  treatment =    "G General Review; P Practical",

  author =       "J. Demmel and J. J. Dongarra and J. DuCroz and A.
  title =        "A project for developing a linear algebra library for
                 high-performance computers",
  crossref =     "Wright:1989:ACA",
  pages =        "87--92",
  year =         "1989",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  classcodes =   "C6115 (Programming support); C7310 (Mathematics);
                 C4140 (Linear algebra)",
  conflocation = "Stanford, CA, USA; 22-26 Aug. 1988",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  keywords =     "Argonne; Basic Linear Algebra Subprograms; BLAS;
                 Courant Institute for Mathematical; EISPACK;
                 environment; environments; FORTRAN; Fortran 77;
                 high-performance computers; linear algebra; linear
                 algebra library; Linpack; mathematics computing;
                 National Laboratory; Numerical Algorithms Group;
                 programming; Sciences",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Lawrence Livermore Nat. Lab.; Appl. Dynamics Int.;
                 Stanford Univ",
  treatment =    "P Practical",

  author =       "Jack Dongarra",
  title =        "{Advanced Computing Research Facility, Mathematics and
                 Computer Science Division, Argonne National
                 Laboratory}",
  journal =      j-IJSA,
  volume =       "3",
  number =       "4",
  pages =        "6--8",
  month =        dec,
  year =         "1989",
  CODEN =        "IJSAE9",
  DOI =          "",
  ISSN =         "0890-2720",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    ";
  URL =          "",
  fjournal =     "The International Journal of Supercomputer
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Danny C. Sorensen and Sven J.
                 Hammarling",
  title =        "Block Reduction of Matrices to Condensed Forms for
                 Eigenvalue Computations",
  journal =      j-J-COMPUT-APPL-MATH,
  volume =       "27",
  number =       "1--2",
  pages =        "215--227",
  month =        sep,
  year =         "1989",
  CODEN =        "JCAMDI",
  DOI =          "",
  ISSN =         "0377-0427 (print), 1879-1778 (electronic)",
  ISSN-L =       "0377-0427",
  MRclass =      "65F30",
  MRnumber =     "020 164",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  note =         "(LAPACK Working Note \#2)",
  URL =          "",
  abstract =     "This paper describes block algorithms for the
                 reduction of a real symmetric matrix to tridiagonal
                 form and for the reduction of a general real matrix to
                 either bidiagonal or Hessenberg form by using
                 Householder transformations. The approach is to
                 aggregate the transformations and to apply them in a
                 blocked fashion, thus achieving algorithms that are
                 rich in matrix-matrix operations. These reductions
                 typically are a preliminary step in the computation of
                 eigenvalues or singular values. The authors demonstrate
                 how the initial reduction to tridiagonal or bidiagonal
                 form may be pipelined with the divide-and-conquer
                 technique for computing the eigensystem of a symmetric
                 matrix or the singular value decomposition of a general
                 matrix to achieve algorithms that are load balanced and
                 rich in matrix-matrix operations.",
  affiliation =  "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
                 USA",
  classcodes =   "C4140 (Linear algebra); C4240 (Programming and
                 algorithm theory)",
  classification = "C4140 (Linear algebra); C4240 (Programming and
                 algorithm theory)",
  corpsource =   "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Journal of Computational and Applied Mathematics",
  journal-URL =  "",
  keywords =     "algorithms; bidiagonal; block algorithms; block
                 reduction of matrices; condensed; divide and conquer
                 technique; eigenvalue computations; eigenvalues and
                 eigenfunctions; forms; Hessenberg form; Householder
                 transformations; linear algebra; matrix-matrix
                 operations; parallel",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  thesaurus =    "Eigenvalues and eigenfunctions; Linear algebra;
                 Parallel algorithms",
  treatment =    "T Theoretical or Mathematical",

  author =       "Jack J. Dongarra and Jeremy {Du Croz} and Iain S. Duff
                 and Sven Hammarling",
  title =        "A proposal for a set of {Level} 3 {Basic Linear}
                 {Algebra Subprograms}",
  crossref =     "Rodrigue:1989:PPS",
  pages =        "40--44",
  year =         "1989",
  bibdate =      "Fri Nov 11 17:48:17 MST 1994",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",
  type =         type-TM,
  number =       "23",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  day =          "4",
  month =        jun,
  year =         "1989",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and E. Lusk",
  title =        "{Summer Institute in Parallel Computing: September
                 5--15, 1989}",
  type =         "Technical Report",
  number =       "MCS-TM-136",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        dec,
  year =         "1989",
  bibdate =      "Tue Oct 09 10:56:28 2007",
  bibsource =    "",
  abstract =     "This report summarizes the objectives of the Summer
                 Institute in Parallel Computing held at Argonne in
                 September 1989.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Eric Grosse",
  title =        "Shopping for Mathematical Software Electronically",
  journal =      j-IEEE-POT,
  volume =       "8",
  number =       "1",
  pages =        "37--38",
  month =        feb,
  year =         "1989",
  CODEN =        "IEPTDF",
  DOI =          "",
  ISSN =         "0278-6648 (print), 1558-1772 (electronic)",
  ISSN-L =       "0278-6648",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  note =         "condensed version of CACM paper",
  URL =          "",
  abstract =     "A system called netlib that provides quick, easy, and
                 efficient distribution of public-domain software to the
                 scientific computing community on an as-needed basis is
                 described. A user simply sends a request by electronic
                 mail on a national network such as ARPAnet and receives
                 the requested software over the network. The
                 public-domain software currently included in netlib is
  classcodes =   "C0310 (EDP management); C6000 (Computer software);
                 C7000 (Computer applications)",
  classification = "C0310 (EDP management); C6000 (Computer software);
                 C7000 (Computer applications)",
  fjournal =     "IEEE Potentials",
  keywords =     "ARPAnet; Electronic mail; electronic mail;
                 Mathematical software; mathematical software; National
                 network; national network; Netlib; netlib; public
                 domain software; Public-domain software; public-domain
                 software; Scientific computing community; scientific
                 computing community; Shopping electronically; shopping
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Public domain software",
  treatment =    "P Practical",

  author =       "J. Dongarra and D. Sorensen and O. Brewer",
  title =        "Tools to aid in the development of high-performance
  crossref =     "Cosnard:1989:PDA",
  pages =        "89--100",
  year =         "1989",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  classcodes =   "C4240 (Programming and algorithm theory); C6115
                 (Programming support); C6130B (Graphics techniques);
                 C5470 (Performance evaluation and testing)",
  conflocation = "Gers, France; 3-6 Oct. 1988",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
  keywords =     "access patterns; computer graphics; debugging;
                 evaluation; Fortran; graphics postprocessor; graphics
                 tool; high-performance computers; memory; package;
                 parallel algorithms; performance; performance analysis;
                 programming environments; SCHEDULE; software tools;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "CNRS",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and D. C. Sorensen and O. Brewer",
  title =        "Tools and methodology for programming parallel
  crossref =     "Wright:1989:ACA",
  pages =        "125--137",
  year =         "1989",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  classcodes =   "C6115 (Programming support); C5440 (Multiprocessor
                 systems and techniques)",
  conflocation = "Stanford, CA, USA; 22-26 Aug. 1988",
  corpsource =   "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
  keywords =     "analysis; debugging; environments; equations; Fortran;
                 linear algebra; methodology; parallel algorithms;
                 parallel processing; parallel programming; parallel
                 programs; partial differential; performance;
                 preprocessor; programming; programming environment;
                 programming parallel processors; Schedule package;
                 software packages; synchronization; transportable
                 numerical software",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Lawrence Livermore Nat. Lab.; Appl. Dynamics Int.;
                 Stanford Univ",
  treatment =    "P Practical",

  author =       "J. Dongarra and I. Duff and J. DuCroz and S.
  title =        "An update notice on the level 3 {BLAS}",
  journal =      j-SIGNUM,
  volume =       "24",
  number =       "1",
  pages =        "9--10",
  month =        jan,
  year =         "1989",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  abstract =     "In April 1987 we published a proposal for a set of
                 Level 3 BLAS (Argonne National Laboratory ANL-MCS-TM
                 88, May 1988). Since then the proposal has been
                 presented and discussed at various meetings, comments
                 have been received, and experience gained in using the
                 Level 3 BLAS to code block-structured algorithms in
                 linear algebra. As a result the authors have decided to
                 make a number of changes to the original proposal. They
                 outline these changes.",
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra)",
  classification = "C4140 (Linear algebra); C7310 (Mathematics)",
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  keywords =     "block-structured algorithms; Block-structured
                 algorithms; Level 3 BLAS; level 3 BLAS; linear algebra;
                 Linear algebra; mathematics computing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Linear algebra; Mathematics computing",

  author =       "Iain S. Duff",
  title =        "Parallel computation at {CERFACS}",
  crossref =     "Dongarra:1990:PPS",
  pages =        "66--67",
  year =         "1989",
  bibdate =      "Fri Nov 11 17:48:17 MST 1994",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and O. Brewer and S. Fineberg and J. A.
  title =        "A Tool to Aid in the Design, Implementation, and
                 Understanding of Matrix Algorithms for Parallel
  type =         "Technical Report",
  number =       "MCS-P115-1189",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  year =         "1989",
  bibdate =      "Tue Oct 09 10:59:08 2007",
  bibsource =    "",
  abstract =     "This paper discusses a tool that aids in the design,
                 development, and understanding of parallel algorithms
                 for high-performance computers. The tool provides a
                 vehicle for studying memory access patterns, different
                 cache strategies, and the effects of multiprocessors on
                 matrix algorithms in a Fortran setting. Such a tool
                 puts the user in a better position to understand where
                 performance problems may occur and enhances the
                 likelihood of increasing the program's performance
                 before actual execution on a high-performance
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Greenbaum and J. Dongarra",
  title =        "Experiments with {QR\slash QL} Methods for the
                 Symmetric Tridiagonal Eigenproblem",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "17 and CS-89-92",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1989",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "UT-CS-89-92, November 1989. LAPACK Working Note
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and J. Dongarra",
  title =        "Evaluating Block Algorithm Variants in {LAPACK}",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "19 and CS-90-103",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "LAPACK Working Note \#19. UT-CS-90-103, April 1990.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and J. Dongarra",
  title =        "Implementation Guide for {LAPACK}",
  type =         "LAPACK Working Note",
  number =       "18",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-90-101, April 1990.",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and Z. Bai and C. Bischof and J. Demmel
                 and J. Dongarra and J. {Du Croz} and A. Greenbaum and
                 S. Hammarling and A. McKenney and D. Sorensen",
  title =        "{LAPACK}: a Portable Linear Algebra Library for
                 High-Performance Computers",
  type =         "LAPACK Working Note",
  number =       "20",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-90-105, May 1990.",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and Z. Bai and C. Bischof and J. Demmel
                 and J. Dongarra and J. DuCroz and A. Greenbaum and S.
                 Hammarling and A. McKenney and D. Sorensen",
  title =        "{LAPACK}: a Portable Linear Algebra Library for
                 High-Performance Computers",
  crossref =     "IEEE:1990:PSN",
  pages =        "2--11",
  year =         "1990",
  bibdate =      "Mon Sep 9 14:47:18 1996",
  bibsource =    "",
  abstract =     "The goal of the LAPACK project is to design and
                 implement a portable linear algebra library for
                 efficient use on a variety of high-performance
                 computers. The library is based on the widely used
                 LINPACK and EISPACK packages for solving linear
                 equations, eigenvalue problems, and linear
                 least-squares problems, but extends their functionality
                 in a number of ways. The major methodology for making
                 the algorithms run faster is to restructure them to
                 perform block matrix operations (e.g., matrix-matrix
                 multiplication) in their inner loops. These block
                 operations may be optimized to exploit the memory
                 hierarchy of a specific architecture. The LAPACK
                 project is also working on new algorithms that yield
                 higher relative accuracy for a variety of linear
                 algebra problems.",
  affiliation =  "Tennessee Univ., Knoxville, TN, USA",
  classification = "C4140 (Linear algebra); C7310 (Mathematics)",
  keywords =     "Block matrix operations; Block operations; Eigenvalue
                 problems; Functionality; Inner loops; LAPACK; Linear
                 equations; Linear least-squares problems; Matrix-matrix
                 multiplication; Memory hierarchy; Portable linear
                 algebra library; Relative accuracy",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  page =         "1--10",
  thesaurus =    "Eigenvalues and eigenfunctions; Matrix algebra;
                 Software portability; Subroutines",

  author =       "E. Anderson and C. Bischof and J. Demmel and J.
                 Dongarra and J. {Du Croz} and S. Hammarling and W.
  title =        "Prospectus for an Extension to {LAPACK}: a Portable
                 Linear Algebra Library for High-Performance Computers",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "26 and CS-90-118",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "LAPACK Working Note \#26. UT-CS-90-118, November
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Angerson and Z. Bai and J. Dongarra and A.
                 Greenbaum and A. McKenney and J. {Du Croz} and S.
                 Hammarling and J. Demmel and C. Bischof and D.
  title =        "{LAPACK}: a portable linear algebra library for
                 high-performance computers",
  crossref =     "IEEE:1990:PSN",
  pages =        "2--11",
  year =         "1990",
  bibdate =      "Wed Apr 15 18:34:48 MDT 1998",
  bibsource =    "",
  classification = "C4140 (Linear algebra); C7310 (Mathematics)",
  corpsource =   "Tennessee Univ., Knoxville, TN, USA",
  keywords =     "block matrix operations; block operations; eigenvalue
                 problems; eigenvalues and eigenfunctions;
                 functionality; inner loops; LAPACK; linear equations;
                 linear least-squares problems; matrix algebra;
                 matrix-matrix multiplication; memory hierarchy;
                 portable linear algebra library; relative accuracy;
                 software portability; subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; ACM; Lawrence Livermore Nat. Lab.; Los Alamos
                 Nat. Lab.; NASA Ames Res. Center; Nat. Center Atmos.
                 Res.; NSF; SIAM; Supercomput. Res. Center",
  treatment =    "P Practical",

  author =       "Jack J. Dongarra and Jeremy {Du Croz} and Sven
                 Hammarling and Iain Duff",
  title =        "{Algorithm 679}: a Set of {Level 3 Basic Linear
                 Algebra Subprograms}: Model Implementation and Test
  journal =      j-TOMS,
  volume =       "16",
  number =       "1",
  pages =        "18--28",
  month =        mar,
  year =         "1990",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  note =         "See also
  URL =          ";
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics)",
  corpsource =   "Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "computers; Fortran 77; high-performance; level 3 basic
                 linear algebra subprograms; mathematics computing;
                 matrix algebra; matrix-matrix operations; portable;
                 program testing; subroutines; test programs",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. Dongarra and G. A. Geist and C. Romine",
  title =        "Computing the eigenvalues and eigenvectors of a
                 general matrix by reduction to tridiagonal form",
  type =         type-TR,
  number =       "ORNL/TM-11669",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  month =        "??",
  year =         "1990",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  note =         "Published in \cite{Dongarra:1992:AFS}.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Sven Hammarling",
  title =        "Evolution of numerical software for dense linear
  crossref =     "Cox:1990:RNC",
  pages =        "297--327",
  year =         "1990",
  MRclass =      "65-04 (65F99)",
  MRnumber =     "1 098 332",
  bibdate =      "Thu Dec 19 14:11:27 MST 1996",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and George A. Geist and C. H. Romine",
  title =        "{Fortran} subroutines for computing the eigenvalues
                 and eigenvectors of a general matrix by reduction to
                 general tridiagonal form",
  type =         "Technical report",
  number =       "CS-90-116",
  institution =  "University of Tennessee, Computer Science Dept.",
  address =      "Knoxville, TN, USA",
  pages =        "13",
  month =        oct,
  year =         "1990",
  bibdate =      "Sat Jan 27 13:40:57 MST 1996",
  bibsource =    "",
  abstract =     "This paper describes programs to reduce a nonsymmetric
                 matrix to tridiagonal form, compute the eigenvalues of
                 the tridiagonal matrix, improve the accuracy of an
                 eigenvalue, and compute the corresponding
  annote =       "Supported in part by the Applied Mathematical Sciences
                 Research Program, Office of Energy Research Supported
                 in part by the U.S. Department of Energy with Martin
                 Marietta Energy Systems Inc.",
  keywords =     "Eigenvalues.; Eigenvectors.; Subroutines (Computer
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and P. Mayes and G. Radicati",
  title =        "The {IBM RISC System\slash 6000} and Linear Algebra
  type =         "LAPACK Working Note",
  number =       "28",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        dec,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-90-122, December 1990.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "The {LINPACK} benchmark: an explanation",
  crossref =     "VanderSteen:1990:ESS",
  pages =        "1--21",
  year =         "1990",
  bibdate =      "Mon Sep 9 13:25:47 MDT 1996",
  bibsource =    "",
  abstract =     "The LINPACK Benchmark was originally designed to
                 assist users of the LINPACK package by providing
                 information on execution times required to solve a
                 system of linear equations. Over the years other data
                 was added and today the collection includes 200
                 different computer systems. In addition the scope of
                 the Benchmark has also expanded. The author attempts to
                 clear up some of the confusion and mystery surrounding
                 the LINPACK Benchmark. He examines what is measured and
                 describes how to interpret the results of the
  acknowledgement = ack-nhfb,
  affiliation =  "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
  classcodes =   "C5470 (Performance evaluation and testing); C6110B
                 (Software engineering techniques)",
  classification = "C5470 (Performance evaluation and testing); C6110B
                 (Software engineering techniques)",
  corpsource =   "Math. and Comput. Sci. Div., Argonne Nat. Lab., IL,
  keywords =     "execution times; Execution times; LINPACK Benchmark;
                 packages; performance evaluation; software; software
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "UK",
  thesaurus =    "Performance evaluation; Software engineering; Software
  treatment =    "P Practical",

  author =       "J. Dongarra and S. Ostrouchov",
  title =        "{LAPACK} Block Factorization Algorithms on the {Intel
                 iPSC\slash 860}",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "24 and CS-90-115",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "LAPACK Working Note \#24. UT-CS-90-115, October,
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and S. Hammarling and J. H. Wilkinson",
  title =        "Numerical Considerations in Computing Invariant
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "25 and CS-90-117",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "1990",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "LAPACK Working Note \#25. UT-CS-90-117, October,
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Performance of various computers using standard linear
                 equations software in a {Fortran} environment",
  type =         "??",
  number =       "CS-89-85",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        "??",
  year =         "1990",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software",
  journal =      j-COMP-ARCH-NEWS,
  volume =       "18",
  number =       "1",
  pages =        "17--31",
  month =        mar,
  year =         "1990",
  CODEN =        "CANED2",
  ISSN =         "0163-5964 (ACM), 0884-7495 (IEEE)",
  ISSN-L =       "0163-5964",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  classcodes =   "C5470 (Performance evaluation and testing)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "ACM SIGARCH Computer Architecture News",
  journal-URL =  "",
  keywords =     "Apollo; computer; CRAY Y-MP; dense systems; IBM PCs;
                 matrix algebra; performance; performance evaluation;
                 scientific workstations; standard linear equations
                 software; Sun; systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack J. Dongarra and Jeremy {Du Croz} and Sven
                 Hammarling and Iain Duff",
  title =        "A Set of Level 3 {Basic Linear Algebra Subprograms}",
  journal =      j-TOMS,
  volume =       "16",
  number =       "1",
  pages =        "1--17",
  month =        mar,
  year =         "1990",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          ";
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics)",
  corpsource =   "Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "hierarchical memory; high-performance computers; level
                 3 basic linear algebra subprograms; mathematics
                 computing; matrix algebra; matrix-matrix; operations;
                 parallel algorithms; parallel processing capability;
                 portable; subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack Dongarra and Alan H. Karp and Ken Kennedy and
                 David Kuck",
  title =        "Special Report: 1989 {Gordon Bell Prize}",
  journal =      j-IEEE-SOFTWARE,
  volume =       "7",
  number =       "3",
  pages =        "100--104",
  month =        may,
  year =         "1990",
  CODEN =        "IESOEG",
  ISSN =         "0740-7459 (print), 0740-7459 (electronic)",
  ISSN-L =       "0740-7459",
  bibdate =      "Sat Jan 13 20:13:27 MST 1996",
  bibsource =    ";
  abstract =     "This year's winning entries both used the Connection
                 Machine to solve oil-industry problems. The winning
                 performance entry ran six times faster than last year's
  fjournal =     "IEEE Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Orlie Brewer and James Arthur Kohl
                 and Samuel Fineberg",
  title =        "A Tool to Aid in the Design, Implementation, and
                 Understanding of Matrix Algorithms for Parallel
  journal =      j-J-PAR-DIST-COMP,
  volume =       "9",
  number =       "2",
  pages =        "185--202",
  month =        jun,
  year =         "1990",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          "",
  classcodes =   "C4240 (Programming and algorithm theory); C6115
                 (Programming support)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  keywords =     "high-; matrix algebra; matrix algorithms; parallel
                 algorithms; performance computers; software tools;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "Nicholas J. Higham",
  title =        "Exploiting Fast Matrix Multiplication Within the Level
                 3 {BLAS}",
  journal =      j-TOMS,
  volume =       "16",
  number =       "4",
  pages =        "352--368",
  month =        dec,
  year =         "1990",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65-04 (65F99)",
  MRnumber =     "1 095 133",
  bibdate =      "Sun Sep 04 23:21:57 1994",
  bibsource =    "",
  note =         "Describes algorithms based on Strassen's method which
                 are asymptotically faster than the standard {$ {N}^3 $}
                 algorithm, and in practice, faster for {$ {N} \approx
                 100 $}, and examines their numerical stability. See
  URL =          "",
  abstract =     "The Level 3 BLAS (BLAS3) are a set of specifications
                 of FORTRAN 77 subprograms for carrying out matrix
                 multiplications and the solution of triangular systems
                 with multiple right-hand sides. They are intended to
                 provide efficient and portable building blocks for
                 linear algebra algorithms on high-performance
                 computers. We describe algorithms for the BLAS3
                 operations that are asymptotically faster than the
                 conventional ones. These algorithms are based on
                 Strassen's method for fast matrix multiplication, which
                 is now recognized to be a practically useful technique
                 once matrix dimensions exceed about 100. We pay
                 particular attention to the numerical stability of
                 these ``fast BLAS3.'' Error bounds are given and their
                 significance is explained and illustrated with the aid
                 of numerical experiments. Our conclusion is that the
                 fast BLAS3, although not as strongly stable as
                 conventional implementations, are stable enough to
                 merit careful consideration in many applications.",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "algorithms",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "{\bf G.1.3}: Mathematics of Computing, NUMERICAL
                 ANALYSIS, Numerical Linear Algebra. {\bf D.3.2}:
                 Software, PROGRAMMING LANGUAGES, Language
                 Classifications, FORTRAN 77.",

  author =       "Robert Schreiber and Jack Dongarra",
  title =        "Automatic Blocking of Nested Loops",
  type =         "Technical report",
  number =       "CS-90-108",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        may,
  year =         "1990",
  bibdate =      "Tue Feb 26 09:44:05 2002",
  bibsource =    "",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and Z. Bai and J. Dongarra",
  title =        "Generalized {$ Q R $} Factorization and its
  type =         "LAPACK Working Note",
  number =       "31",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1991",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-91-131, April 1991.",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and J. Dongarra and S. Ostrouchov",
  title =        "Implementation Guide for {LAPACK}",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "35 and CS-91-138",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "1991",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "LAPACK Working Note \#35. UT-CS-91-138, August 1991.",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and A. Benzoni and J. Dongarra and S.
                 Moulton and S. Ostrouchov and B. Tourancheau and R. van
                 de Geijn",
  title =        "Basic linear algebra communications subprograms",
  crossref =     "Stout:1991:SDM",
  pages =        "287--290",
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. J. Dongarra and G. A. Geist and R.
                 Manchek and V. S. Sunderam",
  title =        "Graphical development tools for network-based
                 concurrent supercomputing",
  crossref =     "IEEE:1991:PSA",
  pages =        "435--444",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  bibsource =    "",
  classification = "C6110P (Parallel programming); C6115 (Programming
                 support); C6180G (Graphical user interfaces)",
  corpsource =   "Oak Ridge Nat Lab., TN, USA",
  keywords =     "application program; graphical development tools;
                 graphical user interfaces; HeNCE; heterogeneous network
                 computing environment; integrated graphical tools;
                 network-based concurrent supercomputing; parallel
                 programming; parallel programs; Parallel Virtual
                 Machine; process management and communication;
                 programming environments; PVM; software package;
                 X-window-based software environment",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",

  author =       "A. Beguelin and J. J. Dongarra and G. A. Geist and R.
                 Manchek and V. S. Sunderam",
  title =        "Heterogeneous network computing",
  crossref =     "IEE:1991:SIS",
  pages =        "94--99",
  month =        apr,
  year =         "1991",
  bibdate =      "Mon Sep 9 07:55:25 MDT 1996",
  bibsource =    "",
  abstract =     "HeNCE (Heterogeneous Network Computing Environment) is
                 a parallel programming paradigm and tool which supports
                 the creation, compilation, execution, debugging, and
                 analysis of parallel programs for a heterogeneous group
                 of computers. The HeNCE programmer specifies the
                 parallelism of a computation by drawing a graph
                 describing the dependencies between user defined
                 procedures. HeNCE will then automatically execute these
                 procedures on a user defined collection of machines on
                 some network. Different versions of a procedure may
                 exist for different architectures. HeNCE executes the
                 appropriate version of a procedure for a chosen target
                 machine architecture. HeNCE maps procedures to machines
                 based on a user defined cost matrix. The HeNCE user
                 dynamically configures a parallel collection of
                 machines, referred to as a parallel virtual machine, on
                 which the HeNCE program is to be run.",
  affiliation =  "Oak Ridge Lab., TN, USA",
  classification = "C5620 (Computer networks and techniques); C6110P
                 (Parallel programming); C6115 (Programming support)",
  keywords =     "HeNCE; Parallel programming paradigm; Parallel
                 programs; Tool",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Computer networks; Parallel programming; Software
                 tools",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and V. S. Sunderam",
  title =        "Heterogeneous network supercomputing",
  journal =      j-SUPERCOMPUTING-REVIEW,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  month =        aug,
  year =         "1991",
  CODEN =        "SURVEG",
  ISSN =         "1048-6836",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  fjournal =     "Supercomputing Review",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and K. Moore and R. Wade",
  title =        "{HeNCE}: a user's guide {(Draft)}",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  month =        nov,
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and V. S. Sunderam",
  title =        "Opening the door to heterogeneous network
                 supercomputing",
  journal =      j-SUPERCOMPUTING-REVIEW,
  volume =       "??",
  number =       "??",
  pages =        "44--45",
  month =        sep,
  year =         "1991",
  CODEN =        "SURVEG",
  ISSN =         "1048-6836",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and V. S. Sunderam",
  title =        "Solving computational grand challenges using a network
                 of heterogeneous supercomputers",
  crossref =     "Dongarra:1992:PFS",
  pages =        "??--??",
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. J. Dongarra and A. Geist and R.
                 Manchek and V. Sunderam",
  title =        "A Users' Guide to {PVM} ({Parallel Virtual Machine})",
  type =         type-TR,
  number =       "ORNL/TM-11826",
  institution =  inst-MSS-ORNL,
  address =      inst-MSS-ORNL:adr,
  month =        jul,
  year =         "1991",
  bibdate =      "Tue Mar 05 17:31:39 2002",
  bibsource =    "",
  keywords =     "prll, operating system",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Adam Beguelin and Jack Dongarra and Al Geist and
                 Robert Manchek and Vaidy Sunderam",
  title =        "Workstation Solutions: Opening the Door to
                 Heterogeneous Network Supercomputing",
  journal =      j-SUPERCOMPUTING-REVIEW,
  volume =       "4",
  number =       "9",
  pages =        "44--45",
  month =        sep,
  year =         "1991",
  CODEN =        "SURVEG",
  ISSN =         "1048-6836",
  bibdate =      "Sat Jan 13 20:13:27 MST 1996",
  bibsource =    "",
  URL =          "",
  fjournal =     "Supercomputing Review",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. J. Dongarra and G. A. Geist and R.
                 Manchek and V. S. Sunderam",
  booktitle =    "Second International Specialist Seminar on the Design
                 and Application of Parallel Digital Processors: 15--19
                 April 1991, venue, the Gulbenkian Foundation, Lisbon,
                 Portugal",
  title =        "Heterogeneous network computing",
  number =       "334",
  publisher =    pub-IEE,
  address =      pub-IEE:adr,
  bookpages =    "vii + 152",
  pages =        "??--??",
  year =         "1991",
  ISBN =         "0-85296-519-2",
  ISBN-13 =      "978-0-85296-519-1",
  ISSN =         "0537-9989",
  LCCN =         "QA76.58 .I567 1991",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6115 (Programming support); C6110P (Parallel
                 programming); C5620 (Computer networks and
                 techniques)",
  conflocation = "Lisbon, Portugal; 15-19 April 1991",
  corpsource =   "Oak Ridge Lab., TN, USA",
  keywords =     "computer networks; HeNCE; parallel; parallel
                 programming; parallel programming paradigm; programs;
                 software tools; tool",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Office of Naval Res. Eur. Office",
  treatment =    "P Practical",

  author =       "James Demmel and Jack Dongarra and W. Kahan",
  title =        "On Designing Portable High Performance Numerical
                 Libraries",
  type =         "LAPACK Working Note",
  number =       "39",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jul,
  year =         "1991",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-91-141, July, 1991.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Demmel and J. Dongarra and W. Kahan",
  title =        "On Designing Portable High Performance Numerical
                 Libraries",
  crossref =     "Griffiths:1991:NAP",
  pages =        "??--??",
  month =        jun,
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and W. Gentzsch",
  title =        "Benchmarking of High-Performance Computers",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "17",
  number =       "10--11",
  pages =        "1067--1069",
  month =        "????",
  year =         "1991",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and A. Karp and K. Miura and H. D.
                 Simon",
  title =        "{Gordon Bell Prize} lectures (supercomputer
  crossref =     "IEEE:1991:PSA",
  pages =        "328--337",
  year =         "1991",
  bibdate =      "Wed Apr 15 16:28:01 MDT 1998",
  bibsource =    "",
  URL =          "",
  classification = "C5440 (Multiprocessor systems and techniques)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "128-node Intel iPSC/860; compiler speedup; Connections
                 Machine; electronic structure; floating point
                 processors; Fortran 77; Fortran 90; grid generation
                 program; parallel processing; partial differential
                 equation; price/performance award; scientific and
                 engineering problems; supercomputers",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; ACM",
  treatment =    "G General Review; P Practical",

  author =       "J. J. Dongarra and P. Mayes and G. {Radicati di
                 Brozolo}",
  title =        "The {IBM RISC System\slash 6000} and Linear Algebra
                 Operations",
  journal =      j-SUPERCOMPUTER,
  volume =       "8",
  number =       "4",
  pages =        "15--30",
  month =        jul,
  year =         "1991",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  abstract =     "The paper discusses the IBM RISC System/6000
                 workstation and a set of experiments with blocked
                 algorithms commonly used in solving problems in
                 numerical linear algebra. The authors describe the
                 performance of these algorithms and discuss the
                 techniques used in achieving high performance on such
                 an architecture.",
  acknowledgement = ack-nhfb,
  affiliation =  "Math. Sci. Section, Oak Ridge Nat. Lab., TN, USA",
  classcodes =   "C5420 (Mainframes and minicomputers); C5470
                 (Performance evaluation and testing); C4140 (Linear
                 algebra)",
  classification = "C4140 (Linear algebra); C5420 (Mainframes and
                 minicomputers); C5470 (Performance evaluation and
                 testing)",
  corpsource =   "Math. Sci. Section, Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "Supercomputer",
  keywords =     "blocked algorithms; Blocked algorithms; Floating point
                 performance; floating point performance; IBM computers;
                 IBM RISC System/6000; IBM RISC System/6000 workstation;
                 linear algebra; numerical linear algebra; Numerical
                 linear algebra; performance evaluation; reduced
                 instruction set computing; workstation",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  thesaurus =    "IBM computers; Linear algebra; Performance evaluation;
                 Reduced instruction set computing",
  treatment =    "P Practical",

  author =       "J. Dongarra",
  title =        "{LAPACK}: a Portable High Performance Numerical
                 Library for Linear Algebra",
  crossref =     "Anonymous:1991:PIS",
  pages =        "73--76",
  year =         "1991",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and J. Demmel",
  title =        "{LAPACK}: a portable high-performance numerical
                 library for linear algebra",
  journal =      j-SUPERCOMPUTER,
  volume =       "8",
  number =       "6",
  pages =        "33--38",
  month =        nov,
  year =         "1991",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Mon Sep 9 07:55:25 MDT 1996",
  bibsource =    "",
  abstract =     "High quality portable numerical libraries have existed
                 for many years. These libraries, such as LINPACK and
                 EISPACK, were designed to be accurate, robust,
                 efficient and portable in a Fortran environment of
                 conventional uniprocessors, diverse floating-point
                 arithmetics, and limited input data structures. These
                 libraries are no longer adequate on modern
                 high-performance computer architectures. The authors
                 describe their inadequacies and how they are addressing
                 them in the LAPACK project, a library of numerical
                 linear algebra routines designed to supplant LINPACK
                 and EISPACK. They show how the new architectures lead
                 to important changes in the goals as well as the
                 methods of library design.",
  affiliation =  "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  classcodes =   "C7310 (Mathematics)",
  classification = "C7310 (Mathematics)",
  conflocation = "Fukuoka, Japan; 6-8 Nov. 1991",
  conftitle =    "International Symposium on Supercomputing '91",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  fjournal =     "Supercomputer",
  keywords =     "Fortran environment; LAPACK; LAPACK project; linear
                 algebra; mathematics computing; numerical linear
                 algebra routines; Numerical linear algebra routines;
                 Portable numerical libraries; portable numerical
                 libraries; project; software packages; subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Linear algebra; Mathematics computing; Software
                 packages; Subroutines",
  treatment =    "P Practical",

  author =       "J. Dongarra",
  title =        "{LAPACK Working Note} 34: {Workshop} on the {BLACS}",
  type =         type-CSDTR,
  number =       "CS-91-134",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        may,
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Robert A. {van de Geijn}",
  title =        "{LAPACK} Working Note 37: Two dimensional basic linear
                 algebra communications subprograms",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  day =          "28",
  month =        oct,
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Proposed Standard.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Bill Rosener",
  title =        "{NA-NET}: {Numerical} Analysis {NET}",
  type =         "Technical Report",
  number =       "CS-91-146",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  pages =        "21",
  month =        sep,
  year =         "1991",
  bibdate =      "Wed Sep 28 14:04:23 2011",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and M. Sidani",
  title =        "A Parallel Algorithm for the Non-Symmetric Eigenvalue
                 Problem",
  type =         "Report",
  number =       "ORNL/TM-12003",
  institution =  inst-MSS-ORNL,
  address =      inst-MSS-ORNL:adr,
  month =        "??",
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  keywords =     "nla, prll, eig, nonsymmetric matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and M. Sidani",
  title =        "A Parallel Algorithm for the Non-Symmetric Eigenvalue
                 Problem",
  type =         type-CSDTR,
  number =       "CS-91-137",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and M. Furtney and S. Reinhardt and J.
                 Russell",
  title =        "Parallel loops --- a test suite for parallelizing
                 compilers: description and example results",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "17",
  number =       "10--11",
  pages =        "1247--1255",
  month =        dec,
  year =         "1991",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  abstract =     "Several multiprocessor systems are now commercially
                 available, and advances in compiler technology provide
                 automatic conversion of programs to run on such
                 systems. However, no accepted measure of this parallel
                 compiler ability exists. This paper presents a test
                 suite of subroutines and loops, called parallel loops,
                 designed to (1) measure the ability of parallelizing
                 compilers to convert code to run in parallel and (2)
                 determine how effectively parallel hardware and
                 software work together to achieve high performance
                 across a range of problem sizes. In addition, they
                 present the results of compiling this suite using two
                 commercially available parallelizing Fortran compilers,
                 Cray and Convex.",
  affiliation =  "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  classcodes =   "C6150C (Compilers, interpreters and other processors);
                 C5440 (Multiprocessor systems and techniques)",
  classification = "C5440 (Multiprocessor systems and techniques);
                 C6150C (Compilers, interpreters and other processors)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  keywords =     "Convex; Cray; Fortran; hardware; Loops; loops;
                 multiprocessing systems; multiprocessor systems;
                 Multiprocessor systems; parallel; Parallel hardware;
                 parallel loops; Parallel loops; parallelizing
                 compilers; Parallelizing compilers; program compilers;
                 Subroutines; subroutines; test suite; Test suite",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  thesaurus =    "Multiprocessing systems; Program compilers",
  treatment =    "P Practical",

  author =       "J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",
  type =         "??",
  number =       "CS-89-85",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        "??",
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. A. {van de Geijn}",
  title =        "Reduction to Condensed Form for the Eigenvalue Problem
                 on Distributed Memory Architectures",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "30 and CS-91-130 and ORNL/TM-12006",
  institution =  inst-UTK-CS # " and " # inst-MSS-ORNL,
  address =      inst-UTK-CS:adr # " and " # inst-MSS-ORNL:adr,
  month =        apr,
  year =         "1991",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "LAPACK Working Note \#30, to appear in {\em Parallel
                 Computing}. UT-CS-91-130, April 1991.",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "nla, prll, eig, distributed memory, Hessenberg matrix,
                 tridiagonal matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Iain S. Duff and Danny C.
                 Sorensen and Henk A. {van der Vorst}",
  title =        "Solving Linear Systems on Vector and Shared Memory
                 Computers",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "x + 256",
  year =         "1991",
  ISBN =         "0-89871-270-X",
  ISBN-13 =      "978-0-89871-270-4",
  LCCN =         "QA184 .S65 1991",
  bibdate =      "Mon Oct 26 07:30:53 1998",
  bibsource =    ";
                 MathSciNet database",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  tableofcontents = "Introduction / 1 \\
                 1 Vector and Parallel Processing / 3 \\
                 1.1 Traditional Computers and Their Limitations / 3 \\
                 1.2 Parallelism within a Single Processor / 4 \\
                 1.2.1 Multiple Functional Units / 4 \\
                 1.2.2 Pipelining / 4 \\
                 1.2.3 Overlapping / 6 \\
                 1.2.5 VLIW / 8 \\
                 1.2.6 Vector Instructions / 8 \\
                 1.2.7 Chaining / 9 \\
                 1.2.8 Memory-to-Memory and Register-to-Register
                 Organizations / 10 \\
                 1.2.9 Register Set / 10 \\
                 1.2.10 Stripmining / 11 \\
                 1.2.11 Reconfigurable Vector Registers / 11 \\
                 1.2.12 Memory Organization / 12 \\
                 1.3 Data Organization / 14 \\
                 1.3.1 Main Memory / 14 \\
                 1.3.2 Cache / 16 \\
                 1.3.3 Local Memory / 18 \\
                 1.4 Memory Management / 18 \\
                 1.5 Parallelism through Multiple Pipes or Multiple
                 Processors / 21 \\
                 1.6 Interconnection Topology / 22 \\
                 1.6.1 Crossbar Switch / 23 \\
                 1.6.2 Timeshared Bus / 24 \\
                 1.6.3 Ring Connection / 25 \\
                 1.6.4 Mesh Connection / 25 \\
                 1.6.5 Hypercube / 26 \\
                 1.6.6 Multistaged Network / 27 \\
                 1.7 Programming Techniques / 29 \\
                 2 Overview of Current High-Performance Computers / 33 \\
                 2.1 Supercomputers / 33 \\
                 2.2 Mini-Supercomputers / 36 \\
                 2.3 Vector Mainframes / 37 \\
                 2.4 Novel Parallel Processors / 37 \\
                 3 Implementation Details and Overhead / 43 \\
                 3.1 Parallel Decomposition and Data Dependency Graphs /
                 43 \\
                 3.2 Synchronization / 46 \\
                 3.3 Load Balancing / 48 \\
                 3.4 Recurrence / 49 \\
                 3.5 Indirect Addressing / 51 \\
                 4 Performance: Analysis, Modeling, and Measurements /
                 53 \\
                 4.1 Amdahl's Law / 54 \\
                 4.1.1 Simple Case of Amdahl's Law / 54 \\
                 4.1.2 General Form of Amdahl's Law / 55 \\
                 4.2 Vector Speed and Vector Length / 56 \\
                 4.3 Amdahl's Law-Parallel Processing / 57 \\
                 4.3.1 A Simple Model / 60 \\
                 4.3.2 Gustafson's Model / 60 \\
                 4.4 Examples of $(r_\infty, n_{1/2})$-values for
                 Various Computers / 60 \\
                 4.4.1 CRAY-1 and CRAY-2 (one processor) / 62 \\
                 4.4.2 CRAY X-MP (one processor; clock cycle time 8.5
                 nsec) / 63 \\
                 4.4.3 CYBER 205 (2-pipe) and ETA-10P (single processor)
                 / 63 \\
                 4.4.4 IBM 3090/VF (1 processor; clock cycle time 18.5
                 nsec) / 64 \\
                 4.4.5 NEC SX/2 / 65 \\
                 4.4.6 Convex C-1 and Convex C-210 / 66 \\
                 4.4.7 Alliant FX/80 / 66 \\
                 4.4.8 General Observations / 68 \\
                 4.5 LINPACK Benchmark / 68 \\
                 4.5.1 Description of the Benchmark / 69 \\
                 4.5.2 Calls to the BLAS / 69 \\
                 4.5.3 Asymptotic Performance / 75 \\
                 5 Building Blocks in Linear Algebra / 75 \\
                 5.1 Basic Linear Algebra Subprograms / 75 \\
                 5.1.1 Level 1 BLAS / 76 \\
                 5.1.2 Level 2 BLAS / 77 \\
                 5.1.3 Level 3 BLAS / 78 \\
                 5.2 Levels of Parallelism / 81 \\
                 5.2.1 Vector Computers / 81 \\
                 5.2.2 Parallel Processors with Shared Memory / 82 \\
                 5.2.3 Parallel-Vector Computers / 83 \\
                 5.2.4 Clusters of Parallel Vector Processors / 84 \\
                 5.3 Basic Factorizations of Linear Algebra / 84 \\
                 5.3.1 Point Algorithm: Gaussian Elimination with
                 Partial Pivoting / 84 \\
                 5.3.2 Special Matrices / 86 \\
                 5.4 Blocked Algorithms: Matrix-Vector and Matrix-Matrix
                 Versions / 89 \\
                 5.4.1 Right-Looking Algorithm / 90 \\
                 5.4.2 Left-Looking Algorithm / 92 \\
                 5.4.3 Crout Algorithm / 93 \\
                 5.4.4 Typical Performance of Blocked LU Decomposition /
                 94 \\
                 5.4.5 Blocked Symmetric Indefinite Factorization / 95 \\
                 5.4.6 Typical Performance of Blocked Symmetric
                 Indefinite Factorization. / 98 \\
                 5.5 Linear Least Squares / 98 \\
                 5.5.1 Householder Method / 99 \\
                 5.5.2 Blocked Householder Method / 100 \\
                 5.5.3 Typical Performance of the Blocked Householder
                 Factorization / 101 \\
                 5.6 Organization of the Modules / 102 \\
                 5.6.1 Matrix--Vector Product / 102 \\
                 5.6.2 Matrix--Matrix Product / 103 \\
                 5.6.3 Typical Performance for Parallel Processing / 104 \\
                 5.6.4 Benefits / 105 \\
                 5.7 LAPACK / 106 \\
                 6 Direct Solution of Sparse Linear Systems / 109 \\
                 6.1 Introduction to Direct Methods for Sparse Linear
                 Systems / 111 \\
                 6.1.1 Three Approaches / 111 \\
                 6.1.2 Description of Sparse Data Structure / 112 \\
                 6.1.3 Manipulation of Sparse Data Structure / 114 \\
                 6.2 General Sparse Matrix Methods / 116 \\
                 6.3 Methods for Symmetric Matrices and Band Systems /
                 124 \\
                 6.3.1 The Clique Concept in Gaussian Elimination / 125 \\
                 6.3.2 Code Performance and Symmetry / 128 \\
                 6.4 Frontal Methods / 130 \\
                 6.4.1 Organization / 130 \\
                 6.4.2 Vector Performance / 132 \\
                 6.5 Multifrontal Methods / 135 \\
                 6.5.1 Performance on Vector Machines / 139 \\
                 6.5.2 Performance on Parallel Machines / 139 \\
                 6.6 Other Approaches for Exploitation of Parallelism /
                 141 \\
                 6.7 Software / 141 \\
                 6.8 Brief Summary / 142 \\
                 7 Iterative Solution of Sparse Linear Systems / 143 \\
                 7.1 Iterative Methods / 145 \\
                 7.1.1 Conjugate Gradient / 145 \\
                 7.1.2 Least Squares Conjugate Gradients / 148 \\
                 7.1.3 Biconjugate Gradients / 150 \\
                 7.1.4 Conjugate Gradient Squared / 152 \\
                 7.1.5 GMRES and GMRES(m) / 154 \\
                 7.1.6 Adaptive Chebychev / 156 \\
                 7.2 Vector and Parallel Aspects / 158 \\
                 7.2.1 General Remarks / 158 \\
                 7.2.2 Sparse Matrix-Vector Multiplication / 160 \\
                 7.2.3 Performance of the Unpreconditioned Methods / 164 \\
                 7.3 Preconditioning / 165 \\
                 7.3.1 General Aspects / 165 \\
                 7.3.2 Efficient Implementations / 168 \\
                 7.3.3 Partial Vectorization / 170 \\
                 7.3.4 Reordering the Unknowns / 172 \\
                 7.3.5 Changing the Order of Computation / 174 \\
                 7.3.6 Some Other Vectorizable Preconditioners / 180 \\
                 7.3.7 Parallel Aspects / 183 \\
                 7.4 Experiences with Parallelism / 186 \\
                 7.4.1 General Remarks / 186 \\
                 7.4.2 Overlapping Local Preconditioners / 186 \\
                 7.4.3 Repeated Twisted Factorization / 188 \\
                 7.4.4 Twisted and Nested Twisted Factorization / 189 \\
                 7.4.5 Hyperplane Ordering / 189 \\
                 A Acquiring Mathematical Software / 191 \\
                 B Glossary / 197 \\
                 C Information on Various High-Performance Computers /
                 213 \\
                 D Level 1, 2, and 3 BLAS Quick Reference / 221 \\
                 E Operation Counts for Various BLAS and Decompositions
                 / 227 \\
                 Index / 247",

  author =       "Jack Dongarra and Alan Karp and Ken Miura and Horst
                 D. Simon",
  title =        "Special Report: 1990 {Gordon Bell Prize}",
  journal =      j-IEEE-SOFTWARE,
  volume =       "8",
  number =       "3",
  pages =        "92--98",
  month =        may,
  year =         "1991",
  CODEN =        "IESOEG",
  ISSN =         "0740-7459 (print), 0740-7459 (electronic)",
  ISSN-L =       "0740-7459",
  bibdate =      "Tue Jan 9 17:09:45 MST 1996",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Robert A. van de Geijn",
  title =        "Two dimensional {Basic Linear Algebra Communication
                 Subprograms}",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "37 and CS-91-138",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "1991",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and others",
  title =        "A Users' Guide to {PVM Parallel Virtual Machine}",
  organization = inst-ORNL,
  address =      inst-ORNL:adr,
  pages =        "??",
  month =        jul,
  year =         "1991",
  bibdate =      "Mon Jan 15 17:51:23 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "Workshop on the {BLACS}",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "34 and CS-91-134",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1991",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "LAPACK Working Note \#34. UT-CS-91-134, May 1991.",
  URL =          "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. Levine and D. Callahan and J. Dongarra",
  title =        "A Comparative Study of Automatic Vectorizing
                 Compilers",
  type =         "??",
  number =       "MCS-P218-0391",
  institution =  inst-ANL,
  address =      inst-ANL:adr,
  month =        "??",
  year =         "1991",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. Levine and D. Callahan and J. Dongarra",
  title =        "A comparative study of automatic vectorizing
                 compilers",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "17",
  number =       "10--11",
  pages =        "1223--1244",
  month =        dec,
  year =         "1991",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  abstract =     "The authors compare the capabilities of several
                 commercially available, vectorizing Fortran compilers
                 using a test suite of Fortran loops. They present the
                 results of compiling and executing these loops on a
                 variety of supercomputers, mini-supercomputers, and
                 mainframes.",
  acknowledgement = ack-nhfb,
  affiliation =  "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  classcodes =   "C6150C (Compilers, interpreters and other processors);
                 C5440 (Multiprocessor systems and techniques); C6140D
                 (High level languages)",
  classification = "C5440 (Multiprocessor systems and techniques);
                 C6140D (High level languages); C6150C (Compilers,
                 interpreters and other processors)",
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  keywords =     "Automatic vectorizing compilers; automatic vectorizing
                 compilers; FORTRAN; Mainframes; mainframes;
                 Minisupercomputers; minisupercomputers; parallel
                 processing; program compilers; Supercomputers;
                 supercomputers",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  thesaurus =    "FORTRAN; Parallel processing; Program compilers",
  treatment =    "P Practical",

  author =       "E. Anderson and Z. Bai and J. Dongarra",
  title =        "Generalized {$ Q R $} factorization and its
                 applications",
  journal =      j-LINEAR-ALGEBRA-APPL,
  volume =       "162/164",
  pages =        "243--271",
  year =         "1992",
  CODEN =        "LAAPAW",
  DOI =          "",
  ISSN =         "0024-3795 (print), 1873-1856 (electronic)",
  ISSN-L =       "0024-3795",
  MRclass =      "65F15 15A23",
  MRnumber =     "92j:65050",
  bibdate =      "Thu Dec 19 14:07:22 1996",
  bibsource =    "",
  note =         "Directions in matrix theory (Auburn, AL, 1990).",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Linear Algebra and its Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and A. Benzoni and J. Dongarra and S.
                 Moulton and S. Ostrouchov and B. Tourancheau and R.
                 {van de Geijn}",
  title =        "{LAPACK} for distributed memory architectures:
                 progress report",
  crossref =     "Dongarra:1992:PFS",
  pages =        "625--630",
  year =         "1992",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra); C5440
                 (Multiprocessor systems and techniques); C4170
                 (Differential equations)",
  conflocation = "Houston, TX, USA; 25-27 March 1991",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TX,
  keywords =     "algebraic eigenvalue problem; algorithms; block;
                 Cholesky decomposition; distributed memory
                 architectures; distributed memory systems; eigenvalues
                 and eigenfunctions; Hessenberg and; Intel; iPSC/860;
                 LAPACK; linear algebra; linear algebra subroutine
                 library; LU; mathematics computing; QR; routines;
                 subset of; tridiagonal reduction",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "SIAM",
  treatment =    "P Practical",

  author =       "E. Anderson and Z. Bai and C. Bischof and J. Demmel
                 and J. Dongarra and J. {Du Croz} and A. Greenbaum and
                 S. Hammarling and A. McKenney and S. Ostrouchov and D.
  title =        "{LAPACK} Users' Guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xv + 235",
  year =         "1992",
  ISBN =         "0-89871-294-7",
  ISBN-13 =      "978-0-89871-294-0",
  LCCN =         "QA76.73.F25 L36 1992",
  bibdate =      "Tue Dec 14 22:36:17 1993",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  tableofcontents = "Part 1: Guide / 1 \\
                 1: Essentials / 3 \\
                 2: Contents of LAPACK / 7 \\
                 3: Performance of LAPACK / 34 \\
                 4: Accuracy and Stability / 44 \\
                 5: Documentation and Software Conventions / 61 \\
                 6: Installing LAPACK Routines / 71 \\
                 7: Troubleshooting / 75 \\
                 A: Index of Driver and Computational Routines / 79 \\
                 B: Index of Auxiliary Routines / 89 \\
                 C: Quick Reference Guide to the BLAS / 96 \\
                 D: Converting from LINPACK or EISPACK / 101 \\
                 E: LAPACK Working Notes / 109 \\
                 Bibliography / 112 \\
                 Index / 116 \\
                 Part 2: Specifications of Routines / 119",

  author =       "Edward Anderson and Jack Dongarra",
  title =        "Performance of {LAPACK}: a Portable Library of
                 Numerical Linear Algebra Routines",
  type =         "LAPACK Working Note",
  number =       "44",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1992",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-92-156, May 1992.",
  URL =          ";
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Mario Arioli and Iain S. Duff and Daniel Ruiz and
                 Miloud Sadkane",
  editor =       "J. Dongarra and K. Kennedy and P. Messina and D. C.
                 Sorensen and R. G. Voigt",
  booktitle =    "Proceedings of Fifth {SIAM} Conference on Parallel
                 Processing for Scientific Computing",
  title =        "Techniques for accelerating the Block {Cimmino}
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "98--104",
  year =         "1992",
  bibdate =      "Fri Nov 11 17:48:17 MST 1994",
  note =         "Also reprinted in Proceedings of One-day Workshop on
                 Parallel Numerical Analysis, 21 June 1991. Editors D B
                 Duncan, K I M Mc Kinnon, and F Plab. Report
                 EPCC-TR92-05, Edinburgh Parallel Computing Centre,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Adam Beguelin and Jack J. Dongarra and others",
  title =        "Graphical Development Tools for Network-Based
                 Concurrent Supercomputing",
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  note =         "HeNCE document",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Adam Beguelin and Jack J. Dongarra and Al Geist and
                 Robert Manchek and Keith Moore and Reed Wade and Vaidy
  title =        "{HeNCE}: {Graphical} Development Tools for
                 Network-Based Concurrent Computing",
  crossref =     "IEEE:1992:SHP",
  pages =        "129--136",
  year =         "1992",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  note =         "IEEE catalog number 92TH0432-5.",
  acknowledgement = ack-nhfb,
  classcodes =   "C6115 (Programming support); C6150C (Compilers,
                 interpreters and other processors); C6180G (Graphical
                 user interfaces); C6130B (Graphics techniques); C6110P
                 (Parallel programming)",
  conflocation = "Williamsburg, VA, USA; 26-29 April 1992",
  corpsource =   "Oak Ridge Nat. Lab., TN, USA",
  keyword =      "network supercomputing, distributed computing,
                 graphical programming",
  keywords =     "compilers; distributed virtual computer; graphical;
                 graphical development; graphical parallel programming
                 environment; graphical user interfaces; HeNCE;
                 heterogeneous machines; heterogeneous network computing
                 environment; interface; network-based concurrent
                 computing; parallel programming; program; program
                 compiler; program debugging; programming environments;
                 PVM; software tools; tools; Unix; workstation; X
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE",
  treatment =    "P Practical",

  author =       "Adam Beguelin and Jack J. Dongarra and others",
  title =        "{HeNCE}: a Users' Guide Version 1.2",
  organization = inst-ORNL,
  address =      inst-ORNL:adr,
  pages =        "??",
  month =        Feb,
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and V. Sunderam",
  title =        "{PVM} and {HeNCE}: traversing the parallel
  journal =      j-CRAY-CHANNELS,
  volume =       "14",
  number =       "4",
  pages =        "22--25",
  month =        "Fall",
  year =         "1992",
  CODEN =        "CRCHE8",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6110P (Parallel programming); C6150N (Distributed
                 systems); C5440 (Multiprocessor systems and
                 techniques); C7430 (Computer engineering)",
  corpsource =   "Carnegie-Mellon Univ., Pittsburgh, PA, USA",
  fjournal =     "CRAY Channels",
  keywords =     "cost-effective use; Cray Research MPP systems; diverse
                 architectures; diverse computer systems; HeNCE;
                 Heterogeneous Network Computing Environment;
                 heterogeneous networks; Machine; network operating
                 systems; networked resources; packages; parallel;
                 parallel machines; Parallel Virtual; portability;
                 programming; PVM; software; software packages; virtual
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; R Product Review",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and V. Sunderam",
  title =        "Solving computational grand challenges using a network
                 of heterogeneous supercomputers",
  crossref =     "Dongarra:1992:PFS",
  pages =        "596--601",
  year =         "1992",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6115 (Programming support); C6110P (Parallel
                 programming); C7430 (Computer engineering); C5440
                 (Multiprocessor systems and techniques); C5620W (Other
  conflocation = "Houston, TX, USA; 25-27 March 1991",
  corpsource =   "Oak Ridge Nat. Lab., Tennessee Univ., Knoxville, TN,
  keywords =     "CM2; computational grand challenges; Cray XMP;
                 environments; flexibility; high speed network; Intel
                 iPSC/860; network of heterogeneous; parallel
                 processing; parallel programming; parallel virtual
                 machine; programming; supercomputers; Thinking
                 Machines; virtual computer; virtual machines; wide area
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "SIAM",
  treatment =    "P Practical",

  author =       "Susan Blackford and Jack Dongarra",
  title =        "Installation Guide for {LAPACK}",
  type =         "LAPACK Working Note",
  number =       "41",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        mar,
  year =         "1992",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-92-151, March, 1992.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Choi and J. J. Dongarra and D. W. Walker",
  title =        "The design of distributed level 3 {BLAS} routines",
  howpublished = "??",
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  note =         "in preparation",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Choi and J. J. Dongarra and R. Pozo and D. W.
  title =        "{ScaLAPACK}: a Scalable Linear Algebra Library for
                 Distributed Memory Concurrent Computers",
  crossref =     "Siegel:1992:FSF",
  pages =        "120--127",
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and Jack J. Dongarra and Roldan Pozo and
                 David W. Walker",
  title =        "{ScaLAPACK}: a Scalable Linear Algebra for Distributed
                 Memory Concurrent Computers",
  type =         "LAPACK Working Note",
  number =       "55",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1992",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "UT-CS-92-181, November 1992.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Choi and J. J. Dongarra and R. Pozo and D. W.
  title =        "{ScaLAPACK}: a scalable linear algebra library for
                 distributed memory concurrent computers",
  crossref =     "Siegel:1992:FSF",
  pages =        "120--127",
  year =         "1992",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  note =         "IEEE catalog number 92CH3185-6.",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra); C6110J
                 (Object- oriented programming); C5470 (Performance
                 evaluation and testing); C5440 (Multiprocessor systems
                 and techniques)",
  conflocation = "McLean, VA, USA; 19-21 Oct. 1992",
  corpsource =   "Oak Ridge Nat. Lab., TN, USA",
  keywords =     "algorithm; computations; computing; distributed;
                 distributed memory systems; distributed memory version;
                 evaluation; Intel Delta multicomputer; Level 3 BLAS;
                 library routines; linear algebra; mathematics; matrix;
                 memory concurrent computers; object-oriented interface;
                 object-oriented programming; performance; right-looking
                 LU factorization; scalable linear algebra library;
                 ScaLAPACK; software package; software packages; square
                 block scattered decomposition",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; NASA",
  treatment =    "A Application; P Practical",

  author =       "James W. Demmel and Nicholas J. Higham",
  title =        "Stability of Block Algorithms with Fast Level-3
  journal =      j-TOMS,
  volume =       "18",
  number =       "3",
  pages =        "274--291",
  month =        sep,
  year =         "1992",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Fri Sep 30 01:27:16 1994",
  bibsource =    "",
  note =         "See
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Iain S. Duff",
  editor =       "H. Adeli",
  booktitle =    "Supercomputing in Engineering Analysis",
  title =        "Advanced architecture computers",
  publisher =    pub-MARCEL-DEKKER,
  address =      pub-MARCEL-DEKKER:adr,
  pages =        "19--62",
  year =         "1992",
  bibdate =      "Fri Nov 11 17:48:17 MST 1994",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and G. A. Geist and C. H. Romine",
  title =        "{Algorithm 710}: {FORTRAN} Subroutines for Computing
                 the Eigenvalues and Eigenvectors of a General Matrix by
                 Reduction to General Tridiagonal Form",
  journal =      j-TOMS,
  volume =       "18",
  number =       "4",
  pages =        "392--400",
  month =        dec,
  year =         "1992",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Fri Sep 30 00:52:57 1994",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics)",
  corpsource =   "Math. Sci. Syst., Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "dense nonsymmetric matrix; eigenpairs; eigenvalues;
                 eigenvalues and eigenfunctions; eigenvectors; EISPACK
                 paths; FORTRAN subroutines; general; generation
                 tridiagonal form; HQR-INVIT; mathematics computing;
                 matrix; matrix algebra; nonsymmetric matrix; RG;
                 subroutines; tridiagonal matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack Dongarra",
  title =        "Book Reviews: {{\booktitle{The Connection Machine}}}",
  journal =      j-IJSA,
  volume =       "1",
  number =       "1",
  pages =        "112--112",
  month =        mar,
  year =         "1987",
  CODEN =        "IJSAE9",
  DOI =          "",
  ISSN =         "0890-2720",
  bibdate =      "Tue Nov 6 11:28:49 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "The International Journal of Supercomputer
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Editorial",
  journal =      j-IJSA,
  volume =       "6",
  number =       "4",
  pages =        "313--313",
  month =        "Winter",
  year =         "1992",
  CODEN =        "IJSAE9",
  ISSN =         "0890-2720",
  bibdate =      "Fri Aug 23 07:32:35 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "The International Journal of Supercomputer
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. {van de Geijn} and D. W.
  title =        "A Look at Scalable Dense Linear Algebra Libraries",
  type =         type-TR,
  number =       "ORNL/TM-12126",
  institution =  inst-MSS-ORNL,
  address =      inst-MSS-ORNL:adr,
  month =        "??",
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  keywords =     "nla, prll, lud, mimd, blas, distributed memory,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and R. {van de Geijn} and D. Walker",
  title =        "A look at scalable dense linear algebra libraries",
  crossref =     "IEEE:1992:SHP",
  pages =        "372--379",
  year =         "1992",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  note =         "IEEE catalog number 92TH0432-5.",
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C7310 (Mathematics); C6110P
                 (Parallel programming)",
  conflocation = "Williamsburg, VA, USA; 26-29 April 1992",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., TN, USA",
  keywords =     "14 GFLOPS; applications; concurrent computers; Delta
                 system; dense matrix problems; distributed memory;
                 double precision; Intel Touchstone; linear algebra; LU
                 factorization; mathematics computing; object-oriented;
                 object-oriented interface; parallel implementation;
                 parallel programming; portable; programming; scalable
                 dense linear algebra libraries; software portability;
                 square block scattered decomposition; subroutines; user
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE",
  treatment =    "P Practical",

  author =       "Jack Dongarra",
  title =        "{LAPACK} is Now Available",
  journal =      j-SIGNUM,
  volume =       "27",
  number =       "1",
  pages =        "3--4",
  month =        jan,
  year =         "1992",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Sat Jan 13 20:13:27 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Robert van de Geijn and David
  title =        "A Look at Scalable Dense Linear Algebra Libraries",
  type =         "LAPACK Working Note",
  number =       "43",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1992",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-92-155, April, 1992.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "{LAPACK} Working Note 34: Workshop on the {BLACS}",
  day =          "6",
  month =        feb,
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  note =         "Oak Ridge National Laboratory",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Sven Hammarling and James H.
  title =        "Numerical Considerations in Computing Invariant
  journal =      j-SIAM-J-MAT-ANA-APPL,
  volume =       "13",
  number =       "1",
  pages =        "145--161",
  month =        jan,
  year =         "1992",
  CODEN =        "SJMAEL",
  DOI =          "",
  ISSN =         "0895-4798 (print), 1095-7162 (electronic)",
  ISSN-L =       "0895-4798",
  MRclass =      "65F15",
  MRnumber =     "93a:65049",
  bibdate =      "Mon Jan 15 10:23:32 1996",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Matrix Analysis and Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "Colette Lebaud",

  author =       "J. J. Dongarra and M. Sidani",
  title =        "A parallel algorithm for the nonsymmetric eigenvalue
  crossref =     "Griffiths:1992:NAP",
  pages =        "85--102",
  year =         "1992",
  MRclass =      "65F15 (65Y05)",
  MRnumber =     "177 229",
  bibdate =      "Mon Jan 15 10:37:55 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Rolf Hempel and Anthony J. G. Hey
                 and David W. Walker",
  title =        "A Proposal for a User-Level Message-Passing Interface
                 in a Distributed Memory Environment",
  type =         type-TR,
  number =       "TM-12231",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  month =        oct,
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Henk A. van der Vorst",
  title =        "Performance of Various Computers Using Standard
                 Techniques for Solving Sparse Linear Equations",
  type =         "Technical Report",
  number =       "CS-92-168",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  pages =        "????",
  year =         "1992",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Henk A. van der Vorst",
  title =        "Performance of Various Computers Using Standard Sparse
                 Linear Equations Solving Techniques",
  journal =      j-SUPERCOMPUTER,
  volume =       "9",
  number =       "5",
  pages =        "17--29",
  month =        sep,
  year =         "1992",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5470 (Performance evaluation and testing); C4130
                 (Interpolation and function approximation); C4140
                 (Linear algebra)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Supercomputer",
  keywords =     "architecture; benchmark program; computer performance;
                 conjugate gradient iterative solver; conjugate gradient
                 methods; definite linear systems; evaluation; linear
                 equations; LINPACK; matrices; matrix algebra;
                 performance; positive; sparse; symmetric linear
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",
  xxtitle =      "Performance of various computers using standard
                 techniques for solving sparse linear equations",
  xxtitle =      "Performance of Various Computers Using Standard Linear
                 Equations Software in a {Fortran} Environment",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software",
  journal =      j-COMP-ARCH-NEWS,
  volume =       "20",
  number =       "3",
  pages =        "22--44",
  month =        jun,
  year =         "1992",
  CODEN =        "CANED2",
  ISSN =         "0163-5964 (ACM), 0884-7495 (IEEE)",
  ISSN-L =       "0163-5964",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  abstract =     "The article compares the performance of different
                 computer systems in solving dense systems of linear
                 equations. The comparison involves approximately a
                 hundred computers, ranging from a CRAY Y-MP to
                 scientific workstations such as the Apollo and Sun to
                 IBM PCs.",
  acknowledgement = ack-nhfb,
  affiliation =  "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  classcodes =   "C5470 (Performance evaluation and testing); C7310
                 (Mathematics); C4140 (Linear algebra)",
  classification = "C4140 (Linear algebra); C5470 (Performance
                 evaluation and testing); C7310 (Mathematics)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "ACM SIGARCH Computer Architecture News",
  journal-URL =  "",
  keywords =     "Apollo; computer; Computer systems; CRAY Y-MP; Dense
                 systems; dense systems; evaluation; IBM PCs; linear
                 algebra; Linear equations software; linear equations
                 software; mathematics computing; performance;
                 Performance comparison; performance comparison;
                 Scientific workstations; scientific workstations; Sun;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  thesaurus =    "Linear algebra; Mathematics computing; Performance
  treatment =    "P Practical",

  author =       "J. J. Dongarra and M. Sidani",
  title =        "Reduction to Condensed Form for the Eigenvalue Problem
                 on Distributed Memory Architectures",
  type =         "Report",
  number =       "ORNL/TM-12006",
  institution =  inst-MSS-ORNL,
  address =      inst-MSS-ORNL:adr,
  month =        "??",
  year =         "1992",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  keywords =     "nla, prll, eig, nonsymmetric matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Robert A. {van de Geijn}",
  title =        "Reduction to condensed form for the eigenvalue problem
                 on distributed memory architectures",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "18",
  number =       "9",
  pages =        "973--982",
  month =        sep,
  year =         "1992",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65Y05 (65F15)",
  MRnumber =     "1 190 458",
  bibdate =      "Thu Sep 16 09:30:12 1999",
  bibsource =    "",
  URL =          "",
  abstract =     "The authors describe a parallel implementation for the
                 reduction of general and symmetric matrices to
                 Hessenberg and tridiagonal form, respectively. The
                 methods are based on LAPACK sequential codes and use a
                 panel-wrapped mapping of matrices to nodes. Results
                 from experiments on the Intel Touchstone Delta are
  acknowledgement = ack-nhfb,
  affiliation =  "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  classcodes =   "C7310 (Mathematics); C5220P (Parallel architecture);
                 C4140 (Linear algebra)",
  classification = "C4140 (Linear algebra); C5220P (Parallel
                 architecture); C7310 (Mathematics)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  keywords =     "architectures; distributed memory; Distributed memory
                 architectures; distributed memory systems; Eigenvalue
                 problem; eigenvalue problem; eigenvalues and
                 eigenfunctions; Hessenberg form; Intel Touchstone
                 Delta; LAPACK sequential codes; linear algebra;
                 mapping; mathematics computing; panel-wrapped;
                 Panel-wrapped mapping; parallel; Parallel
                 implementation; parallel implementation; Symmetric
                 matrices; symmetric matrices; Tridiagonal form;
                 tridiagonal form",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  thesaurus =    "Distributed memory systems; Eigenvalues and
                 eigenfunctions; Linear algebra; Mathematics computing;
                 Parallel architectures",
  treatment =    "P Practical",

  author =       "J. Dongarra and D. Sorensen and O. Brewer",
  title =        "Tools to aid in the design, implementation, and
                 understanding of algorithms for parallel processors",
  crossref =     "Perrott:1992:SPC",
  pages =        "195--219",
  year =         "1992",
  bibdate =      "Mon Sep 9 07:55:25 MDT 1996",
  bibsource =    "",
  abstract =     "Two tools have been implemented that aid in the
                 development of parallel algorithms that are portable
                 across a range of high-performance computers. The first
                 tool, Schedule, aids in implementing and analysing
                 programs within a large-grain control flow model of
                 computation. The underlying concept is based on a
                 natural graphical interpretation of parallel
                 computation that is useful in designing and
                 implementing parallel algorithms. This graphical
                 interpretation may be used to automate the generation
                 of a parallel program through a facility called Build.
                 Schedule also provides a means for postprocessing
                 performance analysis through an animated visualization
                 of the flow of a parallel program's execution. This
                 animation is accomplished through the Trace facility.
                 The second tool, MAP, provides a graphical display of
                 memory access patterns in algorithms. Such patterns can
                 be important in understanding memory bottlenecks in
                 compute-intensive algorithms.",
  acknowledgement = ack-nhfb,
  affiliation =  "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
  classcodes =   "C6115 (Programming support); C6110P (Parallel
                 programming); C6130B (Graphics techniques); C6120 (File
  classification = "C6110P (Parallel programming); C6115 (Programming
                 support); C6120 (File organisation); C6130B (Graphics
  corpsource =   "Div. of Math. and Comput. Sci., Argonne Nat. Lab., IL,
  keywords =     "access patterns; algorithms; animated; Animated
                 visualization; Build; compute-intensive;
                 Compute-intensive algorithms; computer graphics;
                 Graphical display; graphical display; high-performance
                 computers; High-performance computers; interpretation;
                 large-grain control flow model; Large-grain control
                 flow model; MAP; memory; Memory access patterns; Memory
                 bottlenecks; memory bottlenecks; natural graphical;
                 Natural graphical interpretation; parallel; Parallel
                 algorithms; parallel algorithms; parallel computation;
                 Parallel computation; parallel program; Parallel
                 program; Postprocessing performance analysis;
                 postprocessing performance analysis; programming;
                 Schedule; software tools; storage management; Trace
                 facility; visualization",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "UK",
  thesaurus =    "Computer graphics; Parallel algorithms; Parallel
                 programming; Software tools; Storage management",
  treatment =    "P Practical",

  author =       "C. M. Pancake and R. Bailey and D. Barkai and B. Smith
                 and J. Brandenburg and J. Dongarra and M. Kalos and M.
                 Snir and D. Gelernter",
  title =        "What Should We Expect from Parallel Language
  journal =      j-IJSAHPC,
  volume =       "6",
  number =       "1",
  pages =        "112--117",
  month =        "????",
  year =         "1992",
  CODEN =        "IJSCFG",
  ISSN =         "1078-3482",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Supercomputer Applications
                 and High Performance Computing",
  journal-URL =  "",
  onlinedate =   "SPR-1992",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. C. Anderson and J. Dongarra",
  title =        "Performance of {LAPACK}: a portable library of
                 numerical linear algebra routines",
  journal =      j-PROC-IEEE,
  volume =       "81",
  number =       "8",
  pages =        "1094--1102",
  month =        aug,
  year =         "1993",
  CODEN =        "IEEPAD",
  DOI =          "",
  ISSN =         "0018-9219 (print), 1558-2256 (electronic)",
  ISSN-L =       "0018-9219",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra); C5440
                 (Multiprocessor systems and techniques); C6150G
                 (Diagnostic, testing, debugging and evaluating
  corpsource =   "Cray Res. Center, Eagan, MN, USA",
  fjournal =     "Proceedings of the IEEE",
  journal-URL =  "",
  keywords =     "algebra routines; computers; evaluation; LAPACK
                 project; library; linear algebra; mathematics
                 computing; numerical linear; numerical linear algebra;
                 parallel; parallel processors; performance; performance
                 tuning; portability; portable library; program testing;
                 shared memory systems; shared-memory vector; software",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "R. Barrett and T. Chan and J. Demmel and J. Donato and
                 J. Dongarra and V. Eijkhout and R. Pozo and C. Romine
                 and H. van der Vorst",
  title =        "Building Blocks for Iterative Solution of Linear
  howpublished = "in preparation",
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and S. Otto and J. Walpole",
  title =        "{PVM}: Experiences, current status and future
  crossref =     "IEEE:1993:PSP",
  pages =        "765--766",
  year =         "1993",
  bibdate =      "Wed Apr 15 12:04:03 MDT 1998",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classification = "C6110P (Parallel programming); C6150N (Distributed
                 systems software); C7320 (Physics and chemistry
                 computing); C7410D (Electronic engineering computing)",
  corpsource =   "Sch. of Comput. Sci., Carnegie Mellon Univ.,
                 Pittsburgh, PA, USA",
  keywords =     "circuit analysis; computational requirements;
                 computing requirements; concurrent computing;
                 concurrent processing; electronic engineering
                 computing; engineering design; hardware
                 multiprocessors; high-performance applications;
                 integration aspects; material sciences; multiprocessing
                 programs; parallel processors; parallel programming;
                 parallel virtual machine; physical sciences; physics
                 computing; PVM; scientific computational problems;
                 simulation; software package; software packages",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; ACM SIGARCH",
  treatment =    "P Practical",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
                 Manchek and K. Moore and V. Sunderam",
  title =        "{PVM} and {HeNCE}: Tools for Heterogeneous Network
  crossref =     "Kowalik:1993:SPC",
  pages =        "??--??",
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. Dongarra and A. Geist and R.
  title =        "Tools for Heterogeneous Network Computing",
  crossref =     "Sincovec:1993:SCP",
  pages =        "854--861",
  year =         "1993",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Adam Beguelin and Jack Dongarra and Al Geist and Vaidy
  title =        "Visualization and Debugging in a Heterogeneous
  journal =      j-COMPUTER,
  volume =       "26",
  number =       "6",
  pages =        "88--95",
  month =        jun,
  year =         "1993",
  CODEN =        "CPTRB4",
  DOI =          "",
  ISSN =         "0018-9162 (print), 1558-0814 (electronic)",
  ISSN-L =       "0018-9162",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          "",
  abstract =     "A monitoring tool and a graphical interface working on
                 top of the PVM software can help programmers make
                 better use of heterogeneous networks of computers.",
  acknowledgement = ack-nhfb,
  classcodes =   "C6150G (Diagnostic, testing, debugging and evaluating
                 systems); C6150N (Distributed systems); C6115
                 (Programming support)",
  corpsource =   "Sch. of Comput. Sci., Carnegie Mellon Univ.,
                 Pittsburgh, PA, USA",
  fjournal =     "Computer",
  journal-URL =  "",
  keywords =     "debugging; distributed programs; graphical monitoring
                 package; graphical programming environment; Hence;
                 heterogeneous; heterogeneous environment; monitoring;
                 multiprocessing programs; open systems; parallel;
                 parallel virtual machine; program debugging; program
                 visualisation; programming; software tools; system;
                 virtual machines; visual programming; Xab",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Michael W. Berry and Jack J. Dongarra and Brian H.
  title =        "{PDS}: {A Performance Database Server}",
  journal =      j-SCI-COMPUT,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  month =        "??",
  year =         "1993",
  CODEN =        "SCHRCU",
  ISSN =         "1930-5753 (print), 1930-6156 (electronic)",
  ISSN-L =       "1930-5753",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "(to appear)",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and Jack J. Dongarra and David W.
  title =        "Parallel Matrix Transpose Algorithms on Distributed
                 Memory Concurrent Computers",
  type =         "LAPACK Working Note",
  number =       "65",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1993",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-93-215, November, 1993.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and Jack J. Dongarra and David W.
  title =        "{PUMMA}: {Parallel Universal Matrix Multiplication
                 Algorithms} on Distributed Memory Concurrent
  type =         "LAPACK Working Note",
  number =       "57",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1993",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-93-187, May 1993.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Demmel and J. Dongarra and R. {Van de Geijn} and D.
  title =        "{LAPACK} for Distributed Memory Architectures: The
                 Next Generation",
  crossref =     "Sincovec:1993:SCP",
  pages =        "323--329",
  year =         "1993",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. Dongarra and B. Tourancheau",
  title =        "Performance Complexity of {$ L U $} Factorization with
                 Efficient Pipelining and Overlap on a Multiprocessor",
  type =         "LAPACK Working Note",
  number =       "67",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        dec,
  year =         "1993",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-93-218, December, 1993.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and David W. Walker",
  title =        "The Design of Linear Algebra Libraries for High
                 Performance Computers",
  type =         "LAPACK Working Note" # " and " # type-CSDTR,
  number =       "58 and ORNL/TM-12404",
  institution =  inst-UTK-CS # " and " # inst-MSS-ORNL,
  address =      inst-UTK-CS:adr # " and " # inst-MSS-ORNL:adr,
  month =        jun,
  year =         "1993",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "UT-CS-93-188, June 1993.",
  URL =          ";
  acknowledgement = ack-nhfb,
  keywords =     "nla, prll, distributed memory, assignment",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra",
  title =        "From Dinos to Rhinos",
  crossref =     "Fincham:1993:CSO",
  pages =        "1--10",
  year =         "1993",
  MRclass =      "65Y05",
  MRnumber =     "1 370 932",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. Hempel and A. J. G. Hey and D.
                 W. Walker",
  title =        "A Draft Standard for Message Passing in a Distributed
                 Memory Environment",
  crossref =     "Hoffmann:1993:PSA",
  pages =        "465--481",
  year =         "1993",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6150N (Distributed systems); C5220P (Parallel
                 architecture); C5440 (Multiprocessor systems and
  conflocation = "Reading, UK; 23-27 Nov. 1992",
  conftitle =    "Proceedings of the Fifth ECMWF Workshop on the Use of
                 Parallel Processors in Meteorology. Parallel
                 Supercomputing in Atmospheric Science",
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  keywords =     "C language; data; distributed memory; distributed
                 memory systems; distribution transformations; draft
                 standard; environment; Fortran 77; interface standard;
                 library; message passing; Message Passing Interface 1;
                 message selectivity; message type; MPI1; process;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack Dongarra and G. A. Geist and Robert Manchek and
                 V. S. Sunderam",
  title =        "Integrated {PVM} Framework Supports Heterogeneous
                 Network Computing",
  journal =      j-COMPUT-PHYS,
  volume =       "7",
  number =       "2",
  pages =        "166--174",
  month =        mar # "--" # apr,
  year =         "1993",
  CODEN =        "CPHYE2",
  DOI =          "",
  ISSN =         "0894-1866 (print), 1558-4208 (electronic)",
  ISSN-L =       "0894-1866",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C6150N (Distributed systems); C7430 (Computer
                 engineering); C6110P (Parallel programming); C7300
                 (Natural sciences)",
  corpsource =   "Tennessee Univ., Knoxville, TN, USA",
  fjournal =     "Computers in Physics",
  journal-URL =  "",
  keywords =     "computer networks; computing; concurrent applications;
                 distributed processing; heterogeneous network
                 computing; integrated framework; natural sciences;
                 parallel programming; parallel virtual machine
                 software; scientific computations; virtual machines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "G General Review; P Practical",

  author =       "J. Dongarra",
  title =        "Linear algebra libraries for high-performance
                 computers: a personal perspective",
  journal =      j-IEEE-PAR-DIST-TECH,
  volume =       "1",
  number =       "1",
  pages =        "17--24",
  month =        feb,
  year =         "1993",
  CODEN =        "IPDTEX",
  DOI =          "",
  ISSN =         "1063-6552 (print), 1558-1861 (electronic)",
  ISSN-L =       "1063-6552",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "IEEE Parallel and Distributed Technology: Systems and
  keywords =     "benchmark; data reuse; high-performance computers;
                 linear algebra; linear algebra libraries; Linpack
                 software; locality; mathematics computing; of
                 reference; standards development",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack J. Dongarra and Roldan Pozo and David W. Walker",
  title =        "{LAPACK++}: a design overview of object-oriented
                 extensions for high performance linear algebra",
  crossref =     "IEEE:1993:PSP",
  pages =        "162--171",
  year =         "1993",
  bibdate =      "Wed Apr 15 12:04:03 MDT 1998",
  bibsource =    "Compendex database;
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  classcodes =   "C4140 (Linear algebra); C6110J (Object-oriented
                 programming); C4130 (Interpolation and function
                 approximation); C6110P (Parallel programming); C7310
                 (Mathematics computing)",
  classification = "723; 723.1; 921.1; C4130 (Interpolation and function
                 approximation); C4140 (Linear algebra); C6110J
                 (Object-oriented programming); C6110P (Parallel
                 programming); C7310 (Mathematics computing)",
  conflocation = "Portland, OR, USA; 15-19 Nov. 1993",
  conftitle =    "SUPERCOMPUTING '93",
  corpsource =   "Oak Ridge Nat. Lab., TN, USA",
  keywords =     "Algebra; approximations; architectures; calling
                 sequences; Computer software; Computers; decomposition
                 classes; design overview; distributed memory;
                 distributed memory architectures; Distributed memory
                 architectures; eigenvalue problems; eigenvalues and
                 eigenfunctions; Eigenvalues and eigenfunctions;
                 extendible; extendible software framework; generality;
                 high; high performance linear algebra; High performance
                 linear Algebra; high-performance computer;
                 high-performance computer architectures; LAPACK++;
                 least squares; least squares approximations; Least
                 squares approximations; linear algebra; linear least;
                 linear least squares; linear systems; mathematics
                 computing; matrix; matrix algebra; matrix
                 representations; numerical linear algebra; Object
                 oriented approach; object-oriented approach;
                 object-oriented C++ extension; object-oriented
                 extensions; object-oriented programming; parallel;
                 parallel programming; performance linear algebra;
                 programming; representations; ScaLAPACK++; software
                 framework; software libraries; squares; subroutines;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; ACM SIGARCH",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. Dongarra and R. Pozo and D. Walker",
  title =        "An Object Oriented Design for High Performance Linear
                 Algebra on Distributed Memory Architectures",
  type =         "LAPACK Working Note",
  number =       "61",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "1993",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-93-200, August 1993.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Majed Sidani",
  title =        "A Parallel Algorithm for the Non-Symmetric Eigenvalue
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "14",
  number =       "3",
  pages =        "542--569",
  month =        may,
  year =         "1993",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F15 (65Y05)",
  MRnumber =     "94e:65045",
  MRreviewer =   "Bruno Codenotti",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C4240P (Parallel programming and algorithm theory);
                 C4140 (Linear algebra); C4130 (Interpolation and
                 function approximation)",
  corpsource =   "Comput. Sci., Tennessee Univ., Knoxville, TN, USA",
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  keywords =     "algebra; divide-and-conquer procedure; eigenvalues and
                 eigenfunctions; eigenvectors; iterative; iterative
                 methods; matrix; nonsymmetric eigenvalue; nonsymmetric
                 matrix; parallel algorithm; parallel algorithms;
                 refinement technique",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "Bruno Codenotti",
  treatment =    "P Practical",

  author =       "J. Dongarra and R. Hempel and A. Hey and D. Walker",
  title =        "A Proposal for a User-Level Message Passing Interface
                 in a Distributed Memory Environment",
  type =         type-TR,
  number =       "ORNL/TM-12231",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  month =        feb,
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "Performance of various computers using standard linear
                 equations software",
  type =         type-CSDTR,
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        jan,
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Henk A. van der Vorst",
  title =        "Performance of Various Computers Using Standard Sparse
                 Linear Equations Solving Techniques",
  crossref =     "Dongarra:1993:CB",
  pages =        "177--188",
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and T. Rowan and R. Wade",
  title =        "Software Distribution Using {XNETLIB}",
  type =         type-CSDTR,
  number =       "CS-93-214",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        "??",
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. A. {Van de Geijn} and R. {Clint
  title =        "Two Dimensional Basic Linear Algebra Communication
  crossref =     "Sincovec:1993:SCP",
  pages =        "347--352",
  year =         "1993",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. A. {van de Geijn} and R. C.
  title =        "A Users' Guide to the {BLACS}",
  year =         "1993",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  note =         "Manuscript. Department of Computer Science, University
                 of Tennessee, Knoxville, TN 37996.",
  acknowledgement = ack-nhfb,
  keywords =     "nla, prll, communication, distributed memory, message
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and A. Geist and R. Manchek and W.
  title =        "Using {PVM} 3.0 to Run Grand Challenge Applications on
                 a Heterogeneous Network of Parallel Computers",
  crossref =     "Sincovec:1993:SCP",
  pages =        "873--877",
  year =         "1993",
  bibdate =      "Thu Feb 29 17:59:11 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Geist and J. Dongarra and A. Beguelin and B.
                 Manchek and Weicheng Jiang",
  title =        "{PVM} takes over the world",
  crossref =     "IEEE:1993:PSP",
  pages =        "618--618",
  year =         "1993",
  DOI =          "",
  bibdate =      "Fri May 27 10:20:49 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. Pozo and J. J. Dongarra and D. W. Walker",
  title =        "{LAPACK++}: a Design Overview of Object-Oriented
                 Extensions for High Performance Linear Algebra",
  crossref =     "IEEE:1993:PSP",
  pages =        "162--171",
  year =         "1993",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Anonymous",
  title =        "{MPI}: a Message-Passing Interface Standard",
  journal =      j-IJSAHPC,
  volume =       "8",
  number =       "3/4",
  pages =        "159--416",
  month =        "Fall\slash Winter",
  year =         "1994",
  CODEN =        "IJSAE9",
  ISSN =         "0890-2720",
  bibdate =      "Tue Feb 18 09:18:46 MST 1997",
  bibsource =    "Compendex database;
  note =         "Edited by J. Dongarra.",
  URL =          "",
  abstract =     "Message passing is a paradigm used widely on certain
                 classes of parallel machines, especially those with
                 distributed memory. Although there are many variations,
                 the basic concept of processes communicating through
                 messages is well understood. Over the last ten years,
                 substantial progress has been made in casting
                 significant applications in this paradigm. Each vendor
                 has implemented its own variant. More recently, several
                 systems have demonstrated that a message-passing system
                 can be efficiently and portably implemented. A
                 definition of both the syntax and semantics of a core
                 of library routines is thus presented. It will be
                 useful to a wide range of users and efficiently
                 implementable on a wide range of computers.",
  acknowledgement = ack-nhfb,
  classification = "722.2; 722.3; 722.4; 723.1; 723.1.1",
  fjournal =     "International Journal of Supercomputer Applications
                 and High Performance Computing",
  journal-URL =  "",
  journalabr =   "Int J Supercomput Appl High Perform Comput",
  keywords =     "C (programming language); Codes (standards);
                 Computational linguistics; Computer software; Data
                 communication systems; FORTRAN (programming language);
                 Interfaces (computer); Message passing interface;
                 Parallel machines; Parallel processing systems; Point
                 to point communication; Standardization",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Richard Barrett and Michael Berry and Jack Dongarra
                 and Victor Eijkhout and Charles Romine",
  title =        "Algorithmic Bombardment for the Iterative Solution of
                 Linear Systems: a Poly-Iterative Approach",
  type =         "LAPACK Working Note",
  number =       "76",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-239, August, 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Richard Barrett and Michael Berry and Tony F. Chan and
                 James Demmel and June Donato and Jack Dongarra and
                 Victor Eijkhout and Roldan Pozo and Charles Romine and
                 Henk van der Vorst",
  title =        "Templates for the Solution of Linear Systems:
                 {Building} Blocks for Iterative Methods",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xiii + 112",
  year =         "1994",
  ISBN =         "0-89871-328-5",
  ISBN-13 =      "978-0-89871-328-2",
  LCCN =         "QA297.8 .T45 1994",
  bibdate =      "Tue Mar 05 17:39:36 2002",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Richard Barrett and Michael Berry and Tony F. Chan and
                 James W. Demmel and June Donato and Jack Dongarra and
                 Victor Eijkhout and Roldan Pozo and Charles Romine and
                 Henk van der Vorst",
  title =        "Templates for the Solution of Linear Systems: Building
                 Blocks for Iterative Methods ({Japanese})",
  publisher =    "Asakura Shoten",
  address =      "Tokyo, Japan",
  pages =        "????",
  year =         "1994",
  ISBN =         "4-254-11401-X",
  ISBN-13 =      "978-4-254-11401-0",
  LCCN =         "????",
  bibdate =      "Mon Jun 07 19:34:29 1999",
  bibsource =    ";
  note =         "See book review \cite{Anonymous:1995:BRB}.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Adam Beguelin and Jack J. Dongarra and George Al Geist
                 and Robert Manchek and Keith Moore",
  title =        "{HeNCE}: a heterogeneous network computing
  journal =      j-SCI-PROG,
  volume =       "3",
  number =       "1",
  pages =        "49--60",
  month =        "Spring",
  year =         "1994",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "Network computing seeks to utilize the aggregate
                 resources of many networked computers to solve a single
                 problem. In so doing it is often possible to obtain
                 supercomputer performance from an inexpensive local
                 area network. The drawback is that network computing is
                 complicated and error prone when done by hand,
                 especially if the computers have different operating
                 systems and data formats and are thus heterogeneous.
                 The heterogeneous network computing environment (HeNCE)
                 is an integrated graphical environment for creating and
                 running parallel programs over a heterogeneous
                 collection of computers. It is built on a lower level
                 package called parallel virtual machine (PVM). The
                 HeNCE philosophy of parallel programming is to have the
                 programmer graphically specify the parallelism of a
                 computation and to automate, as much as possible, the
                 tasks of writing, compiling, executing, debugging, and
                 tracing the network computation. Key to HeNCE is a
                 graphical language based on directed graphs that
                 describe the parallelism and data dependencies of an
                 application. Nodes in the graphs represent conventional
                 Fortran or C subroutines and the arcs represent data
                 and control flow. This article describes the present
                 state of HeNCE, its capabilities, limitations, and
                 areas of future research.",
  acknowledgement = ack-nhfb,
  affiliation =  "Carnegie Mellon Univ",
  affiliationaddress = "Pittsburgh, PA, USA",
  classcodes =   "C6150N (Distributed systems software); C1160
                 (Combinatorial mathematics); C6110P (Parallel
                 programming); C6115 (Programming support); C6150G
                 (Diagnostic, testing, debugging and evaluating
                 systems); C6150C (Compilers, interpreters and other
                 processors); C5620L (Local area networks)",
  classification = "722.4; 723.1; 723.1.1; 723.5",
  corpsource =   "Sch. of Comput. Sci., Carnegie Mellon Univ.,
                 Pittsburgh, PA, USA",
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  journalabr =   "Sci Program",
  keywords =     "aggregate resources; C (programming language);
                 compilation; Computer aided software engineering;
                 Computer networks; Computer operating systems; data;
                 data dependencies; Data format; Data transfer;
                 debugging; directed graphs; execution; formats; FORTRAN
                 (programming language); graph nodes; Graphical
                 language; graphical language; HeNCE; Heterogeneous
                 network computing environment; heterogeneous network
                 computing environment; integrated graphical
                 environment; Interactive computer graphics; local area
                 network; Local area networks; local area networks;
                 network computation; networked computers; operating
                 systems; parallel; Parallel processing systems;
                 parallel programming; Parallel programs; Parallel
                 virtual machine; parallel virtual machine;
                 parallelising compilers; parallelism; performance;
                 Program compilers; Program debugging; program
                 debugging; programs; Subroutines; supercomputer;
                 tracing; virtual machines; writing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Michael W. Berry and Jack J. Dongarra and Youngbae
  title =        "A Highly Parallel Algorithm for the Reduction of a
                 Nonsymmetric Matrix to Block Upper-{Hessenberg} Form",
  type =         "LAPACK Working Note",
  number =       "68",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        feb,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-221, February 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "M. W. Berry and J. J. Dongarra and B. H. LaRose and
                 T. A. Letsche",
  title =        "{PDS}: a performance database server",
  journal =      j-SCI-PROG,
  volume =       "3",
  number =       "2",
  pages =        "147--156",
  month =        "Summer",
  year =         "1994",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5470 (Performance evaluation and testing); C7430
                 (Computer engineering); C5630 (Networking equipment);
                 C7250L (Non-bibliographic retrieval systems); C7220
                 (Generation, dissemination, and use of information);
                 C7210 (Information services and centres); C6160Z (Other
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  keywords =     "archival system; benchmark data; benchmarks;
                 cataloguing; central depository; data; data archiving;
                 data gathering; database management systems;
                 distribution; dynamic database; file servers;
                 information dissemination; Internet;
                 Internet-accessible; LINPACK benchmark; NAS parallel
                 benchmarks; Netlib; online catalog; PDS; Perfect;
                 performance database server; performance evaluation;
                 performance metrics; public-domain computer; server;
                 user interfaces; X-Windows-based user interface;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "S. Blackford and J. Dongarra",
  title =        "Quick Installation Guide for {LAPACK} on {Unix}
  type =         "LAPACK Working Note",
  number =       "81",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        sep,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-249, September, 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley V. Browne and Jack J. Dongarra and Stan C.
                 Green and Keith Moore and Thomas H. Rowan and Reed C.
  title =        "{Netlib} Services and Resources",
  type =         "Report",
  number =       "ORNL/TM-12680",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  pages =        "42",
  month =        apr,
  year =         "1994",
  bibdate =      "Wed Sep 28 14:04:23 2011",
  bibsource =    ";
  acknowledgement = ack-njh # " and " # ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Choi and J. J. Dongarra and R. Pozo and D. W.
  title =        "Constructing Numerical Software Libraries for
                 High-Performance Computing Environments",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "879",
  pages =        "147--168",
  year =         "1994",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Wed Sep 15 10:01:31 MDT 1999",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  keywords =     "computing; heterogeneous network; PARA; parallel
                 scientific computing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and Jack J. Dongarra and Roldan Pozo and
                 Danny C. Sorensen and David W. Walker",
  title =        "{CRPC} research into linear algebra software for high
                 performance computers",
  journal =      j-IJSAHPC,
  volume =       "8",
  number =       "2",
  pages =        "99--118",
  month =        "Summer",
  year =         "1994",
  CODEN =        "IJSAE9",
  DOI =          "",
  ISSN =         "0890-2720",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "In this paper we look at a number of approaches being
                 investigated in the Center for Research on Parallel
                 Computation (CRPC) to develop linear algebra software
                 for high-performance computers. These approaches are
                 exemplified by the LAPACK, templates, and ARPACK
                 projects. LAPACK is a software library for performing
                 dense and banded linear algebra computations, and was
                 designed to run efficiently on high-performance
                 computers. We focus on the design of the
                 distributed-memory version of LAPACK, and on an
                 object-oriented interface to LAPACK.",
  acknowledgement = ack-nhfb,
  affiliation =  "Oak Ridge Natl Lab",
  affiliationaddress = "Oak Ridge, TN, USA",
  classcodes =   "C7310 (Mathematics); C0310B (Computer facilities);
                 C5440 (Multiprocessor systems and techniques)",
  classification = "722.2; 722.4; 723.1; 901.1.1; 921.1",
  corpsource =   "Math. Sci. Sec., Oak Ridge Nat. Lab., Oak Ridge, TN,
  fjournal =     "International Journal of Supercomputer Applications
                 and High Performance Computing",
  journal-URL =  "",
  journalabr =   "Int J Supercomput Appl High Perform Comput",
  keywords =     "Algorithms; ARPACK; Center for Research on Parallel
                 Computation; Center for Research on Parallel
                 Computation (CRPC); computer centres; Computer
                 software; Distributed computer systems;
                 distributed-memory; High performance computers;
                 high-performance computers; Interfaces (computer);
                 LAPACK; Linear algebra; linear algebra; linear algebra
                 computations; mathematics computing; Object oriented
                 programming; object-oriented interface; object-oriented
                 programming; parallel processing; projects; Societies
                 and institutions; software; software library; Software
                 package ARPACK; Software package LAPACK",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "J. Choi and J. J. Dongarra and S. Ostrouchov and A. P.
                 Petitet and D. W. Walker and R. C. Whaley",
  title =        "The Design and Implementation of the {ScaLAPACK} {$ L
                 U $}, {$ Q R $}, and {Cholesky} Factorization
  type =         "LAPACK Working Note",
  number =       "80",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        sep,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-246, September, 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Choi and J. J. Dongarra and D. W. Walker",
  title =        "The design of a parallel, dense linear algebra
                 software library: reduction to {Hessenberg},
                 tridiagonal, and bidiagonal form",
  crossref =     "Dongarra:1994:PSW",
  pages =        "98--111",
  year =         "1994",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C6110B (Software
                 engineering techniques); C5440 (Multiprocessing
                 systems); C4140 (Linear algebra); C6110P (Parallel
  conflocation = "Townsend, TN, USA; 25-27 May 1994",
  conftitle =    "Proceedings of the Second Workshop on Environments and
                 Tools for Parallel Scientific Computing",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  keywords =     "algebra; Basic Linear Algebra Communication
                 Subprograms; bidiagonal form; distributed Level 3 BLAS
                 routines; distributed memory concurrent computers;
                 distributed memory systems; Hessenberg; higher level;
                 library routines; mathematics computing; matrix; panel
                 reduction phase; Parallel Block BLAS; parallel dense
                 linear algebra software library; parallel programming;
                 PB-BLAS; reduction algorithms; ScaLAPACK; sequential
                 BLAS; software engineering considerations; software
                 libraries; tridiagonal",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jaeyoung Choi and J. J. Dongarra and D. W. Walker",
  title =        "The Design of Scalable Software Libraries for
                 Distributed Memory Concurrent Computers",
  crossref =     "Siegel:1994:PEI",
  pages =        "792--799",
  year =         "1994",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  note =         "IEEE catalog number 94TH0652-8.",
  acknowledgement = ack-nhfb,
  classcodes =   "C6110P (Parallel programming); C4140 (Linear algebra);
                 C7310 (Mathematics)",
  conflocation = "Cancun, Mexico; 26-29 April 1994",
  conftitle =    "Proceedings of 8th International Parallel Processing
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  keywords =     "algebra subroutines; allocation; banded linear algebra
                 computations; basic linear; block cyclic data
                 distribution; block-; computers; computing; data
                 distribution; dense linear algebra computations;
                 distributed memory concurrent; distributed memory
                 systems; interprocessor communication; Level 3 BLAS;
                 linear algebra; load balance; mathematics; matrix
                 algebra; parallel programming; partitioned matrix
                 decomposition; performance; resource; scalable software
                 libraries; ScaLAPACK; specification; subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE; ACM",
  treatment =    "P Practical",
  xxnote =       "Check author order??",

  author =       "Jaeyoung Choi and J. J. Dongarra and D. W. Walker",
  title =        "Parallel matrix transpose algorithms on distributed
                 memory concurrent computers",
  crossref =     "IEEE:1994:PSP",
  pages =        "245--252",
  year =         "1994",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics); C4240P (Parallel programming and
                 algorithm theory); C4140 (Linear algebra); C5440
                 (Multiprocessor systems and techniques)",
  conflocation = "Mississippi State, MS, USA; 6-8 Oct. 1993",
  conftitle =    "Proceedings of Scalable Parallel Libraries
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  keywords =     "algebra; block scattered data distribution; computer;
                 concurrent computers; distributed memory; distributed
                 memory systems; Intel Touchstone Delta; mathematics
                 computing; matrix; matrix multiplication routine;
                 parallel algorithms; parallel matrix transpose
                 algorithms; point-to-point communication; PUMMA
                 package; synchronisation; transposed matrices",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Mississippi State Univ.; Nat. Sci. Found",
  treatment =    "A Application; P Practical",

  author =       "Jaeyoung Choi and Jack J. Dongarra and David W.
  title =        "{PUMMA}: {Parallel Universal Matrix Multiplication
                 Algorithms} on distributed memory concurrent
  journal =      j-CPE,
  volume =       "6",
  number =       "7",
  pages =        "543--570",
  month =        oct,
  year =         "1994",
  CODEN =        "CPEXEI",
  DOI =          "",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Tue Feb 26 09:30:21 2002",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "The paper describes Parallel Universal Matrix
                 Multiplication Algorithms (PUMMA) on distributed memory
                 concurrent computers. The PUMMA package includes not
                 only the non-transposed matrix multiplication routine
                 {$ C = A \cdot B $}, but also transposed multiplication
                 routines {$ C = A^T \cdot B $}, {$ C = A \cdot B^T $},
                 and {$ C = A^T \cdot B^T $}, for a block cyclic data
                 distribution. The routines perform efficiently for a
                 wide range of processor configurations and block sizes.
                 The PUMMA together provide the same functionality as
                 the Level 3 BLAS routine xGEMM. Details of the parallel
                 implementation of the routines are given, and results
                 are presented for runs on the Intel Touchstone Delta
  acknowledgement = ack-nhfb,
  affiliation =  "Oak Ridge Natl Lab",
  affiliationaddress = "Oak Ridge, TN, USA",
  classcodes =   "C7310 (Mathematics); C5440 (Multiprocessor systems and
                 techniques); C4240P (Parallel programming and algorithm
                 theory); C4140 (Linear algebra)",
  classification = "722.4; 723.1; 921.1",
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  journalabr =   "Concurrency Pract Exper",
  keywords =     "algebra; Algorithms; block cyclic data distribution;
                 block sizes; Computer architecture; configurations;
                 Distributed memory concurrent computers; distributed
                 memory concurrent computers; distributed memory
                 systems; Intel Touchstone Delta Computer; level 3 BLAS
                 routine xGEMM; Mathematical operators; mathematics
                 computing; matrix; Matrix algebra; matrix
                 multiplication routine; Multiprogramming;
                 nontransposed; parallel algorithms; Parallel processing
                 systems; Parallel Universal Matrix Multiplication
                 Algorithm (PUMMA); parallel universal matrix
                 multiplication algorithms; processor; PUMMA; routines;
                 transposed multiplication",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "Jaeyoung Choi and J. J. Dongarra and D. W. Walker",
  title =        "{PB-BLAS}: a Set of Parallel Block {Basic Linear
                 Algebra Subprograms}",
  crossref =     "IEEE:1994:PSH",
  pages =        "534--541",
  year =         "1994",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  note =         "IEEE catalog number 94TH0637-9.",
  acknowledgement = ack-nhfb,
  classcodes =   "C4240P (Parallel programming and algorithm theory);
                 C4140 (Linear algebra); C6110P (Parallel programming);
                 C5440 (Multiprocessor systems and techniques); C7310
  conflocation = "Knoxville, TN, USA; 23-25 May 1994",
  conftitle =    "Proceedings of IEEE Scalable High Performance
                 Computing Conference",
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  keywords =     "BLAS routines; block-; computing; distributed memory
                 systems; distributed-memory version; LAPACK; linear
                 algebra; linear algebra computations; mathematics;
                 matrix algebra; parallel; parallel algorithms; Parallel
                 Block Basic Linear Algebra Subprograms; partitioned
                 matrices; PB-BLAS; portability; programming; ScaLAPACK;
                 subroutine library; subroutines; unrestricted
                 two-dimensional array",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE Comput. Soc. Tech. Committee on Supercomput.
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "Michael J. Dayd{\'e} and Iain S. Duff and Antoine
  title =        "A Parallel Block Implementation of Level-3 {BLAS} for
                 {MIMD} Vector Processors",
  journal =      j-TOMS,
  volume =       "20",
  number =       "2",
  pages =        "178--193",
  month =        jun,
  year =         "1994",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Fri Sep 09 13:52:29 1994",
  bibsource =    "",
  note =         "See
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "algorithms; Level-3 BLAS; matrix-matrix kernels;
                 measurement; parallelization; performance;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "F.2.1 [Analysis of Algorithms and Problem Complexity]:
                 Numerical Algorithms and Problems --- computations on
                 matrices; G.1.0 [Numerical Analysis]: General ---
                 numerical algorithms; G.1.3 [Numerical Analysis]:
                 Numerical Linear Algebra --- linear systems (direct and
                 iterative methods); G.4 [Mathematics of Computing]:
                 Mathematical Software --- certification and testing;
                 efficiency; portability; reliability and robustness;

  author =       "J. J. Dongarra and Iain S. Duff",
  title =        "Advanced architecture computers",
  number =       "CS-89-90",
  institution =  "University of Tennessee",
  address =      "Knoxville, TN, USA",
  year =         "1994",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  note =         "Revision of 1987 Report AERE R12415, HMSO, London. An
                 earlier version appeared in Federal Supercomputer
                 Programs and Policies, US Government Printing Office,
                 Washington DC, 710--799.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Andrew Lumsdaine and Xinhui Niu and
                 Roldan Pozo and Karin Remington",
  editor =       "????",
  booktitle =    "{OONSKI'94}: Proceedings of the second annual
                 object-oriented numerics conference, Sunriver, Oregon,
                 April 24--27, 1994",
  title =        "Accurate and efficient (parallel) algorithms have been
                 formulated and implemented on distributive platforms
                 for solving \ldots{}",
  publisher =    "Rogue Wave Software",
  address =      "Corvallis, OR, USA",
  pages =        "??--??",
  year =         "1994",
  bibdate =      "Wed Jan 14 05:41:38 2004",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and M. Kolatis",
  title =        "Call Conversion Interface ({CCI}) for {LAPACK\slash
  type =         "LAPACK Working Note",
  number =       "82",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-250, August, 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Constructing Numerical Software Libraries for {HPCC}
  crossref =     "IEEE:1994:PTI",
  pages =        "4--??",
  year =         "1994",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  note =         "IEEE catalog number 94TH0667-6.",
  abstract =     "Numerical software libraries have long been used in
                 engineering and scientific computations on workstations
                 and mainframes, but are just now becoming widely
                 available on HPCC platforms. We describe recent
                 developments in the SCALAPACK numerical linear algebra
                 library, which have recently become available for
                 currently existing massively parallel machines and
                 networks of workstations. We outline SCALAPACK's
                 functionality and current performance. We also describe
                 our efforts to ease technology transfers by providing
                 24-hour electronic access and on-line books of
                 `templates' to help users find the best program to
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "TN, USA",
  classcodes =   "C7310 (Mathematics); C4140 (Linear algebra); C5620
                 (Computer networks and techniques); C5440
                 (Multiprocessor systems and techniques)",
  classification = "722.3; 722.4; 723.2; 901.3; 901.4; 921.1",
  conference =   "Proceedings of the 3rd IEEE International Symposium on
                 High Performance Distributed Computing",
  conflocation = "San Francisco, CA, USA; 2-5 Aug. 1994",
  conftitle =    "Proceedings of 3rd IEEE International Symposium on
                 High Performance Distributed Computing",
  corpsource =   "Oak Ridge Nat. Lab., TN, USA",
  keywords =     "24-hour electronic access; computer networks; Computer
                 software; Computer workstations; computing; Engineering
                 research; HPCC; HPCC environments; Linear algebra;
                 linear algebra; massively parallel machines;
                 mathematics; Numerical software libraries; numerical
                 software libraries; online books; parallel machines;
                 Parallel processing systems; platforms; SCALAPACK
                 numerical linear algebra library; Software engineering;
                 Software package SCALAPACK; subroutines; technology;
                 Technology transfer; templates; transfer;
  meetingabr =   "Proc 3 IEEE Int Symp High Perform Distrib Comput",
  meetingaddress = "San Francisco, CA, USA",
  meetingdate =  "Aug 2--5 1994",
  meetingdate2 = "08/02--05/94",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "IEEE Computer Society",
  sponsororg =   "IEEE Comput. Soc. Tech. Committee on Distributed
                 Process.; Northeast Parallel Archit. Center (NPAC) at
                 Syracuse Univ.; ACM SIGCOMM",
  treatment =    "P Practical",

  author =       "J. Dongarra and D. Reed",
  title =        "Introduction to the {HPC} Early Evaluation Vendor
  crossref =     "Anonymous:1994:HPC",
  pages =        "131--134",
  year =         "1994",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Michael Kolatis",
  title =        "{IBM RS\slash 6000-550 \& -590} Performance for
                 Selected Routines in {ESSL}",
  type =         "LAPACK Working Note",
  number =       "71",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-231, April 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Performance of {LAPACK}",
  crossref =     "Gilbert:1994:LMP",
  pages =        "55--68 (or 55--67??)",
  year =         "1994",
  MRclass =      "65-04",
  MRnumber =     "1 285 625",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. A. {Van de Geijn} and D. W.
  title =        "Scalability Issues Affecting the Design of a Dense
                 Linear Algebra Library",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "22",
  number =       "3",
  pages =        "523--537",
  month =        sep,
  year =         "1994",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C6130 (Data handling
                 techniques); C6110P (Parallel programming); C4240P
                 (Parallel programming and algorithm theory); C7310
                 (Mathematics); C6150N (Distributed systems)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  keywords =     "128-node Intel iPSC/860; block cyclic data
                 distribution; block-partitioned algorithms; Cholesky;
                 computers; computing; data; dense linear algebra
                 library; distributed memory systems; factorization
                 routines; hypercube; LAPACK; library; linear algebra;
                 LU factorization routines; manipulation; mathematics;
                 memory hierarchy; MIMD distributed memory concurrent;
                 movement; parallel block-; parallel programming;
                 partitioned algorithms; performance; QR; scalability
                 issues; ScaLAPACK mathematical software library;
                 sequential block-partitioned algorithms; subroutines;
                 symbol; timings",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. Dongarra and A. Lumsdaine and X. Niu and R. Pozo
                 and K. Remington",
  title =        "A Sparse Matrix Library in {C++} for High Performance
  type =         "LAPACK Working Note",
  number =       "74",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jul,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-236, July 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and A. Lumsdaine and X. Niu and R. Pozo
                 and K. Remington",
  title =        "A Sparse Matrix Library in {C++} For High Performance
  crossref =     "Anonymous:1994:OON",
  pages =        "214--218",
  year =         "1994",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and R. Pozo and D. W. Walker",
  title =        "{ScaLAPACK++}: an object oriented linear algebra
                 library for scalable systems",
  crossref =     "IEEE:1994:PSP",
  pages =        "216--223",
  year =         "1994",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics); C6110B (Software engineering
                 techniques); C5440 (Multiprocessor systems and
                 techniques); C6115 (Programming support); C4140 (Linear
                 algebra); C6110J (Object-oriented programming)",
  conflocation = "Mississippi State, MS, USA; 6-8 Oct. 1993",
  conftitle =    "Proceedings of Scalable Parallel Libraries
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  keywords =     "computing; distributed memory multicomputers;
                 distributed memory systems; flexibility; linear
                 algebra; LU factorization; mathematics; matrix
                 operations; object oriented linear algebra library;
                 object-oriented programming; portability;
                 right-looking; scalable systems; ScaLAPACK++; software;
                 software tools; sparse",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Mississippi State Univ.; Nat. Sci. Found",
  treatment =    "A Application; P Practical",

  author =       "Al Geist and Adam Beguelin and Jack Dongarra and
                 Weicheng Jiang and Robert Manchek and Vaidy Sunderam",
  title =        "{PVM}: Parallel Virtual Machine: a Users' Guide and
                 Tutorial for Networked Parallel Computing",
  publisher =    pub-MIT,
  address =      pub-MIT:adr,
  pages =        "xvii + 279",
  year =         "1994",
  ISBN =         "0-262-57108-0 (paperback)",
  ISBN-13 =      "978-0-262-57108-1 (paperback)",
  LCCN =         "QA76.58 .P85 1994",
  bibdate =      "Thu Feb 29 17:35:15 1996",
  bibsource =    "",
  price =        "US\$19.95",
  series =       "Scientific and engineering computation",
  acknowledgement = ack-nhfb,
  keywords =     "Computer networks.; Networks --- Parallel programming;
                 Parallel computers.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "{PARKBENCH Committee\slash Assembled by R. Hockney
                 (Chairman) and M. Berry (Secretary)}",
  title =        "{PARKBENCH} Report: Public International Benchmarks
                 for Parallel Computers",
  journal =      j-SCI-PROG,
  volume =       "3",
  number =       "2",
  pages =        "101--146",
  month =        "Summer",
  year =         "1994",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. S. Plank and Y. Kim and J. J. Dongarra",
  title =        "Algorithm-Based Diskless Checkpointing for Fault
                 Tolerant Matrix Operations",
  type =         "LAPACK Working Note",
  number =       "90",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        dec,
  year =         "1994",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-94-268, December 1994.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Francis Sullivan and Jack Dongarra",
  title =        "Algorithm Design for Large-Scale Computations",
  journal =      j-IJSA,
  volume =       "1",
  number =       "1",
  pages =        "99--105",
  month =        mar,
  year =         "1987",
  CODEN =        "IJSAE9",
  DOI =          "",
  ISSN =         "0890-2720",
  bibdate =      "Tue Nov 6 11:28:49 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "The International Journal of Supercomputer
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "V. S. Sunderam and G. A. Geist and J. Dongarra and R.
  title =        "The {PVM} concurrent computing system: Evolution,
                 experiences, and trends",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "20",
  number =       "4",
  pages =        "531--545",
  day =          "31",
  month =        mar,
  year =         "1994",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "B6210L (Computer communications); C6110P (Parallel
                 programming); C6150N (Distributed systems); C5620
                 (Computer networks and techniques)",
  corpsource =   "Dept. of Math. and Comput. Sci., Emory Univ., Atlanta,
                 GA, USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  keywords =     "auxiliary facilities; case studies; climate modeling;
                 communication overheads; computer networks; computing
                 model; environmental science; experimental
                 enhancements; heterogeneous; heterogeneous concurrent
                 computing; interface; large scale scientific
                 supercomputing; materials science; message passing;
                 message passing model; MPP; network computing;
                 networked computing platforms; networked environments;
                 parallel processing; parallel programming; process
                 groups; programming; PVM concurrent computing system;
                 software framework; support",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "E. Anderson and Z. Bai and C. Bischof and J. Demmel
                 and J. Dongarra and J. {Du Croz} and A. Greenbaum and
                 S. Hammarling and A. McKenney and S. Ostrouchov and D.
                 Sorensen",
  title =        "{LAPACK} Users' Guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  edition =      "Second",
  pages =        "xix + 325",
  year =         "1995",
  ISBN =         "0-89871-345-5 (paperback)",
  ISBN-13 =      "978-0-89871-345-9 (paperback)",
  LCCN =         "QA76.73.F25 L36 1995",
  bibdate =      "Sat Dec 06 17:25:09 2003",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  keywords =     "algebras, linear -- data processing; Fortran (computer
                 program language); LAPACK; subroutines (computer
                 programs)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Z. Bai and J. Demmel and J. Dongarra and A. Petitet
                 and H. Robinson and K. Stanley",
  title =        "The Spectral Decomposition of Nonsymmetric Matrices on
                 Distributed Memory Parallel Computers",
  type =         "LAPACK Working Note",
  number =       "91",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jan,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-273, January 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Z. Bai and D. Day and J. Demmel and J. Dongarra and M.
                 Gu and A. Ruhe and H. van der Vorst",
  title =        "Templates for Linear Algebra Problems",
  type =         "LAPACK Working Note",
  number =       "106",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    ";
  note =         "UT-CS-95-311, October 1995. Published in
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Z. Bai and D. Day and J. Demmel and J. Dongarra",
  title =        "Templates for Linear Algebra Problems",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1000",
  pages =        "115--??",
  year =         "1995",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat May 11 13:45:32 MDT 1996",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Adam Beguelin and Jack Dongarra and Al Geist and
                 Robert Manchek and Vaidy Sunderam",
  title =        "Recent enhancements to {PVM}",
  journal =      j-IJSAHPC,
  volume =       "9",
  number =       "2",
  pages =        "108--127",
  month =        "Summer",
  year =         "1995",
  CODEN =        "IJSCFG",
  DOI =          "",
  ISSN =         "1078-3482",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          "",
  abstract =     "This paper presents new features of PVM, a popular
                 standard for writing parallel programs that execute
                 over networks of heterogeneous machines. Although PVM
                 has become an important infrastructure for parallel
                 programmers, we continue to develop the system based
                 both on user feedback and our own research interests.
                 In this paper we present new communications routines
                 and briefly characterize their performance. We describe
                 new extensible services that allow advanced users to
                 customize certain aspects of the default PVM
                 functionality. An overview of shared-memory PVM
                 optimizations is presented. PVM's new tracing facility
                 and a graphical console that utilizes this capability
                 are described. Finally, we discuss future extensions to
                 PVM now under investigation.",
  acknowledgement = ack-nhfb,
  affiliation =  "Carnegie Mellon Univ",
  affiliationaddress = "Pittsburgh, PA, USA",
  classcodes =   "C6110P (Parallel programming); C5440 (Multiprocessing
                 systems); C6150N (Distributed systems software); C6115
                 (Programming support)",
  classification = "722.1; 722.2; 722.4; 723.1; 723.1.1; 921.5",
  corpsource =   "Sch. of Comput. Sci., Carnegie Mellon Univ.,
                 Pittsburgh, PA, USA",
  fjournal =     "International Journal of Supercomputer Applications
                 and High Performance Computing",
  journal-URL =  "",
  journalabr =   "Int J Supercomput Appl High Perform Comput",
  keywords =     "advanced users; communications; Computer architecture;
                 Computer networks; Computer programming languages;
                 Computer software; console; Data communication systems;
                 Data storage equipment; evaluation; extensible
                 services; graphical; heterogeneous machines; Message
                 passing; Optimization; parallel machines; Parallel
                 processing systems; parallel programmers; parallel
                 programming; parallel programs; Parallel virtual
                 machine; Parallel Virtual Machine; performance; PVM;
                 routines; Shared memory; shared memory; shared-memory
                 PVM optimizations; software libraries; software
                 performance; software standards; standard; systems;
                 tracing facility; user feedback; virtual machines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "Michael W. Berry and Jack J. Dongarra and Youngbae
                 Kim",
  title =        "A parallel algorithm for the reduction of a
                 nonsymmetric matrix to block upper-{Hessenberg} form",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "21",
  number =       "8",
  pages =        "1189--1211",
  day =          "10",
  month =        aug,
  year =         "1995",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65Y05 (65F15)",
  MRnumber =     "1 343 401, 96c:65223",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  abstract =     "In this paper, we present an algorithm for the
                 reduction to block upper-Hessenberg form which can be
                 used to solve the nonsymmetric eigenvalue problem on
                 message-passing multicomputers. On such multicomputers,
                 a nonsymmetric matrix can be distributed across
                 processing nodes logically configured into a
                 two-dimensional mesh using the block-cyclic data
                 distribution. Based on the matrix partitioning and
                 mapping, the algorithm employs both Householder
                 reflectors and Givens rotations within each reduction
                 step. We analyze the arithmetic and communication
                 complexities and describe the implementation details of
                 the algorithm on message-passing multicomputers. We
                 discuss two different implementations --- synchronous
                 and asynchronous --- and present performance results on
                 the Intel iPSC\slash 860 and DELTA. We conclude with an
                 evaluation of the algorithm's communication cost, and
                 suggest areas for further improvement.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classcodes =   "C4240P (Parallel programming and algorithm theory);
                 C6110P (Parallel programming); C4140 (Linear algebra);
                 C5440 (Multiprocessing systems)",
  classification = "721.1; 722.3; 722.4; 723; 921; 921.1",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "Algorithms; algorithms; block; block-cyclic data
                 distribution; communication complexities; communication
                 complexity; Computational complexity; Data
                 communication systems; DELTA; dimensional mesh;
                 Distributed computer systems; Distributed memory
                 multiprocessors; distributed memory systems;
                 Eigenvalues and eigenfunctions; eigenvalues and
                 eigenfunctions; Givens; Householder reflectors; Intel
                 iPSC/860; linear algebra; mapping; matrix;
                 message-passing multicomputers; Nonsymmetric eigenvalue
                 problem; nonsymmetric eigenvalue problem; nonsymmetric
                 matrix reduction; parallel; Parallel algorithm;
                 parallel algorithm; Parallel processing systems;
                 partitioning; performance results; Problem solving;
                 processing nodes; rotations; two-; Upper-Hessenberg
                 form; upper-Hessenberg form",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "Ronald Boisvert and Shirley Browne and Jack Dongarra",
  booktitle =    "A Forum on Research and Technology Advances in Digital
                 Libraries {(DL'95)}, May 15--19, 1995, {McLean} {VA}",
  title =        "Digital Software and Data Repositories for Support of
                 Scientific Computing",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  month =        may,
  year =         "1995",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "McLean, Virginia",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Browne and Jack Dongarra and Geoffrey C. Fox
                 and Ken Hawick and Ken Kennedy and Rick Stevens and
                 Robert Olson and Tom Rowan",
  title =        "Distributed Information Management in the {National
                 HPCC Software Exchange}",
  crossref =     "Karin:1995:PAI",
  volume =       "1",
  pages =        "463--477",
  year =         "1995",
  bibdate =      "Thu Nov 7 06:34:19 1996",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Browne and Jack Dongarra and Stan Green and
                 Keith Moore and Theresa Pepin and Tom Rowan and Reed
                 Wade and Eric Grosse",
  booktitle =    "Symposium on Software Reusability",
  title =        "Location-Independent Naming for Virtual Distributed
                 Software Repositories",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "179--185",
  month =        apr,
  year =         "1995",
  bibdate =      "Mon Aug 26 07:53:48 1996",
  bibsource =    "Compendex database;
  note =         "Seattle, Washington",
  URL =          "",
  abstract =     "A location-independent naming system for network
                 resources has been designed to facilitate organization
                 and description of software components accessible
                 through a virtual distributed repository. This naming
                 system enables easy and efficient searching and
                 retrieval, and it addresses many of the consistency,
                 authenticity, and integrity issues involved with
                 distributed software repositories by providing
                 mechanisms for grouping resources and for authenticity
                 and integrity checking. This paper details the design
                 of the naming system, describes a prototype
                 implementation of some of the capabilities, and
                 describes how the system fits into the development of
                 the National HPCC Software Exchange, a virtual software
                 repository that has the goal of providing access to
                 reusable software components for high-performance
                 computing.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classification = "722.2; 723.1",
  conference =   "Proceedings of the ACM SIGSOFT Symposium on Software
                 Reusability",
  journalabr =   "ACM SIGSOFT Symp Software Reusability SSR",
  keywords =     "Authenticity checking; Computer networks; Computer
                 software; Computer software selection and evaluation;
                 High performance computing; Integrity checking;
                 Interfaces (computer); Naming system; Resource
                 allocation; Software repository",
  meetingaddress = "Seattle, WA, USA",
  meetingdate =  "Apr 28--30 1995",
  meetingdate2 = "04/28--30/95",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Browne and Jack Dongarra and Stan Green and
                 Keith Moore and Theresa Pepin and Tom Rowan and Reed
                 Wade and Eric Grosse",
  title =        "Location-independent naming for virtual distributed
                 software repositories",
  journal =      j-SIGSOFT,
  volume =       "20",
  number =       "SI",
  pages =        "179--185",
  year =         "1995",
  CODEN =        "SFENDP",
  DOI =          "",
  ISSN =         "0163-5948 (print), 1943-5843 (electronic)",
  ISSN-L =       "0163-5948",
  bibdate =      "Wed Aug 1 17:13:04 MDT 2018",
  bibsource =    ";
  abstract =     "A location-independent naming system for network
                 resources has been designed to facilitate organization
                 and description of software components accessible
                 through a virtual distributed repository. This naming
                 system enables easy and efficient searching and
                 retrieval, and it addresses many of the consistency,
                 authenticity, and integrity issues involved with
                 distributed software repositories by providing
                 mechanisms for grouping resources and for authenticity
                 and integrity checking. This paper details the design
                 of the naming system, describes how the system fits
                 into the development of the National HPCC Software
                 Exchange, a virtual software repository that has the
                 goal of providing access to reusable software
                 components for high-performance computing.",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGSOFT Software Engineering Notes",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "SSR '95 Proceedings of the 1995 Symposium on Software
                 reusability",

  author =       "Shirley Browne and Jack Dongarra and Stan Green and
                 Keith Moore and Theresa Pepin and Tom Rowan and Reed
                 Wade and Eric Grosse",
  editor =       "Mansur H. Samadzadeh and Mansour K. Zand",
  booktitle =    "Proceedings of the {ACM} {SIGSOFT} Symposium on
                 Software Reusability {(SSR '95)}, April 28--30, 1995,
                 Seattle, Washington, {USA}: co-located with the 17th
                 International Conference on Software Engineering
                 {(ICSE-17)}, April 23--30, 1995",
  title =        "Location-independent naming for virtual distributed
                 software repositories",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  bookpages =    "ix + 272",
  pages =        "179--185",
  month =        aug,
  year =         "1995",
  CODEN =        "SFENDP",
  ISBN =         "0-89791-739-1",
  ISBN-13 =      "978-0-89791-739-1",
  ISSN =         "0163-5948 (print), 1943-5843 (electronic)",
  LCCN =         "QA76.6 .S62 v.20 1995",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  note =         "ACM order number 595950.",
  URL =          ";
  abstract =     "A location-independent naming system for network
                 resources has been designed to facilitate organization
                 and description of software components accessible
                 through a virtual distributed repository. This naming
                 system enables easy and efficient searching and
                 retrieval, and it addresses many of the consistency,
                 authenticity, and integrity issues involved with
                 distributed software repositories by providing
                 mechanisms for grouping resources and for authenticity
                 and integrity checking. This paper details the design
                 of the naming system, describes a prototype
                 implementation of some of the capabilities, and
                 describes how the system fits into the development of
                 the National HPCC Software Exchange, a virtual software
                 repository that has the goal of providing access to
                 reusable software components for high-performance
                 computing.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classcodes =   "C6110B (Software engineering techniques); C6120 (File
                 organisation); C6115 (Programming support); C6150N
                 (Distributed systems software)",
  classification = "722.2; 723.1",
  conference =   "Proceedings of the ACM SIGSOFT Symposium on Software
                 Reusability",
  conflocation = "Seattle, WA, USA; 28-30 April 1995",
  conftitle =    "SSR'95: Symposium on Software Reusability",
  corpsource =   "Tennessee Univ., TN, USA",
  journalabr =   "ACM SIGSOFT Symp Software Reusability SSR",
  keywords =     "authenticity; Authenticity checking; Computer
                 networks; Computer software; Computer software
                 selection and evaluation; consistency; data integrity;
                 distributed processing; High performance computing;
                 high-; Integrity checking; integrity checking;
                 Interfaces (computer); location-independent naming;
                 naming services; Naming system; naming system; National
                 HPCC Software Exchange; network resources; performance
                 computing; prototype implementation; repositories;
                 Resource allocation; retrieval; reusable software;
                 searching; security of data; software libraries;
                 Software repository; software reusability; virtual
                 distributed software; virtual software repository",
  meetingaddress = "Seattle, WA, USA",
  meetingdate =  "Apr 28--30 1995",
  meetingdate2 = "04/28--30/95",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "ACM",
  treatment =    "P Practical",

  author =       "Shirley Browne and Jack Dongarra and Geoffrey C. Fox
                 and Ken Hawick and Ken Kennedy and Rick Stevens and
                 Robert Olson and Tom Rowan",
  editor =       "Frank M. Shipman and Richard Furuta and David M.
                 Levy",
  booktitle =    "Proceedings of Digital Libraries '95: the {Second
                 Annual Conference on the Theory and Practice of Digital
                 Libraries, June 11--13, 1995, Austin, Texas}",
  title =        "Management of the {NHSE} --- {A Virtual Distributed
                 Digital Library: June 11--13, 1995, Austin, TX}",
  publisher =    "Hypermedia Research Laboratory, Texas A\&M
                 University",
  address =      "College Station, TX",
  pages =        "??--??",
  year =         "1995",
  LCCN =         "Z699.A1 D54 1995",
  bibdate =      "Tue Oct 22 15:45:07 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxISBN =       "none",

  author =       "Shirley Browne and Jack Dongarra and Jeff Horner and
                 Paul McMahan and Scott Wells",
  title =        "{National HPCC Software Exchange (NHSE)}: Uniting the
                 High Performance Computing and Communications
                 Community",
  journal =      j-D-LIB-MAGAZINE,
  day =          "15",
  month =        may,
  year =         "1995",
  DOI =          "",
  ISSN =         "1082-9873",
  bibdate =      "Wed May 09 10:46:47 2007",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "D-Lib magazine: the magazine of the Digital Library
                 Forum",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "Document ID

  author =       "Shirley Browne and Jack Dongarra and Stan Green and
                 Keith Moore and Tom Rowan and Reed Wade and Geoffrey
                 Fox and Ken Hawick and Ken Kennedy and Jim Pool and
                 Rick Stevens and Bob Olson and Terry Disz",
  title =        "The {National HPCC Software Exchange}",
  journal =      j-IEEE-COMPUT-SCI-ENG,
  volume =       "2",
  number =       "2",
  pages =        "62--69",
  month =        "Summer",
  year =         "1995",
  CODEN =        "ISCEE4",
  DOI =          "",
  ISSN =         "1070-9924 (print), 1558-190X (electronic)",
  ISSN-L =       "1070-9924",
  bibdate =      "Sat Jan 9 08:57:23 MST 1999",
  bibsource =    "Compendex database;
  URL =          ";
  abstract =     "The National HPCC Software Exchange (NHSE) is an
                 Internet-accessible resource that promotes software and
                 information exchange among those involved with
                 high-performance computing and communications. Now in
                 its infancy, the NHSE will link varied
                 discipline-oriented repositories of software and
                 documents, and encourage Grand Challenge teams and
                 other members of the HPCC community to contribute to
                 these repositories and use them. By acting as a
                 national on-line library of software that makes widely
                 distributed materials available through one place, the
                 exchange will cut down the amount of time, talent, and
                 money spent reinventing the wheel. Target audiences
                 include scientists and engineers in diverse HPCC
                 applications fields, computer scientists, users of
                 government and academic supercomputer centers, and
                 industrial users.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  classcodes =   "C7210 (Information services and centres); C6130E (Data
                 interchange); C6000 (Computer software); C0310B
                 (Computer facilities)",
  classification = "722.2; 722.3; 722.4; 723.1; 723.3; 903.3",
  corpsource =   "Tennessee Univ., Knoxville, TN, USA",
  fjournal =     "IEEE Computational Science \& Engineering",
  journal-URL =  "",
  journalabr =   "IEEE Comput Sci Eng",
  keywords =     "Browsing; Cataloging information; computer facilities;
                 Computer networks; Computer software; Data
                 communication systems; Database systems;
                 discipline-oriented repositories; Distributed computer
                 systems; electronic data interchange; engineers; Expert
                 systems; Grand Challenge teams; Harvest system;
                 high-performance communications; high-performance
                 computing; Hypertext links; Hypertext roadmap;
                 industrial users; information exchange; Information
                 retrieval systems; information services; information
                 sharing; Internet; Internet-accessible resource;
                 National HPCC Software Exchange; national online
                 software library; Parallel processing systems; Program
                 debugging; scientists; Software engineering; software
                 libraries; software sharing; supercomputer centers;
                 Supercomputers; Technology transfer; User interfaces;
                 widely distributed materials",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "G General Review",

  author =       "Shirley Browne and Jack Dongarra and Eric Grosse and
                 Tom Rowan",
  title =        "The {Netlib Mathematical Software Repository}",
  journal =      j-D-LIB-MAGAZINE,
  month =        sep,
  year =         "1995",
  ISSN =         "1082-9873",
  bibdate =      "Wed Nov 1 16:13:40 1995",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "D-Lib magazine: the magazine of the Digital Library
                 Forum",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "Document ID

  author =       "James C. Browne and Syed I. Hyder and Jack Dongarra
                 and Keith Moore and Peter Newton",
  title =        "Visual programming and debugging for parallel
                 computing",
  journal =      j-IEEE-PAR-DIST-TECH,
  volume =       "3",
  number =       "1",
  pages =        "75--83",
  month =        "Spring",
  year =         "1995",
  CODEN =        "IPDTEX",
  DOI =          "",
  ISSN =         "1063-6552 (print), 1558-1861 (electronic)",
  ISSN-L =       "1063-6552",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  abstract =     "In this article, visual parallel programming is
                 discussed and how it is implemented in two integrated
                 programming environments --- Computationally Oriented
                 Display Environment (CODE) and Heterogeneous Network
                 Computing Environment (Hence) --- that represent
                 parallel programs as directed graphs. With visual
                 parallel programming languages, performance and logical
                 debugging can be carried out with the same
                 representation used for programming. The article
                 focuses on logical debugging.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Texas at Austin",
  affiliationaddress = "Austin, TX, USA",
  classcodes =   "C6110P (Parallel programming); C6110V (Visual
                 programming); C6130B (Graphics techniques); C6115
                 (Programming support); C6150G (Diagnostic, testing,
                 debugging and evaluating systems); C6150N (Distributed
                 systems software); C1160 (Combinatorial mathematics)",
  classification = "722; 722.4; 723; 723.1; 723.1.1; 723.5",
  corpsource =   "Texas Univ., Austin, TX, USA",
  fjournal =     "IEEE Parallel and Distributed Technology: Systems and
                 Applications",
  journalabr =   "IEEE Parallel Distrib Technol",
  keywords =     "annotated directed graph; Computational methods;
                 Computationally Oriented Display Environment;
                 computations; Computer architecture; Computer graphics;
                 Computer programming; Computer programming languages;
                 debugging; directed graphs; Flowcharting;
                 Heterogeneous; integrated programming environments;
                 Network Computing Environment; Parallel algorithms;
                 parallel computing; Parallel processing systems;
                 parallel programming; Parallel programs; parallel
                 programs; parallel structure; Program compilers;
                 Program debugging; program debugging; program
                 sequential; programming; Programming environment;
                 programming environments; representations; visual
                 parallel; Visual parallel programming; visual
                 programming",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Henri Casanova and Jack Dongarra and Weicheng Jiang",
  title =        "The Performance of {PVM} on {MPP} Systems",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        aug,
  year =         "1995",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Choi and J. Dongarra and D. Walker",
  title =        "The Design of a Parallel Dense Linear Algebra Software
                 Library: Reduction to {Hessenberg}, Tridiagonal, and
                 Bidiagonal Form",
  type =         "LAPACK Working Note",
  number =       "92",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        feb,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-275, February 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and Jack J. Dongarra and David W.
                 Walker",
  title =        "The design of a parallel dense linear algebra software
                 library: reduction to {Hessenberg}, tridiagonal, and
                 bidiagonal form",
  journal =      j-NUMER-ALGORITHMS,
  volume =       "10",
  number =       "3--4",
  pages =        "379--399",
  month =        oct,
  year =         "1995",
  CODEN =        "NUALEG",
  ISSN =         "1017-1398 (print), 1572-9265 (electronic)",
  ISSN-L =       "1017-1398",
  MRclass =      "65-04 (65Y10)",
  MRnumber =     "1 355 739",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "B0290H (Linear algebra); C7310 (Mathematics
                 computing); C4140 (Linear algebra); C6110B (Software
                 engineering techniques); C6115 (Programming support)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  fjournal =     "Numerical Algorithms",
  journal-URL =  "",
  keywords =     "Basic Linear Algebra Communication; bidiagonal; BLACS;
                 computers; computing; dense; distributed memory
                 concurrent; eigenproblems; eigenvalues and
                 eigenfunctions; form; Hessenberg form; LAPACK; linear
                 algebra; linear algebra computations; mathematics;
                 matrices; matrix reduction algorithms; parallel BLAS;
                 parallel dense linear algebra software library;
                 routine; ScaLAPACK; sequencing BLAS; software
                 engineering; software libraries; Subprograms;
                 tridiagonal form",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "Jaeyoung Choi and Jack J. Dongarra and David W.
                 Walker",
  title =        "Parallel matrix transpose algorithms on distributed
                 memory concurrent computers",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "21",
  number =       "9",
  pages =        "1387--1405",
  day =          "12",
  month =        sep,
  year =         "1995",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F10 (65Y05)",
  MRnumber =     "1 349 482",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  abstract =     "Several parallel matrix transpose algorithms on
                 distributed memory concurrent processors are described.
                 It is assumed that the matrix is distributed over a
                 $ P \times Q $ processor template with a block cyclic data
                 distribution. The greatest common divisor (GCD) of P
                 and Q determine the communication schemes of the
                 algorithms. Since the algorithms make use of
                 non-blocking, point-to-point communication between
                 processors, a process can overlap the messages that it
                 sends to different processors, thereby avoiding
                 unnecessary synchronization. By combining the
                 algorithms with the matrix multiplication routine, they
                 can be used to compute parallel multiplications of
                 transposed matrices in the PUMMA package. Finally,
                 details of the parallel implementation of the
                 algorithms are given, and the results are presented for
                 runs on the Intel Touchstone Delta computer.",
  acknowledgement = ack-nhfb,
  affiliation =  "Soongsil Univ",
  affiliationaddress = "Seoul, S Korea",
  classcodes =   "C4240P (Parallel programming and algorithm theory);
                 C4140 (Linear algebra); C6110P (Parallel programming)",
  classification = "722.3; 722.4; 921.1; 921.6",
  corpsource =   "Sch. of Comput., Soongsil Univ., Seoul, South Korea",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "algorithm; Block cyclic data distribution;
                 communication; complete exchange communication;
                 Computational methods; concurrent computers; Data
                 communication systems; Digital arithmetic; Distributed
                 computer systems; distributed memory; distributed
                 memory concurrent; Distributed memory concurrent
                 computers; greatest common divisor; matrix; Matrix
                 algebra; matrix multiplication; Matrix multiplication
                 routine; matrix transpose; multiplication routine;
                 Nonblocking communication; nonblocking point-to-point
                 communication; operations; Parallel algorithms;
                 parallel algorithms; Parallel matrix transpose
                 algorithms; parallel matrix transpose algorithms;
                 Parallel processing systems; processors; Transfer
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. Choi and J. Dongarra and S. Ostrouchov and A.
                 Petitet and D. Walker and R. C. Whaley",
  title =        "A Proposal for a Set of Parallel Basic Linear Algebra
  type =         "LAPACK Working Note",
  number =       "100",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "LAPACK Working Note \#100. UT-CS-95-292, May 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and J. J. Dongarra",
  title =        "Scalable Linear Algebra Software Libraries for
                 Distributed Memory Concurrent Computers",
  crossref =     "IEEE:1995:PFI",
  pages =        "170--177",
  year =         "1995",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  note =         "IEEE catalog number 95TB8106.",
  abstract =     "The design of ScaLAPACK, a scalable software library
                 for performing dense and banded linear algebra
                 computations on distributed memory concurrent
                 computers, is discussed. They are implemented using a
                 block cyclic data distribution, and are built using de
                 facto standard kernels for matrix and vector operations
                 and message passing communication. The details of the
                 implementation of the ScaLAPACK LU factorization
                 routine, and performance and scalability results on the
                 Intel iPSC\slash 860, Touchstone Delta, and Paragon
                 systems are presented.",
  acknowledgement = ack-nhfb,
  affiliation =  "Soongsil Univ",
  affiliationaddress = "Seoul, S Korea",
  classcodes =   "C6110P (Parallel programming); C6115 (Programming
                 support); C6110B (Software engineering techniques)",
  classification = "722.1; 722.4; 723.1; 723.3; 723.5; 921.1",
  conference =   "Proceedings of the 5th IEEE Computer Society Workshop
                 on Future Trends of Distributed Computing Systems",
  conflocation = "Cheju Island, South Korea; 28-30 Aug. 1995",
  conftitle =    "Proceedings of the Fifth IEEE Computer Society
                 Workshop on Future Trends of Distributed Computing
  corpsource =   "Sch. of Comput., Soongsil Univ., Seoul, South Korea",
  journalabr =   "Proc IEEE Computer Soc Workshop Future Trends Distrib
  keywords =     "Algorithms; block cyclic data distribution; Block
                 cyclic data distribution; communication; Computer
                 architecture; Computer software; Concurrency control;
                 core factorization routines; Data storage equipment; de
                 facto standard kernels; distributed; Distributed
                 computer systems; Distributed database systems;
                 Distributed-memory concurrent computers; Hierarchical
                 systems; Intel iPSC/860; library; Linear algebra;
                 Matrix algebra; matrix operations; memory concurrent
                 computers; message passing; Message passing
                 communication; Non-uniform memory access machines;
                 operations; Paragon systems; parallel implementations;
                 parallel programming; Performance; scalable linear
                 algebra software libraries; scalable software;
                 ScaLAPACK library; Shared memory computers; Software
                 engineering; software libraries; software reusability;
                 Standard kernels; symbol manipulation; Touchstone
                 Delta; vector; Vectors",
  meetingaddress = "Cheju Island, South Korea",
  meetingdate =  "Aug 28--30 1995",
  meetingdate2 = "08/28--30/95",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "IEEE",
  sponsororg =   "IEEE Comput. Soc. Tech. Committee on Distributed
                 Process.; IFIP WG 10.4 on Dependable Comput.; Korea
                 Inf. Sci. Soc. (KISS); Electron. and Telecommun. Res.
                 Inst. (ETRI) Korea; Korea Res. Found.; Samsung Data
  treatment =    "P Practical",

  author =       "J. Choi and J. Demmel and I. Dhillon and J. Dongarra
                 and S. Ostrouchov and A. Petitet and K. Stanley and D.
                 Walker and R. C. Whaley",
  title =        "{ScaLAPACK}: a Portable Linear Algebra Library for
                 Distributed Memory Computers --- Design Issues and
  type =         "LAPACK Working Note",
  number =       "95",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        mar,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "LAPACK Working Note \#95. UT-CS-95-283, March 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. J. Dongarra and B. Tourancheau",
  title =        "Performance study of {$ L U $} factorization with low
                 communication overhead on multiprocessors",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "5",
  number =       "2",
  pages =        "157--169",
  month =        jun,
  year =         "1995",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C4240C (Computational
                 complexity); C5470 (Performance evaluation and
                 testing); C5440 (Multiprocessing systems)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  keywords =     "asynchronous communications; column-scattered data
                 decomposition; complexities; computational;
                 computational complexity; Intel iPSC/860; low
                 communication; LU factorization; mathematics computing;
                 multiprocessing systems; multiprocessors; overhead;
                 Paragon machines; performance evaluation; performance
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "J. J. Dongarra and H. W. Meuer and E. Strohmaier",
  title =        "The Aims",
  journal =      j-SUPERCOMPUTER,
  volume =       "11",
  number =       "2--3",
  pages =        "4--5",
  month =        "????",
  year =         "1995",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputer",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and S. Hammarling and S. Ostrouchov",
  title =        "{BLAS} Technical Workshop",
  type =         "LAPACK Working Note",
  number =       "109",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-317, November 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "Heterogeneous Network-Based Computing Systems",
  crossref =     "Dongarra:1995:HPC",
  pages =        "5--16",
  year =         "1995",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Steve W. Otto and Marc Snir and
                 David Walker",
  title =        "An Introduction to the {MPI Standard}",
  type =         "Technical report",
  number =       "CS-95-274",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        jan,
  year =         "1995",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Appears in CACM \cite{Dongarra:1996:MPS}.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and A. Lumsdaine and R. Pozo and K.
  title =        "{IML++ v. 1.2}: Iterative Methods Library Reference
  type =         "LAPACK Working Note",
  number =       "102",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-303, August 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and R. Pozo and D. Walker",
  title =        "{LAPACK++ V. 1.0}: High Performance Linear Algebra
                 Users' Guide",
  type =         "LAPACK Working Note",
  number =       "98",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-290, May 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and T. Hey",
  title =        "The {ParkBench} Benchmark Collection",
  journal =      j-SUPERCOMPUTER,
  volume =       "11",
  number =       "2--3",
  pages =        "94--114",
  month =        jun,
  year =         "1995",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6150C (Compilers, interpreters and other processors);
                 C5440 (Multiprocessing systems)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Supercomputer",
  keywords =     "application kernels; compact research applications;
                 hierarchical structure; low-level benchmarks; parallel
                 processing; ParkBench benchmark collection; performance
                 characteristics; program compilers; synthetic compiler
                 benchmark suite",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "J. J. Dongarra and J. {Du Croz} and S. Hammarling and
                 J. Wasniewski and A. Zemla",
  title =        "A Proposal for a {Fortran 90} Interface for {LAPACK}",
  type =         "LAPACK Working Note",
  number =       "101",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jul,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-295, July 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software",
  type =         "Technical Report",
  number =       "CS-89-85",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  pages =        "34",
  month =        feb,
  year =         "1995",
  bibdate =      "Fri Apr 7 09:38:01 GMT 1995",
  bibsource =    "",
  mynote =       "An earlier version was Tech. Memo 23, Argonne, 1985.
                 Has kept 1989 CS report number!",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and V. Eijkhout and A. Kalhan",
  title =        "Reverse Communication Interface for Linear Algebra
                 Templates for Iterative Methods",
  type =         "LAPACK Working Note",
  number =       "99",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "1995",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-95-291, May 1995.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Jerzy Wa{\'s}niewski",
  title =        "Report on the {Second Workshop on Applied Parallel
                 Computing, PARA95}",
  journal =      j-SIGNUM,
  volume =       "30",
  number =       "4",
  pages =        "28--??",
  month =        oct,
  year =         "1995",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Wed Aug 14 07:49:37 MDT 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and T. Rowan and R. Wade",
  title =        "Software distribution using {Xnetlib}",
  journal =      j-TOMS,
  volume =       "21",
  number =       "1",
  pages =        "79--88",
  month =        mar,
  year =         "1995",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C7250L
                 (Non-bibliographic retrieval systems); C7210
                 (Information services and centres); C7250N (Front end
                 systems for online searching); C7250R (Information
                 retrieval techniques)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "communication network; computer; front end;
                 information retrieval systems; information service;
                 information services; Laboratory; large distributed
                 collection; mathematics computing; netlib; numerical
                 analysis; online front-ends; online searching; online
                 service; public domain; public-domain mathematical;
                 retrieve; socket-based communication; software;
                 software distribution; software libraries; software
                 library; software repository; software tool;
                 telecommunication; Tennessee Oak Ridge National; X
                 Window interface; Xnetlib",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application",

  author =       "Jack Dongarra and Tom Rowan and Reed Wade",
  title =        "Software Distribution using {XNETLIB}",
  journal =      j-TOMS,
  volume =       "21",
  number =       "1",
  pages =        "79--88",
  month =        mar,
  year =         "1995",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Wed Aug 14 07:57:30 1996",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-rfb,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "Netlib; software repositories",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "C.2.3 [Computer-Communication Networks]: Network
                 Operations --- public networks; D.2.2 [Software
                 Engineering]: Tools and Techniques --- software
                 libraries; user interfaces; D.2.7 [Software
                 Engineering]: Distribution and Maintenance ---
                 documentation; portability; G.1.0 [Numerical Analysis]:
                 General --- numerical algorithms; G.4 [Mathematics of
                 Computing]: Mathematical Software --- portability;
                 H.3.0 [Information Systems Applications]:
                 Communications Applications; H.3.3 [Information Storage
                 and Retrieval]: Information Search and Retrieval ---
                 search process; selection process; H.3.5 [Information
                 Storage and Retrieval]: Online Information Services ---
                 databank sharing; H.5.2 [Information Interfaces and
                 Presentation]: User Interfaces --- windowing systems;
                 K.6.3 [Management of Computing and Information
                 Systems]: Software Management --- software development;
                 software maintenance; software selection",

  author =       "Jack J. Dongarra and David W. Walker",
  title =        "Software libraries for linear algebra computations on
                 high performance computers",
  journal =      j-SIAM-REVIEW,
  volume =       "37",
  number =       "2",
  pages =        "151--180",
  month =        jun,
  year =         "1995",
  CODEN =        "SIREAD",
  DOI =          "",
  ISSN =         "0036-1445 (print), 1095-7200 (electronic)",
  ISSN-L =       "0036-1445",
  MRclass =      "65-04 (65F05 65Y05)",
  MRnumber =     "1 343 210, 96d:65004",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  URL =          ";
  abstract =     "This paper discusses the design of linear algebra
                 libraries for high performance computers. Particular
                 emphasis is placed on the development of scalable
                 algorithms for multiple instruction multiple data
                 (MIMD) distributed memory concurrent computers. A brief
                 description of the EISPACK, LINPACK, and LAPACK
                 libraries is given, followed by an outline of
                 ScaLAPACK, which is a distributed memory version of
                 LAPACK currently under development. The importance of
                 block-partitioned algorithms in reducing the frequency
                 of data movement between different levels of
                 hierarchical memory is stressed. The use of such
                 algorithms helps reduce the message startup costs on
                 distributed memory concurrent computers. Other key
                 ideas in our approach are the use of distributed
                 versions of the Level 2 and Level 3 basic linear
                 algebra subprograms (BLAS) as computational building
                 blocks, and the use of basic linear algebra
                 communication subprograms (BLACS) as communication
                 building blocks. Together the distributed BLAS and the
                 BLACS can be used to construct higher-level algorithms,
                 and hide many details of the parallelism from the
                 application developer. The block-cyclic data
                 distribution is described and adopted as a good way of
                 distributing block-partitioned matrices.
                 Block-partitioned versions of the Cholesky and LU
                 factorizations are presented, and optimization issues
                 associated with the implementation of the LU
                 factorization algorithm on distributed memory
                 concurrent computers are discussed, together with its
                 performance on the Intel Delta system. Finally,
                 approaches to the design of library interfaces are
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classcodes =   "C7310 (Mathematics computing); C4140 (Linear algebra);
                 C6110B (Software engineering techniques); C6150N
                 (Distributed systems software)",
  classification = "721.1; 722.4; 723.1; 723.2; 921.1; 921.5",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "SIAM Review",
  journal-URL =  "",
  journalabr =   "SIAM Rev",
  keywords =     "Algorithms; algorithms; Basic linear algebra
                 subprograms; Block cyclic data distribution; block-;
                 block-cyclic data distribution; block-partitioned
                 matrices; Cholesky; Computational methods; Computer
                 architecture; Computer software; computing; Data
                 transfer; Distributed memory concurrent computers;
                 distributed memory concurrent computers; distributed
                 memory systems; Factorization; factorizations; High
                 performance computers; Intel Delta system; Interfaces
                 (computer); library interfaces; Linear algebra; linear
                 algebra; linear algebra computations; LU factorization;
                 mathematics; Message startup costs; MIMD; Multiple
                 instruction multiple data; multiple instruction
                 multiple data; Optimization; parallel processing;
                 Parallel processing systems; partitioned algorithms;
                 Performance; scalable; ScaLAPACK; software libraries;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. J. Dongarra and H. W. Meuer and E. Strohmaier",
  title =        "{TOP500} Supercomputer Sites",
  journal =      j-SUPERCOMPUTER,
  volume =       "11",
  number =       "2--3",
  pages =        "133--163 (or 164--194??)",
  month =        jun,
  year =         "1995",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5440 (Multiprocessing systems); C7310 (Mathematics
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Supercomputer",
  keywords =     "computers; high-performance; high-performance
                 computers; LINPACK benchmark performance; mathematics
                 computing; measure; parallel machines; parallel
                 processing; performance; performance measure;
                 statistics; TOP500 supercomputer sites",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "P. Newton and J. Dongarra",
  title =        "Overview of {VPE}: a Visual Environment for
  crossref =     "IEEE:1995:FHC",
  pages =        "85--92",
  year =         "1995",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James S. Plank and Youngbae Kim and Jack J. Dongarra",
  title =        "Algorithm-Based Diskless Checkpointing for
                 Fault-Tolerant Matrix Operations",
  crossref =     "IEEE:1995:DPT",
  pages =        "351--360",
  year =         "1995",
  bibdate =      "Mon Aug 26 07:58:57 1996",
  bibsource =    "",
  URL =          ";
  abstract =     "This paper is an exploration of diskless
                 checkpointing for distributed scientific computations.
                 With the widespread use of the `Network Of Workstation'
                 (NOW) platform for distributed computing, long-running
                 scientific computations need to tolerate the changing
                 and often faulty nature of NOW environments. We present
                 high-performance implementations of several algorithms
                 for distributed scientific computing, including
                 Cholesky factorization, LU factorization, QR
                 factorization, and Preconditioned Conjugate Gradient.
                 These implementations are able to run on PVM networks
                 of at least N processors, and can complete with low
                 overhead as long as any N processors remain functional.
                 We discuss the details of how the algorithms are tuned
                 for fault-tolerance, and present the performance
                 results on a PVM network of SUN workstations, and on
                 the IBM SP2.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "TN, USA",
  classcodes =   "C6150N (Distributed systems software); C6110B
                 (Software engineering techniques); C4140 (Linear
                 algebra); C7300 (Natural sciences computing); C4130
                 (Interpolation and function approximation)",
  classification = "722.2; 722.4; 723.1",
  conference =   "Proceedings of the 25th International Symposium on
                 Fault-Tolerant Computing",
  conflocation = "Pasadena, CA, USA; 27-30 June 1995",
  conftitle =    "Twenty-Fifth International Symposium on Fault-Tolerant
                 Computing. Digest of Papers",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., TN, USA",
  journalabr =   "Dig Pap Int Symp Fault Tolerant Comput",
  keywords =     "algebra; Algorithm based diskless checkpointing;
                 algorithm-based diskless checkpointing; Algorithms;
                 Cholesky; Cholesky factorization; computations;
                 Computer networks; Computer workstations; conjugate
                 gradient methods; Distributed computer systems;
                 Distributed scientific computations; distributed
                 scientific computations; factorization; fault tolerant;
                 Fault tolerant computer systems; Fault tolerant matrix
                 operations; fault-tolerance; high-performance
                 implementations; IBM SP2; local area networks;
                 long-running scientific; low overhead; LU
                 factorization; matrix; matrix operations; natural
                 sciences computing; Network of workstation (NOW)
                 platform; Parallel processing systems; performance;
                 preconditioned conjugate gradient; Preconditioned
                 conjugate gradient; processors; PVM networks; QR
                 factorization; software fault; subroutines; SUN;
                 tolerance; workstation network platform; workstations",
  meetingaddress = "Pasadena, CA, USA",
  meetingdate =  "Jun 27--30 1995",
  meetingdate2 = "06/27--30/95",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "IEEE",
  sponsororg =   "IEEE Comput. Soc. Tech. Committee on Fault-Tolerant
                 Comput.; LAAS-CNRS, France; Univ. Illinois at
                 Urbana-Champaign; Univ. California at Los Angeles; Jet
                 Propulsion Lab.; IFIP WG 10.4",
  treatment =    "T Theoretical or Mathematical",

  author =       "R. Barrett and M. Berry and J. Dongarra and V.
                 Eijkhout and C. Romine",
  title =        "Algorithmic bombardment for the iterative solution of
                 linear systems: a poly-iterative approach",
  journal =      j-J-COMPUT-APPL-MATH,
  volume =       "74",
  number =       "1--2",
  pages =        "91--109",
  day =          "5",
  month =        "????",
  year =         "1996",
  CODEN =        "JCAMDI",
  DOI =          "",
  ISSN =         "0377-0427 (print), 1879-1778 (electronic)",
  ISSN-L =       "0377-0427",
  MRclass =      "65F10 (65N22 65Y05)",
  MRnumber =     "97j:65052",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "B0290H (Linear algebra); B0290F (Interpolation and
                 function approximation); C4140 (Linear algebra); C4130
                 (Interpolation and function approximation); C4240P
                 (Parallel programming and algorithm theory)",
  conflocation = "Austin, TX, USA; April 1995",
  conftitle =    "TICAM Symposium. Texas Institute for Computational and
                 Applied Mathematics",
  corpsource =   "Distributed Comput. Group, Los Alamos Nat. Lab., NM,
  fjournal =     "Journal of Computational and Applied Mathematics",
  journal-URL =  "",
  keywords =     "algorithmic bombardment; convergence; cost;
                 environment; global communications; indefinite;
                 iterative methods; iterative solution; linear systems;
                 matrix; matrix algebra; matrix properties; nonsymmetric
                 matrix; parallel algorithms; parallel environment;
                 poly-iterative approach; sequential computing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "L. Susan Blackford and Jack J. Dongarra and Jeremy {Du
                 Croz} and Sven Hammarling and Jerzy Wasniewski",
  title =        "A {Fortran 90} Interface for {LAPACK}",
  type =         "LAPACK Working Note",
  number =       "117",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        dec,
  year =         "1996",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-96-341, December 1996.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. S. Blackford and A. Cleary and J. Demmel and I.
                 Dhillon and J. Dongarra and S. Hammarling and A.
                 Petitet and H. Ren and K. Stanley and R. C. Whaley",
  title =        "Practical Experience in the Dangers of Heterogeneous
  type =         "LAPACK Working Note",
  number =       "112",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jul,
  year =         "1996",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-96-330, July 1996.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. S. Blackford and A. Cleary and J. Demmel and I.
                 Dhillon and J. Dongarra and S. Hammarling and A.
                 Petitet and H. Ren and K. Stanley and R. C. Whaley",
  title =        "Practical experience in the dangers of heterogeneous
  crossref =     "Wasniewski:1996:APC",
  pages =        "57--64",
  year =         "1996",
  bibdate =      "Tue Feb 26 08:49:09 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C6110B (Software
                 engineering techniques); C6110P (Parallel programming);
                 C6150N (Distributed systems software); C6115
                 (Programming support)",
  conflocation = "Lyngby, Denmark; 18-21 Aug. 1996",
  conftitle =    "Applied Parallel Computing. Industrial Computation and
                 Optimization. Third International Workshop, PARA'96.
  corpsource =   "Tennessee Univ., Knoxville, TN, USA",
  keywords =     "distributed memory systems; floating point arithmetic;
                 heterogeneous computing; libraries; mathematics
                 computing; numerical library software; parallel
                 algorithms; ScaLAPACK; software; software portability;
                 software reliability; software robustness",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; G General Review",

  author =       "Laura Susan Blackford and J. Choi and A. Cleary and A.
                 Petitet and R. C. Whaley and J. Demmel and I. Dhillon
                 and K. Stanley and J. Dongarra and S. Hammarling and G.
                 Henry and D. Walker",
  title =        "{ScaLAPACK}: a Portable Linear Algebra Library for
                 Distributed Memory Computers --- Design Issues and
  crossref =     "ACM:1996:SCP",
  pages =        "5--5",
  year =         "1996",
  bibdate =      "Mon Mar 23 12:31:18 1998",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. Boisvert and S. Browne and J. Dongarra and E.
  editor =       "Nabil R. Adam and B. K. Bhargava and M. Halem and Y.
  booktitle =    "Digital libraries: research and technology advances:
                 {ADL '95} Forum, {McLean}, Virginia, {USA}, May 15--17,
                 1995: selected papers",
  title =        "Digital software and data repositories for support of
                 scientific computing",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  bookpages =    "xiii + 290",
  pages =        "103--114",
  year =         "1996",
  ISBN =         "3-540-61410-9",
  ISBN-13 =      "978-3-540-61410-4",
  LCCN =         "QA267.A1 L43 no.1082; Z699 .D532 1996",
  bibdate =      "Tue Feb 26 06:06:39 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7300 (Natural sciences computing); C7210L (Library
                 automation); C6130D (Document processing techniques);
                 C7250 (Information storage and retrieval); C6110B
                 (Software engineering techniques)",
  conflocation = "McLean, VA, USA; 15-17 May 1995",
  conftitle =    "Proceedings of a Forum on Research and Technology
                 Advances in Digital Libraries",
  corpsource =   "Nat. Inst. of Stand. and Technol., USA",
  keywords =     "CNRI Digital Library project; data repositories;
                 digital libraries; digital software; document handling;
                 documents; GAMS Virtual; information; information
                 retrieval; library automation; National HPCC Software
                 Exchange; natural sciences computing; Netlib;
                 notification; online access; online software
                 repositories; remote program execution; Repository;
                 scientific computing; software change; software
                 libraries; software reusability; storage",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "NASA",
  treatment =    "G General Review",

  author =       "Shirley Browne and Jack Dongarra and Tom Rowan",
  editor =       "????",
  booktitle =    "Proceedings of the Scalable Parallel Libraries
                 Conference {III} {SPLC96}, Mississippi State
                 University, October 1996",
  title =        "Evaluation of High-Performance Computing Software",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "??--??",
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "S. Browne and H. Casanova and J. Dongarra",
  title =        "Providing access to high performance computing
  crossref =     "Wasniewski:1996:APC",
  pages =        "123--133",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C7250 (Information
                 storage and retrieval); C6150N (Distributed systems
  conflocation = "Lyngby, Denmark; 18-21 Aug. 1996",
  conftitle =    "Applied Parallel Computing. Industrial Computation and
                 Optimization. Third International Workshop, PARA'96.
  corpsource =   "Tennessee Univ., Knoxville, TN, USA",
  keywords =     "access; client-server application; client-server
                 systems; computational science; domain-specific
                 repositories; high performance computing technologies;
                 information retrieval systems; information storage;
                 mathematics computing; National HPCC; NetSolve; problem
                 solving; project; Software Exchange",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "A Application; P Practical",

  author =       "S. Browne and J. Dongarra and G. Fox and K. Hawick and
                 T. Rowan",
  title =        "Software Reuse in High-Performance Computing",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Jack Dongarra",
  title =        "{NetSolve}: a Network Server for Solving Computational
                 Science Problems",
  type =         "Technical report",
  number =       "CS-96-328",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        may,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Jack Dongarra",
  title =        "{NetSolve}: a Network Server for Solving Computational
                 Science Problems",
  crossref =     "ACM:1996:SCP",
  pages =        "40--40",
  year =         "1996",
  bibdate =      "Mon Mar 23 12:31:18 1998",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jaeyoung Choi and J. J. Dongarra and L. S. Ostrouchov
                 and A. P. Petitet and D. W. Walker and R. C.
  title =        "Design and implementation of the {ScaLAPACK} {$ L U
                 $}, {$ Q R $}, and {Cholesky} factorization routines",
  journal =      j-SCI-PROG,
  volume =       "5",
  number =       "3",
  pages =        "173--184",
  month =        "Fall",
  year =         "1996",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "C4140 (Linear algebra); C6110B (Software engineering
                 techniques); C6115 (Programming support); C5440
                 (Multiprocessing systems); C6150N (Distributed systems
                 software); C6110P (Parallel programming)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  keywords =     "BLACS; BLAS; block; communication; cyclic data
                 distribution; de facto standard kernels; dense linear
                 equation system; distributed memory systems;
                 engineering; factorization routine; Intel; Intel
                 Touchstone Delta; Intel Paragon System; iPSC/860;
                 linear algebra; matrix; message passing; operations;
                 parallel implementations; parallel machines; parallel
                 programming; parallelized sequential LAPACK; PBLAS;
                 performance; performance evaluation; scalability;
                 ScaLAPACK Cholesky factorization routine; ScaLAPACK
                 library; ScaLAPACK LU factorization routine; ScaLAPACK
                 QR; software; software libraries; software packages;
                 vector operations",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jaeyoung Choi and Jack J. Dongarra and David W.
  title =        "{PB-BLAS}: a set of parallel block basic linear
                 algebra subprograms",
  journal =      j-CPE,
  volume =       "8",
  number =       "7",
  pages =        "517--535",
  month =        sep,
  year =         "1996",
  CODEN =        "CPEXEI",
  DOI =          "<517::AID-CPE226>3.0.CO;2-W",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Tue Sep 7 06:06:26 MDT 1999",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6110P (Parallel programming); C4140 (Linear algebra);
                 C6150N (Distributed systems software)",
  corpsource =   "Sch. of Comput., Soongsil Univ., Seoul, South Korea",
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  keywords =     "basic linear algebra subprograms; block-cyclic data
                 distribution; ease-of-; LAPACK; linear algebra;
                 parallel block; parallel programming; PB-BLAS;
                 portability; ScaLAPACK; software package; software
                 packages; use",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "Jaeyoung Choi and J. Dongarra and S. Ostrouchov and A.
                 Petitet and D. Walker and R. C. Whaley",
  title =        "A proposal for a set of {Parallel Basic Linear Algebra
  crossref =     "Dongarra:1996:APC",
  pages =        "107--114",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C6110P (Parallel
                 programming); C4140 (Linear algebra)",
  conflocation = "Lyngby, Denmark; 21-24 Aug. 1995",
  conftitle =    "Applied Parallel Computing. Computations in Physics,
                 Chemistry and Engineering Science",
  corpsource =   "Sch. of Comput., Soongsil Univ., Seoul, South Korea",
  keywords =     "basic linear algebra; distributed memory; linear
                 algebra; linear algebra subprograms; parallel; parallel
                 programming; PBLAS; software libraries",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. Choi and J. Demmel and I. Dhillon and J. Dongarra
                 and S. Ostrouchov and A. Petitet and K. Stanley and D.
                 Walker and R. C. Whaley",
  title =        "{ScaLAPACK}: a portable linear algebra library for
                 distributed memory computers --- design issues and
  journal =      j-COMP-PHYS-COMM,
  volume =       "97",
  number =       "1--2",
  pages =        "1--15",
  day =          "2",
  month =        aug,
  year =         "1996",
  CODEN =        "CPHCBZ",
  DOI =          "",
  ISSN =         "0010-4655 (print), 1879-2944 (electronic)",
  ISSN-L =       "0010-4655",
  bibdate =      "Mon Feb 13 21:30:07 MST 2012",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C4140 (Linear algebra);
                 C4240P (Parallel programming and algorithm theory);
                 C6110P (Parallel programming); C6150N (Distributed
                 systems software); C6110B (Software engineering
                 techniques); C6115 (Programming support)",
  conflocation = "Skalsky dvur, Czech Republic; 5-14 Sept. 1995",
  conftitle =    "High-Performance Computing in Science. 10th European
                 Summer School on Computing Techniques in Physics",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Computer Physics Communications",
  journal-URL =  "",
  keywords =     "computations; computers; Distributed Linear Algebra
                 Machine; distributed memory; distributed memory
                 systems; linear algebra; mathematical software; message
                 passing; message passing interfaces; parallel; parallel
                 algorithms; performance evaluation; portable linear
                 algebra library; programmability; reusability;
                 ScaLAPACK; software; software libraries; software
                 portability; symbol manipulation; user-friendly
                 distributed systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "Eur. Phys. Soc.; German Phys. Soc.; et al",
  treatment =    "P Practical",

  author =       "J. Choi and J. Demmel and I. Dhillon and J. Dongarra
                 and S. Ostrouchov and A. Petitet and K. Stanley and D.
                 Walker and R. C. Whaley",
  title =        "{ScaLAPACK}: a portable linear algebra library for
                 distributed memory computers. Design issues and
  crossref =     "Dongarra:1996:APC",
  pages =        "95--106",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C4140 (Linear algebra);
                 C6115 (Programming support)",
  conflocation = "Lyngby, Denmark; 21-24 Aug. 1995",
  conftitle =    "Applied Parallel Computing. Computations in Physics,
                 Chemistry and Engineering Science",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  keywords =     "computing; distributed memory computers; distributed
                 memory systems; distributed systems; heterogeneous
                 processors; linear algebra; linear algebra library;
                 mathematical; mathematics; portable linear algebra
                 library; ScaLAPACK; software; software libraries;
                 software portability",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "Jim Demmel and Jack Dongarra and Sven Hammarling and
                 Susan Ostrouchov and Ken Stanley",
  title =        "The Dangers of Heterogeneous Network Computing:
                 Heterogeneous Networks Considered Harmful",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        mar,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Demmel and J. Dongarra and S. Hammarling and S.
  title =        "The Dangers of Heterogeneous Network Computing:
                 Heterogeneous Networks Considered Harmful",
  crossref =     "IEEE:1996:HCW",
  pages =        "64--71",
  year =         "1996",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and B. Straughan and D. W. Walker",
  title =        "{Chebyshev} {tau-QZ} algorithm methods for calculating
                 spectra of hydrodynamic stability problems",
  journal =      j-APPL-NUM-MATH,
  volume =       "22",
  number =       "4",
  pages =        "399--434",
  month =        dec,
  year =         "1996",
  CODEN =        "ANMAEL",
  DOI =          "",
  ISSN =         "0168-9274 (print), 1873-5460 (electronic)",
  ISSN-L =       "0168-9274",
  MRclass =      "76M25 (65L06 76E99 76V05)",
  MRnumber =     "97k:76085",
  bibdate =      "Thu Sep 16 09:34:19 1999",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classcodes =   "A4720 (Hydrodynamic stability and instability); A4715
                 (Laminar flows); A0210 (Algebra, set theory, and graph
                 theory); A4715F (Stability of laminar flows); C4130
                 (Interpolation and function approximation); C4140
                 (Linear algebra)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Applied Numerical Mathematics: Transactions of IMACS",
  journal-URL =  "",
  keywords =     "Chebyshev; Chebyshev approximation; Chebyshev
                 representation; Chebyshev tau method; Couette; Couette
                 flow; eigenfunctions; eigenvalue; eigenvalues and;
                 flow; flow instability; hydrodynamic stability;
                 hydrodynamics; multilayer flows; Orr-; pipe flow;
                 Poiseuille flow; polynomials; pressure gradient driven
                 circular pipe flow; problems; QZ algorithm; Sommerfeld
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "T Theoretical or Mathematical",

  author =       "J. J. Dongarra and H. W. Meuer and H. D. Simon and E.
  title =        "Changing Technologies of {HPC}",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1067",
  pages =        "875--879",
  year =         "1996",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Wed Aug 14 09:38:08 MDT 1996",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  keywords =     "boards; computer facilities; computing nodes; High
                 Performance Computing; supercomputer sites;
                 technological forecasting; workstation",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "G General Review",

  author =       "Jack Dongarra and Jerzy Wa{\'s}niewski",
  title =        "{Denmark} hosts {Workshop on Applied Parallel
                 Computing} ({PARA96})",
  journal =      j-SIGNUM,
  volume =       "31",
  number =       "3",
  pages =        "28--??",
  month =        "????",
  year =         "1996",
  CODEN =        "SNEWD6",
  ISSN =         "0163-5778 (print), 1558-0237 (electronic)",
  ISSN-L =       "0163-5778",
  bibdate =      "Tue Oct 29 05:58:33 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGNUM Newsletter",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Future Linear-Algebra Libraries",
  journal =      j-IEEE-COMPUT-SCI-ENG,
  volume =       "3",
  number =       "2",
  pages =        "38--40",
  month =        "Summer",
  year =         "1996",
  CODEN =        "ISCEE4",
  DOI =          "",
  ISSN =         "1070-9924 (print), 1558-190X (electronic)",
  ISSN-L =       "1070-9924",
  bibdate =      "Sat Jan 9 08:57:23 MST 1999",
  bibsource =    "Compendex database;
  URL =          ";
  abstract =     "The ultimate development of fully mature, parallel
                 scalable libraries will necessarily depend on
                 breakthroughs in many supporting technologies. Scalable
                 library development cannot wait, however, until all the
                 enabling technologies are in place for two reasons: The
                 need for such libraries for existing and near-term
                 parallel architectures is immediate, and progress in
                 all the supporting technologies depends on feedback
                 from concurrent efforts in library development. Four
                 major research issues that need to be addressed in
                 developing parallel scalable linear-algebra libraries
                 are identified; inadequate user-library interface,
                 necessity of object-oriented programming for developing
                 portable libraries, the importance of work on
                 algorithms, and the lack of language standards.",
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classcodes =   "C7310 (Mathematics computing); C4140 (Linear algebra);
                 C6110B (Software engineering techniques); C6110P
                 (Parallel programming)",
  classification = "722.2; 722.3; 722.4; 723.1; 723.2; 921.1",
  corpsource =   "Tennessee Univ., Knoxville, TN, USA",
  fjournal =     "IEEE Computational Science \& Engineering",
  journal-URL =  "",
  journalabr =   "IEEE Comput Sci Eng",
  keywords =     "Algorithms; Computer architecture; Computer networks;
                 Computer software portability; Computer systems
                 programming; Computer workstations; Data structures;
                 development; enabling technologies; future; Graphical
                 user interfaces; Graphical workstations; library;
                 Linear algebra; linear algebra; linear algebra
                 libraries; mathematics computing; parallel
                 architectures; Parallel processing systems; parallel
                 programming; Parallel scalable libraries; parallel
                 scalable libraries; Problem solving; reusability;
                 software; Software libraries; software libraries;
                 software portability; Standards; Subroutines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Jack Dongarra and Horst D. Simon",
  title =        "High Performance Computing in the {U.S.} in 1995 ---
                 An Analysis on the Basis of the {TOP500} List",
  type =         "Technical report",
  number =       "CS-96-318",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and H. D. Simon",
  title =        "High Performance Computing in the {U.S.} in 1995 ---
                 An Analysis on the Basis of the {TOP500} List",
  journal =      j-SUPERCOMPUTER,
  volume =       "12",
  number =       "1",
  pages =        "16--22",
  month =        jan,
  year =         "1996",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C0310B (Computer facilities)",
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "Supercomputer",
  keywords =     "computer facilities; computer installation;
                 installations; supercomputer; supercomputer sites;
                 supercomputers; TOP500 list; U.S.; world market",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "G General Review",

  author =       "J. Dongarra and A. Lumsdaine and R. Pozo and K.
  title =        "{IML++ v. 1.2}: Iterative Methods Library Reference
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Sven Hammarling and David W.
  title =        "Key Concepts For Parallel Out-Of-Core {$ L U $}
  type =         "LAPACK Working Note",
  number =       "110",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1996",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-96-324, April 1996.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and J. {Du Croz} and S. Hammarling and
                 J. Wa{\'s}niewski and A. Zemla",
  title =        "{LAPACK} for {Fortran 90}",
  journal =      j-APPL-MATH-COMP-SCI,
  volume =       "6",
  number =       "2",
  pages =        "375--382",
  month =        "????",
  year =         "1996",
  CODEN =        "AMCPE9",
  ISSN =         "0867-857X",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C6140D (High level
                 languages); C6180 (User interfaces); C6150E (General
                 utility programs); C4140 (Linear algebra)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Applied Mathematics and Computer Science",
  keywords =     "application program interfaces; arrays; assumed-shape;
                 code; code rewriting; computational routines;
                 computing; driver; FORTRAN; Fortran 77; Fortran 90
                 jackets; generic interfaces; LAPACK; linear equations;
                 mathematics; matrix; matrix algebra; optional
                 arguments; performance; persistence; routines; user
                 interface; user interfaces",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and J. {Du Croz} and S. Hammarling and
                 J. Wa{\'s}niewski and A. Zemla",
  title =        "{LAPACK} for {Fortran 90} compiler",
  crossref =     "Liddell:1996:HCN",
  pages =        "826--833",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6150C (Compilers, interpreters and other processors);
                 C6110P (Parallel programming); C6140D (High level
  conflocation = "Brussels, Belgium; 15-19 April 1996",
  conftitle =    "High-Performance Computing and Networking.
                 International Conference and Exhibition HPCN Europe
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  keywords =     "FORTRAN; FORTRAN 90 compiler; Fortran 90 interface;
                 interface; LAPACK; parallel programming; parallelising
                 compilers; user-",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. Dongarra and R. Pozo and D. Walker",
  title =        "{LAPACK++ V. 1.0}: High Performance Linear Algebra
                 Users' Guide",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Tom Dunigan",
  title =        "Message-Passing Performance of Various Computers",
  type =         "Technical report",
  number =       "CS-95-299",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1996",
  bibdate =      "Tue Feb 26 08:48:32 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Steve W. Otto and Marc Snir and
                 David Walker",
  title =        "A message passing standard for {MPP} and
  journal =      j-CACM,
  volume =       "39",
  number =       "7",
  pages =        "84--90",
  month =        jul,
  year =         "1996",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "Compendex database;
  abstract =     "The Message Passing Interface (MPI) is a portable
                 message-passing standard that facilitates development
                 of parallel applications and libraries. MPI has been
                 developed over a 12-month period in 1993 to 1994 of
                 intensive meetings involving more than 80 people from
                 approximately 40 organizations, mainly from the U.S.
                 and Europe. Programming in MPI is straightforward and
                 similar to programming with other message-passing
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classcodes =   "C6150N (Distributed systems software); C5440
                 (Multiprocessing systems); C6110P (Parallel
  classification = "716.1; 722.2; 722.3; 722.4; 723.1; 902.2",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Communications of the ACM",
  journal-URL =  "",
  journalabr =   "Commun ACM",
  keywords =     "Application programming interface; C (programming
                 language); collective communication operations;
                 Communication library routines; communication library
                 routines; communication ports; Computer networks;
                 Computer software; Computer systems programming;
                 Computer workstations; Concurrency control; Concurrent
                 programs; concurrent programs; Data communication
                 systems; distributed memory multicomputers; FORTRAN
                 (programming language); Interfaces (computer);
                 Massively parallel processing; massively parallel
                 processing; message passing; Message passing interface;
                 message passing paradigm; Message passing programs;
                 Message passing standard; message passing standard; MPI
                 standard; MPP machines; multiprocessors; Networks of
                 workstations; NOWs; parallel machines; Parallel
                 processing systems; parallel programming; persistent;
                 Point to point communications; Program compilers;
                 scoping mechanisms; shared memory; software standards;
                 Standards; Subroutines; telecommunication standards;
                 user defined data types; workstations",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and H. W. Meuer and E. Strohmaier",
  title =        "Preface",
  journal =      j-SUPERCOMPUTER,
  volume =       "12",
  number =       "1",
  pages =        "4--5",
  month =        "????",
  year =         "1996",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputer",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and J. {Du Croz} and S. Hammarling and
                 J. Wa{\'s}niewski and A. Zemla",
  title =        "A proposal for a {Fortran 90} interface for {LAPACK}",
  crossref =     "Dongarra:1996:APC",
  pages =        "158--165",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C4140 (Linear algebra);
                 C6140D (High level languages); C6180 (User
                 interfaces)",
  conflocation = "Lyngby, Denmark; 21-24 Aug. 1995",
  conftitle =    "Applied Parallel Computing. Computations in Physics,
                 Chemistry and Engineering Science",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "FORTRAN; Fortran 90 interface; LAPACK; LAPACK code;
                 linear algebra; mathematics computing; packages;
                 software; user interfaces; user-interface",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical; T Theoretical or Mathematical",

  author =       "J. J. Dongarra and T. Hey and E. Strohmaier",
  title =        "{PARKBENCH}: methodology, relations and results",
  crossref =     "Liddell:1996:HCN",
  pages =        "770--777",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6110P (Parallel programming); C6150N (Distributed
                 systems software); C6150G (Diagnostic, testing,
                 debugging and evaluating systems)",
  conflocation = "Brussels, Belgium; 15-19 April 1996",
  conftitle =    "High-Performance Computing and Networking.
                 International Conference and Exhibition HPCN Europe
                 1996. Proceedings",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "computer benchmarking; message passing standards;
                 parallel benchmarks; parallel programming; PARKBENCH;
                 performance comparison; software performance
                 evaluation; standards",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. J. Dongarra and T. Hey and E. Strohmaier",
  title =        "Selected results from the {PARKBENCH} benchmark",
  crossref =     "Bouge:1996:EPP",
  volume =       "2",
  pages =        "251--254",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C5220P (Parallel architecture); C5470 (Performance
                 evaluation and testing); C6150G (Diagnostic, testing,
                 debugging and evaluating systems)",
  conflocation = "Lyon, France; 26-29 Aug. 1996",
  conftitle =    "Proceedings of European Conference on Parallel
                 Processing EURO-PAR '96",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "computer testing; evaluation; hierarchical; MPI;
                 parallel architectures; parallel benchmarks; PARKBENCH
                 benchmark; performance; PVM; suite",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. Dongarra and A. Petitet",
  title =        "{ScaLAPACK} tutorial",
  crossref =     "Dongarra:1996:APC",
  pages =        "166--176",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C7310 (Mathematics computing); C4140 (Linear algebra);
                 C6115 (Programming support)",
  conflocation = "Lyngby, Denmark; 21-24 Aug. 1995",
  conftitle =    "Applied Parallel Computing. Computations in Physics,
                 Chemistry and Engineering Science",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "Basic Linear Algebra Subprograms; block-partitioned
                 algorithms; distributed memory; LAPACK library; linear
                 algebra; mathematical libraries; mathematics computing;
                 Parallel Basic Linear Algebra Subprograms; ScaLAPACK;
                 software libraries; user-friendly distributed systems;
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "J. Dongarra and L. S. Blackford",
  title =        "{ScaLAPACK} Tutorial",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1184",
  pages =        "204--215",
  year =         "1996",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Aug 22 11:59:49 MDT 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Hans Meuer and Erich Strohmaier",
  title =        "{Top500} Report",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        nov,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and H. W. Meuer and E. Strohmaier",
  title =        "{TOP500} supercomputer sites",
  journal =      j-SUPERCOMPUTER,
  volume =       "12",
  number =       "1",
  pages =        "91--120",
  month =        jan,
  year =         "1996",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C0310B (Computer facilities); C5420 (Mainframes and
                 minicomputers); C5440 (Multiprocessing systems)",
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "Supercomputer",
  keywords =     "computer centre; computer centres; computer
                 facilities; computer facility; high-performance
                 computer; LINPACK benchmark performance; machines;
                 mainframes; most powerful computer; parallel; parallel
                 computer; statistics; supercomputer installation;
                 supercomputer site; top 500 sites; TOP500; world
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham Fagg and Jack Dongarra",
  title =        "{PVMPI}: An Integration of {PVM} and {MPI} Systems",
  journal =      "Calculateurs Parall{\`e}les",
  volume =       "8",
  number =       "2",
  pages =        "151--166",
  year =         "1996",
  CODEN =        "????",
  ISSN =         "1260-3198",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. E. Fagg and K. S. London and J. J. Dongarra",
  title =        "Taskers and general resource managers: {PVM}
                 supporting {DCE} process management",
  crossref =     "Bode:1996:PVM",
  pages =        "180--187",
  year =         "1996",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6150N (Distributed systems software); C7430 (Computer
                 engineering); C6150E (General utility programs)",
  conflocation = "Munich, Germany; 7-9 Oct. 1996",
  conftitle =    "Parallel Virtual Machine - EuroPVM '96. Third European
                 PVM Conference. Proceedings",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "allocation schemes; application program interfaces;
                 DCE process; distributed algorithms; distributed
                 computing environments; dynamic meta-computing
                 environments; general resource managers; management;
                 Message; message passing; MPI; MPIRUN systems;
                 operations; Parallel Virtual Machine; Passing
                 Interface; processor scheduling; PVM 3.4 release; PVM
                 internal; PVMPI project; resource allocation;
                 schedulers; standardised plug-in; taskers;
                 user-controlled flexibility; virtual machines",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Youngbae Kim and James S. Plank and Jack J. Dongarra",
  title =        "Fault-Tolerant Matrix Operations Using Checksum and
                 Reverse Computation",
  crossref =     "IEEE:1996:FSS",
  pages =        "??--??",
  year =         "1996",
  bibdate =      "Tue Dec 10 09:25:56 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James S. Plank and Youngbae Kim and Jack Dongarra",
  title =        "Fault Tolerant Matrix Operations for Networks of
                 Workstations Using Diskless Checkpointing",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        feb,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Youngbae Kim and J. S. Plank and J. J. Dongarra",
  booktitle =    "Frontiers'96: proceedings / the Sixth Symposium on the
                 Frontiers of Massively Parallel Computing, October
                 27--31, 1996, Annapolis, Maryland",
  title =        "Fault tolerant matrix operations using checksum and
                 reverse computation",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  bookpages =    "xiv + 372",
  pages =        "70--77",
  year =         "1996",
  ISBN =         "0-8186-7551-9",
  ISBN-13 =      "978-0-8186-7551-5",
  LCCN =         "QA76.58 .S95 1996",
  bibdate =      "Tue Feb 26 06:07:46 2002",
  bibsource =    "",
  note =         "IEEE catalog number 96TB100062.",
  acknowledgement = ack-nhfb,
  classcodes =   "C5470 (Performance evaluation and testing); C4140
                 (Linear algebra); C5230 (Digital arithmetic methods)",
  conflocation = "Annapolis, MD, USA; 27-31 Oct. 1996",
  conftitle =    "Proceedings of 6th Symposium on the Frontiers of
                 Massively Parallel Computation (Frontiers '96)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
                 USA",
  keywords =     "algebra; checkpointing; checksum; Cholesky
                 factorization; computation; digital arithmetic;
                 factorization; fault tolerant computing; fault tolerant
                 matrix operations; Hessenberg reduction;
                 high-performance matrix operations; LU factorization;
                 matrix; matrix multiplication; multiplication; QR;
                 recovery; reverse; roundoff errors",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsororg =   "IEEE Comput. Soc.; NASA Goddard Space Flight Center;
  treatment =    "P Practical",

  author =       "Marc Snir and Steve W. Otto and Steven Huss-Lederman
                 and David W. Walker and Jack Dongarra",
  title =        "{MPI}: the complete reference",
  publisher =    pub-MIT,
  address =      pub-MIT:adr,
  pages =        "xii + 336",
  year =         "1996",
  ISBN =         "0-262-69184-1",
  ISBN-13 =      "978-0-262-69184-0",
  LCCN =         "QA76.642.M65 1996",
  bibdate =      "Fri Jan 31 07:16:14 1997",
  bibsource =    "",
  price =        "US\$27.50",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aad J. van der Steen and Jack Dongarra",
  title =        "Overview of Recent Supercomputers",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1996",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aad J. van der Steen and Jack Dongarra",
  title =        "Overview of Recent Supercomputers",
  journal =      "NHSE Review",
  volume =       "1",
  number =       "1",
  pages =        "??--??",
  day =          "10",
  month =        feb,
  year =         "1996",
  bibdate =      "Wed Jan 14 05:57:08 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  keywords =     "National HPCC Software Exchange (NHSE); Rice
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. W. Walker and J. J. Dongarra",
  title =        "{MPI}: a standard Message Passing Interface",
  journal =      j-SUPERCOMPUTER,
  volume =       "12",
  number =       "1",
  pages =        "56--68",
  month =        jan,
  year =         "1996",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Sat Mar 22 15:39:54 MST 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classcodes =   "C6155 (Computer communications software); C5640
                 (Protocols); C6150N (Distributed systems software)",
  corpsource =   "Math. Sci. Sect., Oak Ridge Nat. Lab., TN, USA",
  fjournal =     "Supercomputer",
  keywords =     "collective communication; computer interface; computer
                 interfaces; computer standard; distributed processing;
                 Europe; interface; massively parallel computer;
                 message; message passing; MPI; network; network
                 interface; network interfaces; parallel processing;
                 passing; point-to-point; protocols; routine; software
                 standards; standards; United States; workstation",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  treatment =    "P Practical",

  author =       "Z. Bai and J. Demmel and J. Dongarra and A. Petitet
                 and H. Robinson and K. Stanley",
  title =        "The Spectral Decomposition of Nonsymmetric Matrices on
                 Distributed Memory Parallel Computers",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "18",
  number =       "5",
  pages =        "1446--1461",
  month =        sep,
  year =         "1997",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F05 (65F30 65Y05)",
  MRnumber =     "98d:65027",
  bibdate =      "Tue Feb 26 10:04:07 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Z. Bai and D. Day and J. Demmel and J. Dongarra",
  title =        "A Test Matrix Collection for Non-{Hermitian}
                 Eigenvalue Problems",
  type =         "LAPACK Working Note",
  number =       "123 and CS-97-355",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        mar,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "LAPACK Working Note 123. UT-CS-97-355, March 1997.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. S. Blackford and A. Cleary and A. Petitet and R. C.
                 Whaley and J. Demmel and I. Dhillon and H. Ren and K.
                 Stanley and J. Dongarra and S. Hammarling",
  title =        "Practical Experience in the Numerical Dangers of
                 Heterogeneous Computing",
  journal =      j-TOMS,
  volume =       "23",
  number =       "2",
  pages =        "133--147",
  month =        jun,
  year =         "1997",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  abstract =     "Special challenges exist in writing reliable numerical
                 library software for heterogeneous computing
                 environments. Although a lot of software for
                 distributed-memory parallel computers has been written,
                 porting this software to a network of workstations
                 requires careful consideration. The symptoms of
                 heterogeneous computing failures can range from
                 erroneous results without warning to deadlock. Some of
                 the problems are straightforward to solve, but for
                 others the solutions are not so obvious, or incur an
                 unacceptable overhead. Making software robust on
                 heterogeneous systems often requires additional
                 communication. We describe and illustrate the problems
                 encountered during the development of ScaLAPACK and the
                 NAG Numerical PVM Library. Where possible, we suggest
                 ways to avoid potential pitfalls, or if that is not
                 possible, we recommend that the software not be used on
                 heterogeneous networks.",
  acknowledgement = ack-rfb # " and " # ack-kr,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "distributed-memory systems, floating-point arithmetic,
                 heterogeneous processor networks, message passing,
                 numerical software, reliability",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "{\bf D.1.3} Software, PROGRAMMING TECHNIQUES,
                 Concurrent Programming, Distributed programming. {\bf
                 G.1.0} Mathematics of Computing, NUMERICAL ANALYSIS,
                 General, Computer arithmetic. {\bf G.1.0} Mathematics
                 of Computing, NUMERICAL ANALYSIS, General, Parallel
                 algorithms.",

  author =       "L. S. Blackford and J. Choi and A. Cleary and E.
                 D'Azevedo and J. Demmel and I. Dhillon and J. Dongarra
                 and S. Hammarling and G. Henry and A. Petitet and K.
                 Stanley and D. Walker and R. C. Whaley",
  booktitle =    "Proceedings of the Eighth {SIAM} Conference on
                 Parallel Processing for Scientific Computing
                 (Minneapolis, {MN, 1997)}",
  title =        "{ScaLAPACK}: a linear algebra library for
                 message-passing computers",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "15 (electronic)",
  year =         "1997",
  MRclass =      "65-04",
  MRnumber =     "1 602 524",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. S. Blackford and J. Choi and A. Cleary and E.
                 D'Azevedo and J. Demmel and I. Dhillon and J. Dongarra
                 and S. Hammarling and G. Henry and A. Petitet and K.
                 Stanley and D. Walker and R. C. Whaley",
  title =        "{ScaLAPACK} Users' Guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xxvi + 325",
  year =         "1997",
  ISBN =         "0-89871-400-1 (paperback), 0-89871-401-X (CD-ROM),
                 0-89871-397-8 (set)",
  ISBN-13 =      "978-0-89871-400-5 (paperback), 978-0-89871-401-2
                 (CD-ROM), 978-0-89871-397-8 (set)",
  LCCN =         "QA185.D37 S33 1997",
  bibdate =      "Sun Jun 19 12:21:50 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Bode and J. Dongarra",
  title =        "Performance Evaluation and Prediction",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1300",
  pages =        "969--970",
  year =         "1997",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Apr 28 08:51:33 MDT 1998",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ronald Boisvert and Shirley V. Browne and Jack J.
                 Dongarra and Eric Grosse and Bruce Miller",
  title =        "Interactive and Dynamic Content in Software
                 Repositories",
  type =         "Technical report",
  number =       "UT-CS-97-351",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        feb,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ronald F. Boisvert and Roldan Pozo and Karin Remington
                 and Richard F. Barrett and Jack J. Dongarra",
  title =        "Matrix Market: {A} {Web} Resource for Test Matrix
                 Collections",
  crossref =     "Boisvert:1997:QNS",
  pages =        "125--137",
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Pierre-Yves Calland and Jack Dongarra and Yves
                 Robert",
  title =        "Tiling With Limited Resources",
  type =         "Technical report",
  number =       "CS-97-350",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        feb,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "P. Calland and J. Dongarra and Y. Robert",
  title =        "Tiling with Limited Resources",
  crossref =     "Thiele:1997:IIC",
  pages =        "229--238",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Jack Dongarra and David M. Doolin",
  title =        "{Java} access to numerical libraries",
  journal =      j-CPE,
  volume =       "9",
  number =       "11",
  pages =        "1279--1291",
  month =        nov,
  year =         "1997",
  CODEN =        "CPEXEI",
  DOI =          "<1279::AID-CPE339>3.0.CO;2-E",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Tue Sep 7 06:06:35 MDT 1999",
  bibsource =    "",
  note =         "Special Issue: Java for computational science and
                 engineering --- simulation and modeling II.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. Dongarra",
  title =        "Network Enabled Solvers for Scientific Computing Using
                 the {NetSolve} System",
  crossref =     "Goscinski:1997:ICA",
  pages =        "17--33",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxpages =      "17--34",

  author =       "Henri Casanova and Jack Dongarra",
  title =        "{NetSolve}: a Network-Enabled Server for Solving
                 Computational Science Problems",
  journal =      j-IJSAHPC,
  volume =       "11",
  number =       "3",
  pages =        "212--223",
  month =        "Fall",
  year =         "1997",
  CODEN =        "IJSCFG",
  DOI =          "",
  ISSN =         "1078-3482",
  bibdate =      "Wed Jul 23 11:38:50 1997",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Supercomputer Applications
                 and High Performance Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. Dongarra",
  title =        "{NetSolve}: a Network Server for Solving Computational
                 Science Problems",
  crossref =     "Anonymous:1997:VPC",
  volume =       "11",
  number =       "1",
  pages =        "24--31",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. Dongarra",
  title =        "The Use of {Java} in the {NetSolve} Project",
  crossref =     "Sydow:1997:IWC",
  volume =       "4",
  pages =        "791--796",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Cleary and J. Dongarra",
  title =        "Implementation in {ScaLAPACK} of Divide-and-Conquer
                 Algorithms for Banded and Tridiagonal Linear Systems",
  type =         "LAPACK Working Note",
  number =       "125 and CS-97-358",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-97-358, April 1997.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ed F. D'Azevedo and J. Dongarra",
  title =        "The Design and Implementation of the Parallel
                 Out-of-core {ScaLAPACK} {$ L U $}, {$ Q R $} and
                 {Cholesky} Factorization Routines",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        jan,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. Dongarra and F. Rastello and Y.
                 Robert",
  title =        "Determining the Idle Time of a Tiling: New Results",
  crossref =     "IEEE:1997:PIC",
  pages =        "307--317",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. Dongarra and F. Rastello and Y.
                 Robert",
  title =        "Determining the Idle Time of a Tiling: New Results",
  journal =      j-J-INFO-SCI-ENG,
  volume =       "14",
  number =       "1",
  pages =        "167--190",
  month =        mar,
  year =         "1997",
  CODEN =        "JINEEY",
  ISSN =         "1016-2364",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of information science and engineering",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Frederic Desprez and Jack Dongarra and Antoine Petitet
                 and Cyril Randriamaro and Yves Robert",
  title =        "Scheduling Block-Cyclic Array Redistribution",
  type =         "LAPACK Working Note",
  number =       "120 and UT-CS-97-349",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        feb,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "LAPACK Working Note 120. UT-CS-97-349, February
                 1997.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and F. Desprez and A. Petitet and C.
                 Randriamaro and Y. Robert",
  title =        "Block-Cyclic Array Redistribution on Networks of
                 Workstations",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1332",
  pages =        "343--350",
  year =         "1997",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Apr 28 08:51:33 MDT 1998",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and F. Desprez and A. Petitet and C.
                 Randriamaro and Y. Robert",
  title =        "Block-Cyclic Array Redistribution on Networks of
                 Workstations",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1332",
  pages =        "343--350",
  year =         "1997",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Apr 28 08:51:33 MDT 1998",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and David W. Walker",
  booktitle =    "Iterative methods in scientific computing (Hong Kong,
                 1995)",
  title =        "Constructing linear algebra software libraries for
                 high-performance computers",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "111--167",
  year =         "1997",
  MRclass =      "65Fxx (65Y05 65Y15)",
  MRnumber =     "1 661 961",
  bibdate =      "Thu Sep 16 09:36:42 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and S. Hammarling and A. Petitet",
  title =        "Case studies on the development of {ScaLAPACK} and the
                 {NAG} Numerical {PVM} Library",
  crossref =     "Boisvert:1997:QNS",
  pages =        "236--248",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and H. W. Meuer and H. D. Simon and E.
                 Strohmaier",
  title =        "Changing Technologies of {HPC}",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "12",
  number =       "5",
  pages =        "461--474",
  month =        apr,
  year =         "1997",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and E. F. D'Azevedo",
  title =        "The Design and Implementation of the Parallel
                 Out-of-core {ScaLAPACK} {$ L U $}, {$ Q R $}, and
                 {Cholesky} Factorization Routines",
  type =         "LAPACK Working Note",
  number =       "118",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jan,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-97-347, January 1997.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Greg Henry and David Watkins",
  booktitle =    "Proceedings of the Eighth {SIAM} Conference on
                 Parallel Processing for Scientific Computing
                 (Minneapolis, {MN, 1997)}",
  title =        "A distributed memory implementation of the
                 nonsymmetric {$ Q R $} algorithm",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "8 (electronic)",
  year =         "1997",
  MRclass =      "65F30",
  MRnumber =     "1 602 519",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and Y. Kim and J. Plank",
  title =        "Fault Tolerant Matrix Operations for Networks of
                 Workstations using Multiple Checkpointing",
  crossref =     "IEEE:1997:HPC",
  pages =        "460--465",
  year =         "1997",
  bibdate =      "Tue Feb 26 08:40:25 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and H. D. Simon",
  title =        "High Performance Computing in the {U.S.} in 1996 ---
                 An Analysis on the Basis of the {TOP500} List",
  journal =      j-SUPERCOMPUTER,
  volume =       "13",
  number =       "1",
  pages =        "19--28",
  month =        "????",
  year =         "1997",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Mon Jul 7 11:45:05 MDT 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classification = "C0200 (General computer topics); C5440
                 (Multiprocessing systems)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Supercomputer",
  keywords =     "1996; computer applications; DP industry; geographical
                 distribution; high performance computing; highly
                 parallel systems; HPC systems; industrial use; Lawrence
                 Berkeley technology transition; microprocessor;
                 National Laboratory; parallel machines; performance
                 evaluation; supercomputer sites; TOP500 list; United
                 States; vendors",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  treatment =    "P Practical",

  author =       "Jack Dongarra and Sven Hammarling and David W.
  title =        "Key Concepts For Parallel Out-Of-Core {$ L U $}
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Sven Hammarling and David W.
  title =        "Key concepts for parallel out-of-core {$ L U $}
  journal =      j-PARALLEL-COMPUTING,
  volume =       "23",
  number =       "1--2",
  pages =        "49--70",
  day =          "16",
  month =        apr,
  year =         "1997",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Oct 21 15:14:48 MDT 1997",
  bibsource =    "Compendex database;
  acknowledgement = ack-nhfb,
  affiliation =  "Univ of Tennessee",
  affiliationaddress = "Knoxville, TN, USA",
  classification = "714.2; 722.1; 722.4; 723; 723.1; 921",
  conference =   "Proceedings of the 1996 International Workshop on
                 Environments and Tools for Parallel Scientific
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  journalabr =   "Parallel Comput",
  keywords =     "Algorithms; Computer architecture; Input output
                 programs; lu factorization; Microprocessor chips;
                 Parallel processing systems; Percolation (computer
                 storage); Storage allocation (computer)",
  meetingaddress = "Faverges de la Tour, Fr",
  meetingdate =  "Aug 22--23 1996",
  meetingdate2 = "08/22--23/96",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Tom Dunigan",
  title =        "Message-passing performance of various computers",
  journal =      j-CPE,
  volume =       "9",
  number =       "10",
  pages =        "915--926",
  month =        oct,
  year =         "1997",
  CODEN =        "CPEXEI",
  DOI =          "<915::AID-CPE277>3.0.CO;2-C",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Tue Sep 7 06:06:35 MDT 1999",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and H. W. Meuer and E. Strohmaier",
  title =        "Preface",
  journal =      j-SUPERCOMPUTER,
  volume =       "13",
  number =       "1",
  pages =        "4--5",
  month =        "????",
  year =         "1997",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputer",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and S. Browne and H. Casanova",
  title =        "Providing Access to High Performance Computing
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1215",
  pages =        "24--34",
  year =         "1997",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Aug 22 11:59:49 MDT 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Preface to the Special Issue",
  journal =      j-IJSAHPC,
  volume =       "11",
  number =       "2",
  pages =        "83--83",
  month =        "Summer",
  year =         "1997",
  CODEN =        "IJSCFG",
  DOI =          "",
  ISSN =         "1078-3482",
  bibdate =      "Thu Jun 26 18:17:48 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Supercomputer Applications
                 and High Performance Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and H. W. Meuer and E. Strohmaier",
  title =        "{TOP500} Supercomputer Sites",
  journal =      j-SUPERCOMPUTER,
  volume =       "13",
  number =       "1",
  pages =        "89--120",
  month =        "????",
  year =         "1997",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Mon Jul 7 11:45:05 MDT 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classification = "C0310B (Computer facilities); C5440 (Multiprocessing
                 systems)C5470 (Performance evaluation and testing)",
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Supercomputer",
  keywords =     "computer centres; computer installation;
                 high-performance computers; LINPACK benchmark
                 performance; multiprocessing systems; performance
                 evaluation; performance measure; powerful computer
                 systems; ranking; statistics; supercomputer sites",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  treatment =    "G General Review",

  author =       "J. Dongarra and R. C. Whaley",
  title =        "A User's Guide to the {BLACS v1.1}",
  type =         "LAPACK Working Note",
  number =       "94",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "5",
  month =        may,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "Updated May 5, 1997 (Version 1.1).",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and B. Tourancheau",
  title =        "Workshop on environments and tools for parallel
                 scientific computing",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "23",
  number =       "1--2",
  pages =        "1--4",
  day =          "16",
  month =        apr,
  year =         "1997",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Oct 21 14:55:59 MDT 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "David M. Doolin and Jack Dongarra",
  title =        "{JLAPACK} --- Compiling {LAPACK Fortran} to {Java},
                 Phase 1",
  type =         "Technical report",
  number =       "CS-97-367",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. Fagg and J. Dongarra and A. Geist",
  title =        "Heterogeneous {MPI} Application Interoperation and
                 Process Management under {PVMPI}",
  type =         "Technical report",
  number =       "CS-97-???",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        jun,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. E. Fagg and J. J. Dongarra and A. Geist",
  title =        "Heterogeneous {MPI} Application Interoperation and
                 Process Management under {PVMPI}",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1332",
  pages =        "91--98",
  year =         "1997",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Apr 28 08:51:33 MDT 1998",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Markus Fischer and Jack Dongarra",
  editor =       "????",
  booktitle =    "Concurrent Computing Conference, Atlanta, {GA}, March
                 10--11, 1994",
  title =        "Another Architecture: {PVM} on {Windows 95\slash NT}",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. Henry and D. Watkins and J. Dongarra",
  title =        "A Parallel Implementation of the Nonsymmetric {$ Q R
                 $} Algorithm for Distributed Memory Architectures",
  type =         "LAPACK Working Note",
  number =       "121",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        mar,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-97-352, March 1997.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Keith Moore and Graham E. Fagg and Al Geist and Jack
  title =        "Scalable Networked Information Processing Environment
  crossref =     "ACM:1997:SHP",
  pages =        "??--??",
  year =         "1997",
  bibdate =      "Sat Mar 21 08:51:09 1998",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James S. Plank and Youngbae Kim and Jack J. Dongarra",
  title =        "Fault-Tolerant Matrix Operations for Networks of
                 Workstations Using Diskless Checkpointing",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "43",
  number =       "2",
  pages =        "125--138",
  day =          "15",
  month =        jun,
  year =         "1997",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Thu Mar 9 09:19:03 MST 2000",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Strohmaier and J. J. Dongarra and H. W. Meuer and
                 H. D. Simon",
  title =        "Evolution of the {HPC} Market",
  crossref =     "Grandinetti:1997:HPC",
  volume =       "30",
  pages =        "27--44",
  year =         "1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Strohmaier and J. J. Dongarra and H. W. Meuer and
                 H. D. Simon",
  title =        "High-Performance Computing in Industry",
  journal =      j-SUPERCOMPUTER,
  volume =       "13",
  number =       "1",
  pages =        "74--88",
  month =        "????",
  year =         "1997",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Wed Mar 18 08:37:01 MST 1998",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessing systems); C7160
                 (Manufacturing and industrial administration)C6150N
                 (Distributed systems software); C7400 (Engineering
  corpsource =   "Dept. of Comput. Sci., Tennessee Univ., Knoxville, TN,
  fjournal =     "Supercomputer",
  keywords =     "computer applications; computer architecture; computer
                 architectures; DP industry; geographical distribution;
                 high-performance computing; industrial applications;
                 industrial computing; industrial installations; market
                 share; multiprocessing programs; multiprocessing
                 systems; supercomputer manufacturers; top 500
                 supercomputer sites",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pubcountry =   "Netherlands",
  treatment =    "A Application; G General Review",

  author =       "Greg Henry and David Watkins and Jack Dongarra",
  title =        "A Parallel Implementation of the Nonsymmetric {$ Q R
                 $} Algorithm for Distributed Memory Architectures",
  type =         "Technical report",
  number =       "CS-97-352",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  month =        mar,
  year =         "1997",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "LAPACK Working Note 121.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. Whaley and J. Dongarra",
  title =        "Automatically Tuned Linear Algebra Software",
  type =         "LAPACK Working Note",
  number =       "131",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        dec,
  year =         "1997",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-97-366, December 1997.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. S. Blackford and J. J. Dongarra and C. A.
                 Papadopoulos and R. C. Whaley",
  title =        "Installation Guide and Design of the {HPF 1.1}
                 interface to {ScaLAPACK}, {SLHPF}",
  type =         "LAPACK Working Note",
  number =       "137",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-396, August 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ronald F. Boisvert and Jack J. Dongarra and Roldan
                 Pozo and Karin A. Remington and G. W. Stewart",
  title =        "Developing numerical libraries in {Java}",
  crossref =     "ACM:1998:AWJ",
  pages =        "??--??",
  year =         "1998",
  bibdate =      "Thu Apr 27 10:43:08 2000",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ronald F. Boisvert and Jack J. Dongarra and Roldan
                 Pozo and Karin A. Remington and G. W. Stewart",
  title =        "Developing numerical libraries in {Java}",
  journal =      j-CPE,
  volume =       "10",
  number =       "11--13",
  pages =        "1117--1129",
  month =        sep,
  year =         "1998",
  CODEN =        "CPEXEI",
  DOI =          "<1117::AID-CPE386>3.3.CO;2-9",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Tue Sep 7 06:06:44 MDT 1999",
  bibsource =    ";
  note =         "Special Issue: Java for High-performance Network
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. Boisvert and Shirley Browne and Jack Dongarra and
                 E. Grosse and B. Miller",
  title =        "User Interfaces for Software Repositories",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1998",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Submitted to Information Retrieval Journal.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Browne and Jack Dongarra and Kevin London",
  title =        "Review of Performance Analysis Tools for {MPI}
                 Parallel Programs",
  journal =      "NHSE Review",
  volume =       "3",
  year =         "1998",
  CODEN =        "????",
  ISSN =         "????",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Accepted, to appear.",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "National HPCC Software Exchange (NHSE); Rice
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "This journal ceased publication in 1997.",

  author =       "Henri Casanova and Jack Dongarra",
  title =        "Applying {NetSolve}'s Network-Enabled Server",
  journal =      j-IEEE-COMPUT-SCI-ENG,
  volume =       "5",
  number =       "3",
  pages =        "57--67",
  month =        jul # "\slash " # sep,
  year =         "1998",
  CODEN =        "ISCEE4",
  DOI =          "",
  ISSN =         "1070-9924 (print), 1558-190X (electronic)",
  ISSN-L =       "1070-9924",
  bibdate =      "Sat Jan 9 08:57:23 MST 1999",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Computational Science \& Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. Dongarra",
  title =        "Enabling Technologies for High Performance Computing",
  crossref =     "Papailiou:1998:PFE",
  volume =       "2",
  pages =        "71--76",
  year =         "1998",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. J. Dongarra and K. Moore",
  title =        "Network-Enabled Solvers and the {NetSolve} Project",
  journal =      j-SIAM-NEWS,
  volume =       "31",
  number =       "1",
  pages =        "??--??",
  year =         "1998",
  ISSN =         "0036-1437",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM News",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. J. Dongarra",
  title =        "{NetSolve}: a network-enabled solver; examples and
  crossref =     "Antonio:1998:SHC",
  pages =        "19--28",
  year =         "1998",
  DOI =          "",
  bibdate =      "Fri May 27 10:25:12 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. Dongarra",
  title =        "{NetSolve version 1.2}: Design and Implementation",
  type =         "LAPACK Working Note",
  number =       "140",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        nov,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-406, Nov 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Jack Dongarra",
  title =        "Using agent-based software for scientific computing in
                 the {NetSolve} system",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "24",
  number =       "12--13",
  pages =        "1777--1790",
  day =          "1",
  month =        nov,
  year =         "1998",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Fri Aug 6 10:15:40 MDT 1999",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. D'Azevedo and J. Dongarra",
  title =        "Packed Storage Extensions for {ScaLAPACK}",
  type =         "LAPACK Working Note",
  number =       "135",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-385, April 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. Dongarra and F. Rastello and Y.
  title =        "Determining the idle time of a tiling: New results",
  journal =      j-J-INFO-SCI-ENG,
  volume =       "14",
  number =       "1",
  pages =        "167--190",
  month =        "????",
  year =         "1998",
  CODEN =        "JINEEY",
  ISSN =         "1016-2364",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of information science and engineering",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and S. Domas and J. Dongarra and A.
  title =        "More on Scheduling Block-Cyclic Array Redistribution",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1511",
  pages =        "275--287",
  year =         "1998",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Jan 5 08:21:58 MST 1999",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. Dongarra and A. Petitet and C.
  title =        "Scheduling Block-Cyclic Array Redistribution",
  crossref =     "DHollander:1998:PCF",
  pages =        "227--234",
  year =         "1998",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Desprez and J. Dongarra and A. Petitet and C.
                 Randriamaro and Y. Robert",
  title =        "Scheduling Block-Cyclic Array Redistribution",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "9",
  number =       "2",
  pages =        "192--205",
  month =        feb,
  year =         "1998",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Fri Nov 6 12:31:15 MST 1998",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and G. Fagg and A. Geist and J. A. Kohl",
  title =        "{HARNESS}: Heterogeneous Adaptable Reconfigurable
                 {NEtworked} Systems",
  crossref =     "IEEE:1998:PSI",
  pages =        "358--359",
  year =         "1998",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and J. Wa{\'s}niewski",
  title =        "High Performance Linear Algebra Package {LAPACK90}",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1388",
  pages =        "387--391",
  year =         "1998",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Oct 10 14:40:24 MDT 1998",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and S. Hammarling and D. W. Walker",
  title =        "Key concepts for parallel out-of-core {$ L U $}
  journal =      j-COMPUT-MATH-APPL,
  volume =       "35",
  number =       "7",
  pages =        "13--31",
  month =        "????",
  year =         "1998",
  CODEN =        "CMAPDK",
  DOI =          "",
  ISSN =         "0898-1221 (print), 1873-7668 (electronic)",
  ISSN-L =       "0898-1221",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computers and Mathematics with Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Iain S. Duff and Danny C.
                 Sorensen and Henk A. van der Vorst",
  title =        "Numerical Linear Algebra for High-Performance
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xviii + 342",
  year =         "1998",
  ISBN =         "0-89871-428-1",
  ISBN-13 =      "978-0-89871-428-9",
  LCCN =         "QA76.88 .N86 1998",
  MRclass =      "65-02 (65Fxx 65G50); 65-02 (65Fxx 65G05)",
  MRnumber =     "MR1654239 (2000a:65002)",
  MRreviewer =   "Zahari Zlatev",
  bibdate =      "Sat Dec 31 06:28:14 2005",
  bibsource =    ";
                 MathSciNet database",
  series =       "Software, Environments, and Tools",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and W. Owczarz and J. Wasniewski and P.
  title =        "Testing Software for {LAPACK90}",
  type =         "LAPACK Working Note",
  number =       "138",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        sep,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-401, Sept 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. E. Fagg and K. S. London and J. J. Dongarra",
  title =        "{MPIConnect}: Managing Heterogeneous {MPI}
                 Applications Interoperation and Process Control",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1497",
  pages =        "93--96",
  year =         "1998",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Jan 5 08:21:58 MST 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "William Gropp and Steven Huss-Lederman and Andrew
                 Lumsdaine and Ewing Lusk and Bill Nitzberg and William
                 Saphir and Marc Snir",
  title =        "{MPI}: The Complete Reference. Volume 2, The {MPI-2}
  publisher =    pub-MIT,
  address =      pub-MIT:adr,
  edition =      "Second",
  pages =        "350",
  year =         "1998",
  ISBN =         "0-262-57123-4 (vol. 2), 0-262-69216-3 (set)",
  ISBN-13 =      "978-0-262-57123-4 (vol. 2), 978-0-262-69216-8 (set)",
  LCCN =         "QA76.642 .M65 1998",
  bibdate =      "Thu Oct 29 07:27:43 1998",
  bibsource =    "",
  note =         "See also volume 1 \cite{Snir:1998:MCR}.",
  price =        "US\$30 (paperback)",
  series =       "Scientific and Engineering Computation",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "M. Migliardi and J. Dongarra and A. Geist and V.
  title =        "Dynamic Reconfiguration and Virtual Machine Management
                 in the {Harness} Metacomputing System",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1505",
  pages =        "127--134",
  year =         "1998",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Tue Jan 5 08:21:58 MST 1999",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Petitet and J. Dongarra",
  title =        "Algorithmic Redistribution Methods for Block Cyclic
  type =         "LAPACK Working Note",
  number =       "133",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        mar,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-383, March 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Petitet and H. Casanova and J. Dongarra and Y.
                 Robert and R. C. Whaley",
  title =        "A Numerical Linear Algebra Problem Solving Environment
                 Designer's Perspective",
  type =         "LAPACK Working Note",
  number =       "139",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-405, Oct 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. S. Plank and H. Casanova and M. Beck and J.
  title =        "Deploying Fault-Tolerance and Task Migration with
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1541",
  pages =        "418--432",
  year =         "1998",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Wed Sep 15 10:01:31 MDT 1999",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  keywords =     "applied parallel computing; computing science; PARA;
                 parallel computing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Joel H. Saltz and Alan Sussman and Susan Graham and
                 James Demmel and Scott Baden and Jack Dongarra",
  title =        "Programming tools and environments",
  journal =      j-CACM,
  volume =       "41",
  number =       "11",
  pages =        "64--73",
  month =        nov,
  year =         "1998",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Wed Nov 4 07:39:27 MST 1998",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Communications of the ACM",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Snir and Steve W. Otto and Steven Huss-Lederman
                 and David W. Walker and Jack Dongarra",
  title =        "{MPI}: The Complete Reference. Volume 1, The {MPI-1}
  publisher =    pub-MIT,
  address =      pub-MIT:adr,
  edition =      "Second",
  pages =        "450",
  month =        sep,
  year =         "1998",
  ISBN =         "0-262-69215-5",
  ISBN-13 =      "978-0-262-69215-1",
  LCCN =         "QA76.642 .M65 1998",
  bibdate =      "Thu Oct 29 07:27:43 1998",
  bibsource =    "",
  note =         "See also volume 2 \cite{Gropp:1998:MCR}.",
  price =        "US\$35 (paperback)",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Tisseur and J. Dongarra",
  title =        "Parallelizing the Divide and Conquer Algorithm for the
                 Symmetric Tridiagonal Eigenvalue Problem on Distributed
                 Memory Architectures",
  type =         "LAPACK Working Note",
  number =       "132",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        mar,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-382, March 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Wasniewski and J. Dongarra",
  title =        "High Performance Linear Algebra Package ---
  type =         "LAPACK Working Note",
  number =       "134",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "1998",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-98-384, April 1998.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Wa{\'s}niewski and J. Dongarra",
  title =        "High Performance Linear Algebra Package for {FORTRAN
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1541",
  pages =        "579--581",
  year =         "1998",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Wed Sep 15 10:01:31 MDT 1999",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  keywords =     "applied parallel computing; computing science; PARA;
                 parallel computing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. Clint Whaley and Jack J. Dongarra",
  title =        "{Automatically Tuned Linear Algebra Software}
  crossref =     "ACM:1998:SHP",
  year =         "1998",
  bibdate =      "Wed Mar 06 06:37:44 2002",
  bibsource =    "",
  note =         "Best Paper Award for Systems.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Anderson and Z. Bai and C. Bischof and S. Blackford
                 and J. Demmel and J. Dongarra and J. {Du Croz} and A.
                 Greenbaum and S. Hammarling and A. McKenney and D.
                 Sorensen",
  title =        "{LAPACK} Users' Guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  edition =      "Third",
  pages =        "xxi + 407",
  year =         "1999",
  ISBN =         "0-89871-447-8",
  ISBN-13 =      "978-0-89871-447-0",
  LCCN =         "QA76.73.F25 L36 1999",
  bibdate =      "Thu Sep 19 07:23:11 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "P. Arbenz and A. Cleary and J. Dongarra and M.
                 Hegland",
  title =        "A Comparison of Parallel Solvers for Diagonally
                 Dominant and General Narrow-Banded Linear Systems",
  type =         "LAPACK Working Note",
  number =       "142",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  pages =        "18",
  month =        feb,
  year =         "1999",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-99-414, Feb 1999.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "P. Arbenz and A. Cleary and J. Dongarra and M.
                 Hegland",
  title =        "A Comparison of Parallel Solvers for Diagonally
                 Dominant and General Narrow-Banded Linear Systems
                 {II}",
  type =         "LAPACK Working Note",
  number =       "143",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  pages =        "10",
  month =        may,
  year =         "1999",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-99-415, May 1999.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "P. Arbenz and A. Cleary and J. Dongarra and M.
                 Hegland",
  title =        "A Comparison of Parallel Solvers for Diagonally
                 Dominant and General Narrow-Banded Linear Systems",
  journal =      j-PARALLEL-DIST-COMP-PRACT,
  volume =       "2",
  number =       "4",
  pages =        "??--??",
  month =        "????",
  year =         "1999",
  CODEN =        "????",
  ISSN =         "1097-2803",
  bibdate =      "Fri Dec 19 08:14:14 MST 2003",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "PDCP: Parallel and Distributed Computing Practices",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "V. Barker and S. Blackford and J. Dongarra and J.
                 DuCroz and S. Hammarling and J. Wa{\'s}niewski and P.
                 Yalamov",
  title =        "{LAPACK95} Users' Guide (Draft)",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1999",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Micah Beck and Jack J. Dongarra and Graham E. Fagg and
                 G. Al Geist and Paul Gray and James Kohl and Mauro
                 Migliardi and Keith Moore and Terry Moore and Philip
                 Papadopoulous and Stephen L. Scott and Vaidy Sunderam",
  title =        "{HARNESS}: a Next Generation Distributed Virtual
                 Machine",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "15",
  number =       "5--6",
  pages =        "571--582",
  day =          "1",
  month =        oct,
  year =         "1999",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Tue Mar 05 17:45:35 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Micah Beck and Henri Casanova and Jack Dongarra and
                 Terry Moore and Jim Plank and Francine Berman and Rich
                 Wolski",
  title =        "Logistical Quality of Service in {NetSolve}",
  journal =      j-COMP-COMM,
  volume =       "22",
  number =       "11",
  pages =        "1034--1044",
  year =         "1999",
  CODEN =        "COCOD7",
  DOI =          "",
  ISSN =         "0140-3664 (print), 1873-703X (electronic)",
  ISSN-L =       "0140-3664",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computer Communications",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Mike Berry and Jack Dongarra",
  title =        "{Atlanta} Organizers Put Mathematics to Work For the
                 Math Sciences Community",
  journal =      j-SIAM-NEWS,
  volume =       "32",
  number =       "6",
  year =         "1999",
  ISSN =         "0036-1437",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM News",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Pierre Boulet and Jack Dongarra and Fabrice Rastello
                 and Yves Robert and Frederic Vivien",
  title =        "Algorithmic Issues on Heterogeneous Computing
                 Platforms",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "9",
  number =       "2",
  pages =        "197--213",
  year =         "1999",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxnote =       "Check this: conflicts with entries in

  author =       "Pierre Boulet and Jack Dongarra and Yves Robert and
                 Fr{\'e}d{\'e}ric Vivien",
  title =        "Static tiling for heterogeneous computing platforms",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "25",
  number =       "5",
  pages =        "547--568",
  day =          "1",
  month =        may,
  year =         "1999",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "68M20",
  MRnumber =     "1 694 931",
  bibdate =      "Fri Aug 6 10:16:06 MDT 1999",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Browne and Jack Dongarra and Anne Trefethen",
  editor =       "????",
  booktitle =    "{IEEE} Cluster Computing {BOF} at {SC99}, November,
                 1999, Portland {OR}",
  title =        "Numerical Libraries and Tools for Scalable Parallel
                 Cluster Computing",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "??--??",
  year =         "1999",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Pierre-Yves Calland and Jack Dongarra and Yves
                 Robert",
  title =        "Tiling on systems with communication\slash computation
                 overlap",
  journal =      j-CPE,
  volume =       "11",
  number =       "3",
  pages =        "139--153",
  month =        mar,
  year =         "1999",
  CODEN =        "CPEXEI",
  DOI =          "<139::AID-CPE370>3.0.CO;2-X",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Tue Sep 7 06:06:47 MDT 1999",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and MyungHo Kim and James S. Plank and
                 Jack J. Dongarra",
  title =        "Adaptive Scheduling for Task Farming with Grid
                 Middleware",
  journal =      j-IJHPCA,
  volume =       "13",
  number =       "3",
  pages =        "231--240",
  month =        "Fall",
  year =         "1999",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Thu Jul 15 18:35:38 1999",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "H. Casanova and J. Dongarra",
  title =        "Providing uniform dynamic access to numerical
  crossref =     "Heath:1999:APP",
  volume =       "105",
  pages =        "345--366",
  year =         "1999",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Michael G. Thomason and Jack J.
                 Dongarra",
  title =        "Stochastic Performance Prediction for Iterative
                 Algorithms in Distributed Environments",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "58",
  number =       "1",
  pages =        "68--91",
  month =        jul,
  year =         "1999",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Thu Mar 9 09:19:07 MST 2000",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Graham Fagg and Rolf Hempel and
                 David Walker",
  title =        "Message Passing Software Systems",
  crossref =     "Webster:1999:WEE",
  pages =        "??--??",
  year =         "1999",
  bibdate =      "Tue Feb 26 07:50:42 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout",
  title =        "Numerical Linear Algebra Algorithms and Software",
  journal =      "Journal CAM (Numerical) Linear Algebra",
  volume =       "31",
  number =       "4",
  pages =        "??--??",
  day =          "28",
  month =        oct,
  year =         "1999",
  CODEN =        "????",
  ISSN =         "????",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxnote =       "What journal is this??",

  author =       "Jack Dongarra and Victor Eijkhout",
  editor =       "Allen Kent and James Williams",
  booktitle =    "Encyclopedia of Computer Science and Technology",
  title =        "Numerical Linear Algebra",
  publisher =    pub-MARCEL-DEKKER,
  address =      pub-MARCEL-DEKKER:adr,
  pages =        "207--233",
  month =        aug,
  year =         "1999",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and E. J. Kontoghiorghes",
  title =        "Preface",
  journal =      j-PARALLEL-DIST-COMP-PRACT,
  volume =       "2",
  number =       "4",
  pages =        "??--??",
  month =        "????",
  year =         "1999",
  CODEN =        "????",
  ISSN =         "1097-2803",
  bibdate =      "Fri Dec 19 08:14:14 MST 2003",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "PDCP: Parallel and Distributed Computing Practices",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Bernard Tourancheau",
  title =        "Special Issue Introduction: Clusters and Computational
                 Grids for Scientific Computing",
  journal =      j-IJHPCA,
  volume =       "13",
  number =       "3",
  pages =        "179--179",
  month =        "Fall",
  year =         "1999",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Wed Jul 28 14:14:38 1999",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxmonth =      aug,

  author =       "Jack Dongarra and Hans-Werner Meuer and Erich
                 Strohmaier",
  title =        "{Top500} Report",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "1999",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. Doolin and J. Dongarra and K. Seymour",
  title =        "{JLAPACK} --- Compiling {LAPACK Fortran} to {Java}",
  journal =      j-SCI-PROG,
  volume =       "7",
  number =       "2",
  pages =        "111--138",
  year =         "1999",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Tue Mar 05 17:37:30 2002",
  bibsource =    "",
  note =         "The software is available on the World-Wide Web at
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Keith Moore and Jack J. Dongarra",
  title =        "{Scalable Networked Information Processing
                 Environment} ({SNIPE})",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "15",
  number =       "5--6",
  pages =        "595--605",
  day =          "1",
  month =        oct,
  year =         "1999",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Tue Mar 05 17:46:27 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Markus Fischer and Jack Dongarra",
  title =        "Experiences with {Windows 95/NT} as a Cluster
                 Computing Platform for Parallel Computing",
  journal =      j-PARALLEL-DIST-COMP-PRACT,
  volume =       "2",
  number =       "2",
  pages =        "??--??",
  month =        feb,
  year =         "1999",
  CODEN =        "????",
  ISSN =         "1097-2803",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "PDCP: Parallel and Distributed Computing Practices",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. P. Petitet and J. J. Dongarra",
  title =        "Algorithmic Redistribution Methods for Block-Cyclic
                 Decompositions",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "10",
  number =       "12",
  pages =        "1201--1216",
  month =        dec,
  year =         "1999",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu Oct 12 18:48:32 MDT 2000",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Petitet and H. Casanova and R. Whaley and J.
                 Dongarra and Y. Robert",
  booktitle =    "{SIAM} Annual Meeting, Atlanta, {GA}, May 13, 1999",
  title =        "A Numerical Linear Algebra Problem Solving Environment
                 Designer's Perspective",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  year =         "1999",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James S. Plank and Henri Casanova and Micah Beck and
                 Jack J. Dongarra",
  title =        "Deploying Fault-Tolerance and Task Migration with
                 {NetSolve}",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "15",
  number =       "5--6",
  pages =        "745--755",
  day =          "1",
  month =        oct,
  year =         "1999",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Tue Mar 05 17:44:12 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Erich Strohmaier and Jack J. Dongarra and Hans W.
                 Meuer and Horst D. Simon",
  title =        "The marketplace of high-performance computing",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "25",
  number =       "13--14",
  pages =        "1517--1544",
  month =        dec,
  year =         "1999",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Oct 28 17:44:02 MDT 2000",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fran{\c{c}}oise Tisseur and Jack Dongarra",
  title =        "A Parallel Divide and Conquer Algorithm for the
                 Symmetric Eigenvalue Problem on Distributed Memory
                 Architectures",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "20",
  number =       "6",
  pages =        "2223--2236",
  month =        nov,
  year =         "1999",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  bibdate =      "Sat Jul 17 19:14:40 MDT 1999",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Beguelin and J. J. Dongarra and G. A. Geist and R.
                 Manchek and V. S. Sunderam",
  title =        "{PVM} Software System and Documentation",
  howpublished = "Email to {\tt [email protected]}",
  year =         "19xx",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dorian C. Arnold and Jack Dongarra",
  title =        "The {NetSolve} Environment: Progressing Towards the
                 Seamless Grid",
  crossref =     "Sadayappan:2000:IWP",
  bookpages =    "xvi + 584",
  pages =        "199--206",
  year =         "2000",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxeditor =     "David J. Lilja",
  xxISBN =       "0-7695-0768-9 0-7695-0770-0 (microfiche)",
  xxLCCN =       "QA76.6 .I548 2000",
  xxnote =       "This conference is cataloged twice with separate
                 editor and ISBN values; which did this paper appear
  xxpages =      "xx + 590",

  author =       "Dorian C. Arnold and Shirley Browne and Jack Dongarra
                 and Graham Fagg and Keith Moore",
  editor =       "????",
  booktitle =    "Proceedings of the {DoD} {HPC} Users Group Conference
                 {(HPCUG 2000)}, Albuquerque, New Mexico, Albuquerque
                 Hilton Hotel, June 5--8, 2000",
  title =        "Secure Remote Access to Numerical Software and
                 Computational Hardware",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2000",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Zhaojun Bai and James Demmel and Jack Dongarra and
                 Axel Ruhe",
  title =        "Templates for the solution of algebraic eigenvalue
                 problems: a practical guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xxx + 410",
  year =         "2000",
  ISBN =         "0-89871-471-0 (paperback), 0-89871-958-5 (e-book)",
  ISBN-13 =      "978-0-89871-471-5 (paperback), 978-0-89871-958-1
                 (e-book)",
  LCCN =         "QA193 .T46 2000",
  MRclass =      "65F15 (Eigenvalues, eigenvectors (numerical linear
                 algebra)); 65F50 (Sparse matrices (numerical linear
                 algebra)); 65Y05 (Parallel computation (numerical
                 methods)); 00B15 (Collections of articles of
                 miscellaneous specific interest); 65-06 (Proceedings of
                 conferences (numerical analysis)) 65F35 (Matrix norms,
                 conditioning, scaling (numerical linear algebra));
                 65F20 (Overdetermined systems, pseudoinverses
                 (numerical linear algebra)); 65-02 (65F15)",
  MRnumber =     "MR1792141 (2001k:65003)",
  MRreviewer =   "Jesse L. Barlow",
  bibdate =      "Sat Dec 31 06:28:14 2005",
  bibsource =    ";
                 MathSciNet database",
  note =         "A practical guide.",
  series =       "Software, Environments, and Tools",
  URL =          ";
  abstract =     "The book is edited and written by well-known names in
                 the field and is an excellent guide to the numerical
                 solution of eigenvalue problems. It presents the many
                 available methods in an organized fashion.\par

                 Chapter 1 is introductory. Chapter 2 provides the top
                 level of a decision tree for classifying eigenvalue
                 problems and their corresponding numerical methods.
                 Chapter 3 summarizes the two mathematical principles
                 used by most algorithms for large eigenvalue problems:
                 projection onto subspaces and spectral
                 transformations.\par

                 Chapters 4 through 9 give details for each of the six
                 categories of eigenvalue problems: Hermitian,
                 generalized Hermitian, non-Hermitian, generalized
                 non-Hermitian, and nonlinear eigenvalue problems, and
                 the singular value decomposition. The descriptions
                 include algorithm templates and pointers to available
                 software. Chapter 10 describes common issues of sparse
                 matrix representation and computation, both
                 sequentially and in parallel, shared by all algorithms.
                 Chapter 11 describes some preconditioning techniques
                 that are subject of current research.\par

                 The subjects not covered by the book are referenced for
                 the interested reader.",
  acknowledgement = ack-nhfb,
  keywords =     "Algebraic eigenvalue problems; algorithms; nonlinear
                 eigenvalue problems; parallel computation;
                 preconditioning; projection methods; singular value
                 decomposition; software; spectral transformations;
                 templates; textbook",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  reviewer =     "Plamen Yordanov Yalamov (Russe)",
  subject =      "Eigenvalues; Data processing",
  summary =      "Large-scale problems of engineering and scientific
                 computing often require solutions of eigenvalue and
                 related problems. This book gives a unified overview of
                 theory, algorithms, and practical software for
                 eigenvalue problems. It organizes this large body of
                 material to make it accessible for the first time to
                 the many nonexpert users who need to choose the best
                 state-of-the-art algorithms and software for their
                 problems. Using an informal decision tree, just enough
                 theory is introduced to identify the relevant
                 mathematical structure that determines the best
                 algorithm for each problem.",
  tableofcontents = "List of symbols and acronyms \\
                 List of iterative algorithm templates \\
                 List of direct algorithms \\
                 List of figures \\
                 List of tables \\
                 1. Introduction \\
                 2. A brief tour of eigenproblems \\
                 3. An introduction to iterative projection methods \\
                 4. Hermitian eigenvalue problems \\
                 5. Generalized Hermitian eigenvalue problems \\
                 6. Singular value decomposition \\
                 7. Non-Hermitian eigenvalue problems \\
                 8. Generalized non-Hermitian eigenvalue problems \\
                 9. Nonlinear eigenvalue problems \\
                 10. Common issues \\
                 11. Preconditioning techniques \\
                 Appendix. Of things not treated \\
                 Bibliography \\

  author =       "Mark Baker and Rajkumar Buyya and Jack Dongarra",
  title =        "Tutorial {M9}: Current and Emerging Trends in Cluster
  crossref =     "ACM:2000:SHP",
  pages =        "23--24",
  year =         "2000",
  bibdate =      "Sat Feb 10 14:28:55 2001",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "John Board and Klaus Schulten",
  title =        "The Fast Multipole Algorithm",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "2",
  number =       "1",
  pages =        "76--79",
  month =        jan # "\slash " # feb,
  year =         "2000",
  CODEN =        "CSENFA",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Fri Oct 13 14:31:09 2000",
  bibsource =    "",
  note =         "See correspondence \cite{Makino:2000:LEF}.",
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "S. Browne and J. Dongarra and N. Garner and G. Ho and
                 P. Mucci",
  title =        "A Portable Programming Interface for Performance
                 Evaluation on Modern Processors",
  journal =      j-IJHPCA,
  volume =       "14",
  number =       "3",
  pages =        "189--204",
  month =        "Fall",
  year =         "2000",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Sep 12 12:40:50 2000",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "S. Browne and J. Dongarra and N. Garner and K. London
                 and P. Mucci",
  title =        "A Scalable Cross-Platform Infrastructure for
                 Application Performance Tuning Using Hardware
                 Counters",
  crossref =     "ACM:2000:SHP",
  pages =        "65--65",
  year =         "2000",
  bibdate =      "Mon Feb 12 11:57:44 2001",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Satoshi Matsuoka and J. Dongarra",
  title =        "Network-Enabled Server Systems: Deploying Scientific
                 Simulations on the Grid",
  crossref =     "Tentner:2000:PHP",
  pages =        "??--??",
  year =         "2000",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Frederica Darema and Jack Dongarra and Subhash Saini",
  title =        "Preface",
  journal =      j-IJHPCA,
  volume =       "14",
  number =       "3",
  pages =        "179--179",
  month =        "Fall",
  year =         "2000",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Sep 12 12:40:50 2000",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Eduardo D'Azevedo and Jack Dongarra",
  title =        "The design and implementation of the parallel
                 out-of-core {ScaLAPACK} {$ L U $}, {$ Q R $}, and
                 {Cholesky} factorization routines",
  journal =      j-CPE,
  volume =       "12",
  number =       "15",
  pages =        "1481--1493",
  month =        "????",
  year =         "2000",
  CODEN =        "CPEXEI",
  DOI =          "<1481::AID-CPE540>3.0.CO;2-V",
  ISSN =         "1040-3108 (print), 1096-9128 (electronic)",
  ISSN-L =       "1040-3108",
  bibdate =      "Sat Apr 7 06:56:11 MDT 2001",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency, practice and experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Francis Sullivan",
  title =        "{Guest Editors}' Introduction: The Top 10 Algorithms",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "2",
  number =       "1",
  pages =        "22--23",
  month =        jan # "\slash " # feb,
  year =         "2000",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Fri Oct 13 14:31:09 2000",
  bibsource =    "",
  note =         "See correspondence \cite{Makino:2000:LEF}.",
  URL =          "",
  abstract =     "In putting together this issue of CiSE, we knew three
                 things: it would be difficult to list just 10
                 algorithms; it would be fun to assemble the authors and
                 read their papers; and, whatever we came up with in the
                 end, it would be controversial. We tried to assemble
                 the 10 algorithms with the greatest influence on the
                 development and practice of science and engineering in
                 the 20th century. Following is our list (in
                 chronological order): Metropolis Algorithm for Monte
                 Carlo; Simplex Method for Linear Programming; Krylov
                 Subspace Iteration Methods; The Decompositional
                 Approach to Matrix Computations; The Fortran Optimizing
                 Compiler; QR Algorithm for Computing Eigenvalues;
                 Quicksort Algorithm for Sorting; Fast Fourier
                 Transform; Integer Relation Detection; Fast Multipole
                 Method.",
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Hans Meuer and Horst Simon and Erich
                 Strohmaier",
  editor =       "Peter T. Cummings and Phillip R. Westmoreland and
                 Brice Carnahan",
  booktitle =    "Foundations of molecular modeling and simulation:
                 proceedings of the First International Conference on
                 Molecular Modeling and Simulation, Keystone, Colorado,
                 July 23--28, 2000",
  title =        "High Performance Computing Today",
  volume =       "97(325)",
  publisher =    "American Institute of Chemical Engineers",
  address =      "New York, NY",
  bookpages =    "x + 328",
  pages =        "??--??",
  year =         "2000",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  series =       "AIChE symposium series",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. J. Dongarra and V. Eijkhout",
  title =        "Numerical linear algebra algorithms and software",
  journal =      j-J-COMPUT-APPL-MATH,
  volume =       "123",
  number =       "1--2",
  pages =        "489--514",
  month =        "????",
  year =         "2000",
  CODEN =        "JCAMDI",
  DOI =          "",
  ISSN =         "0377-0427 (print), 1879-1778 (electronic)",
  ISSN-L =       "0377-0427",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Computational and Applied Mathematics",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Padma Raghavan",
  editor =       "????",
  booktitle =    "{IMACS 2000}, Lausanne, Switzerland",
  title =        "A New Recursive Implementation of Sparse {Cholesky}
                 Factorization",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2000",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout and Piotr Luszczek",
  booktitle =    "Proceedings of the 1st {SGI} Users Conference",
  title =        "Recursive Approach in Sparse Matrix {$ L U $}
                 Factorization",
  publisher =    "ACC Cyfronet UMM",
  address =      "Cracow, Poland",
  pages =        "409--418",
  month =        oct,
  year =         "2000",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and F. Sullivan",
  title =        "The {Top 10} algorithms",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "2",
  number =       "1",
  pages =        "22--23",
  month =        jan # "\slash " # feb,
  year =         "2000",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Iain Duff and Danny Sorensen",
  title =        "Tutorial {M7}: High-Speed Numerical Linear Algebra:
                 Algorithms and Research Directions",
  crossref =     "ACM:2000:SHP",
  pages =        "21--22",
  year =         "2000",
  bibdate =      "Sat Feb 10 14:28:55 2001",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Sathish S. Vadhiyar and Jack J.
                 Dongarra",
  title =        "{ACCT}: {Automatic Collective Communications Tuning}",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1908",
  pages =        "354--??",
  year =         "2000",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Feb 1 08:30:27 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Jack J. Dongarra",
  title =        "{FT-MPI}: {Fault Tolerant MPI}, Supporting Dynamic
                 Applications in a Dynamic World",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1908",
  pages =        "346--??",
  year =         "2000",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Feb 1 08:30:27 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jun Makino and John Board and Klaus Schulten and Peter
                 Borcherds and Rubin D. {Orduz Z.}",
  title =        "Letters to the Editors: {``The Fast Multipole
                 Algorithm''} and {``The Top 10 Algorithms''}",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "2",
  number =       "3",
  pages =        "4--5",
  month =        may # "\slash " # jun,
  year =         "2000",
  CODEN =        "CSENFA",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Fri Oct 13 14:31:09 2000",
  bibsource =    "",
  note =         "See \cite{Dongarra:2000:GEI,Board:2000:FMA}.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Petitet and H. Casanova and J. Dongarra and Y.
                 Robert and R. Whaley",
  editor =       "Jacek Blazewicz and others",
  booktitle =    "Handbook on Parallel and Distributed Processing",
  title =        "Parallel and Distributed Scientific Computing: {A}
                 Numerical Linear Algebra Problem Solving Environment
                 Designer's Perspective",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  bookpages =    "635",
  pages =        "??--??",
  year =         "2000",
  ISBN =         "3-540-66441-6",
  ISBN-13 =      "978-3-540-66441-3",
  LCCN =         "QA76.58 .H36 2000",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Graham E. Fagg and Jack
                 Dongarra",
  title =        "Automatically Tuned Collective Communications",
  crossref =     "ACM:2000:SHP",
  pages =        "46--46",
  year =         "2000",
  bibdate =      "Mon Feb 12 11:57:42 2001",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. C. Whaley and A. Petitet and J. Dongarra",
  title =        "Automated Empirical Optimization of Software and the
                 {ATLAS Project}",
  type =         "LAPACK Working Note",
  number =       "147",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        sep,
  year =         "2000",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-00-448, September 2000.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. C. Arnold and S. S. Vadhiyar and J. J. Dongarra",
  title =        "On the Convergence of Computational and Data Grids",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "11",
  number =       "2--3",
  pages =        "187--202",
  year =         "2001",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  bibdate =      "Sat Feb 23 19:27:51 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dorian C. Arnold and Jack Dongarra",
  title =        "Developing an Architecture to Support the
                 Implementation and Development of Scientific Computing
                 Applications",
  crossref =     "Boisvert:2001:ASS",
  pages =        "39--56",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. Arnold and W. Lee and J. Dongarra and M. Wheeler",
  title =        "Providing Infrastructure and Interface to High
                 Performance Applications in a Distributed Setting",
  crossref =     "Tentner:2000:PHP",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dorian C. Arnold and Dieter Bachmann and Jack
                 Dongarra",
  title =        "Request Sequencing: Optimizing Communication for the
                 Grid",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "1900",
  pages =        "1213--??",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Feb 2 13:02:44 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "V. A. Barker and L. S. Blackford and J. J. Dongarra
                 and J. J. {Du Croz} and S. J. Hammarling and M.
                 Marinova and J. Wa{\'s}niewski and P. Yalamov",
  title =        "{LAPACK95} Users' Guide",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xviii + 258",
  year =         "2001",
  ISBN =         "0-89871-504-0 (paperback), 0-89871-820-1 (e-book)",
  ISBN-13 =      "978-0-89871-504-0 (paperback), 978-0-89871-820-1
                 (e-book)",
  LCCN =         "QA76.73.F25 L36 2001",
  bibsource =    "",
  series =       "Software, environments, and tools",
  URL =          "",
  abstract =     "LAPACK95 is a Fortran 95 interface to the Fortran 77
                 LAPACK library. It is relevant for anyone who writes in
                 the Fortran 95 language and needs reliable software for
                 basic numerical linear algebra. It improves upon the
                 original user-interface to the LAPACK package, taking
                 advantage of the considerable simplifications that
                 Fortran 95 allows. LAPACK95 Users' Guide provides an
                 introduction to the design of the LAPACK95 package, a
                 detailed description of its contents, reference manuals
                 for the leading comments of the routines, and example
                 programs.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "LAPACK; FORTRAN (Computer program language); Fortran
                 (Langage de programmation); Subroutines (Computer
                 programs); Sous-programmes (Logiciels)",
  tableofcontents = "Preface \\
                 Part I: General information \\
                 Chapter 1: Essentials \\
                 Chapter 2: Contents of LAPACK95 \\
                 Chapter 3: Documentation Design and Program Examples
                 \\
                 Chapter 4: Performance and Troubleshooting \\
                 Part II: Driver Routines \\
                 Chapter 5: Driver Routines for Linear Systems \\
                 Chapter 6: Driver Routines for Least Squares Problems
                 \\
                 Chapter 7: Driver Routines for Standard Eigenvalue
                 Problems \\
                 Chapter 8: Driver Routines for Generalized Eigenvalue
                 Problems \\
                 Chapter 9: Driver Routines for Singular Value Problems
                 \\
                 Part III: Computational Routines \\
                 Chapter 10: Computational Routines \\
                 Bibliography \\
                 Index by Keyword \\
                 Index by Routine Name",

  author =       "Micah Beck and Dorian Arnold and Alessandro Bassi and
                 Fran Berman and Henri Casanova and Jack Dongarra and
                 Terry Moore and Graziano Obertelli and James Plank and
                 Martin Swany and Sathish Vadhiyar and Rich Wolski",
  title =        "Logistical Computing and Internetworking: Middleware
                 for the Use of Storage in Communication",
  crossref =     "Lee:2001:TAI",
  pages =        "12--21",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Francine Berman and Andrew Chien and Keith Cooper and
                 Jack Dongarra and Ian Foster and Dennis Gannon and
                 Lennart Johnsson and Ken Kennedy and Carl Kesselman and
                 John Mellor-Crummey and Dan Reed and Linda Torczon and
                 Rich Wolski",
  title =        "The {GrADS Project}: Software Support for High-Level
                 {Grid} Application Development",
  journal =      j-IJHPCA,
  volume =       "15",
  number =       "4",
  pages =        "327--344",
  month =        "Winter",
  year =         "2001",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Nov 03 06:28:41 2001",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  keywords =     "GrADS (Grid Application Development Software)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. S. Blackford and J. Demmel and J. Dongarra and I.
                 Duff and S. Hammarling and G. Henry and M. Heroux and
                 L. Kaufman and A. Lumsdaine and A. Petitet and R. Pozo
                 and K. Remington and R. C. Whaley",
  title =        "An Updated Set of {Basic Linear Algebra Subprograms}
                 ({BLAS})",
  pages =        "20",
  month =        feb,
  year =         "2001",
  bibsource =    "",
  note =         "Submitted to " # j-TOMS,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "{Basic Linear Algebra Subprograms Technical (BLAST)
                 Forum}",
  title =        "Basic Linear Algebra Subprograms Technical ({BLAST})
                 Forum Standard",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  pages =        "viii + 209",
  day =          "23",
  month =        jan,
  year =         "2001",
  bibdate =      "Fri May 27 06:29:51 2005",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "The primary chapter authors are the following:
                 \begin{itemize} \item Susan Blackford, Jack Dongarra,
                 and Sven Hammarling, Chapter 1 \item Susan Blackford,
                 Jack Dongarra, and Sven Hammarling, Linda Kaufman,
                 Zohair Maany, Antoine Petitet, Chapter 2 \item Iain
                 Duff, Mike Heroux, Roldan Pozo, Karin Remington, Chapter 3
                 \item Jim Demmel, Greg Henry, Velvel Kahan, Xiaoye Li,
                 Chapter 4 \item Clint Whaley, C Interface to the Legacy
                 BLAS \item Jack Dongarra, Fred Krogh, Journal of
                 Development --- Environmental routines \item Antoine
                 Petitet, Journal of Development --- Distributed-Memory
                 Dense BLAS \item Sven Hammarling, Zohair Maany, Journal
                 of Development --- Fortran95 Thin BLAS \item George
                 Corliss, Chenyi Hu, Baker Kearfott, Bill Walster, J.
                 Wolff v. Gudenberg, Journal of Development --- Interval
                 BLAS. \end{itemize}",

  author =       "J. Choi and J. Demmel and I. Dhillon and J. Dongarra
                 and S. Ostrouchov and A. Petitet and K. Stanley and D.
                 Walker and R. C. Whaley",
  title =        "Installation Guide for {ScaLAPACK}",
  type =         "LAPACK Working Note",
  number =       "93",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "31",
  month =        aug,
  year =         "2001",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "Updated August 31, 2001 (Version 1.7).",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Hans Meuer and Horst Simon and Erich
                 Strohmaier",
  title =        "Biannual {Top-500} Computer Lists Track Changing
                 Environments for Scientific Computing",
  journal =      j-SIAM-NEWS,
  volume =       "34",
  number =       "9",
  pages =        "??--??",
  month =        nov,
  year =         "2001",
  ISSN =         "0036-1437",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM News",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Masaaki Shimasaki and Bernard
                 Tourancheau",
  title =        "Clusters and computational grids for scientific
                 computing",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "27",
  number =       "11",
  pages =        "1401--1402",
  month =        oct,
  year =         "2001",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Fri Feb 22 16:52:42 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "High Performance Computing and Trends: Connecting
                 Computational Requirements with Computing Resources",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2150",
  pages =        "33--??",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Feb 2 13:05:53 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "High performance computing and trends: connecting
                 computational requirements with computing resources",
  crossref =     "Katz:2001:IIC",
  pages =        "135--135",
  year =         "2001",
  bibdate =      "Fri May 27 10:27:11 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout and Henk van der
                 Vorst",
  title =        "An iterative solver benchmark",
  journal =      j-SCI-PROG,
  volume =       "9",
  number =       "4",
  pages =        "223--231",
  year =         "2001",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Sat Oct 26 14:52:27 MDT 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Piotr Luszczek and Antoine Petitet",
  title =        "The {LINPACK} Benchmark: Past, Present, and Future",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "{Netsolve} and its application",
  crossref =     "IEEE:2001:IIS",
  pages =        "21--21",
  year =         "2001",
  bibdate =      "Fri May 27 10:29:12 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Shirley Moore and Anne Trefethen",
  title =        "Numerical Libraries and Tools for Scalable Parallel
                 Cluster Computing",
  journal =      j-IJHPCA,
  volume =       "15",
  number =       "2",
  pages =        "175--180",
  month =        "Summer",
  year =         "2001",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue May 01 05:27:17 2001",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Preface",
  journal =      j-IJHPCA,
  volume =       "15",
  number =       "3",
  pages =        "199--199",
  month =        "Fall",
  year =         "2001",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Mon Nov 05 16:09:36 2001",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and B. Tourancheau",
  title =        "Preface: Clusters and Computational Grids for
                 Scientific Computing",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "11",
  number =       "2--3",
  pages =        "185--??",
  year =         "2001",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  bibdate =      "Sat Feb 23 19:27:51 MST 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software",
  type =         "Technical Report",
  number =       "CS-89-85",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  pages =        "58",
  month =        aug,
  year =         "2001",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and David W. Walker",
  title =        "The Quest for Petascale Computing",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "3",
  number =       "3",
  pages =        "32--39",
  month =        may # "\slash " # jun,
  year =         "2001",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Wed Jul 18 06:52:30 MDT 2001",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout and Piotr Luszczek",
  title =        "Recursive Approach in Sparse Matrix {$ L U $}
                 Factorization",
  journal =      j-SCI-PROG,
  volume =       "9",
  number =       "1",
  pages =        "51--60",
  year =         "2001",
  CODEN =        "SCIPEV",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "An Update of a Couple of Tools: {ATLAS} and {PAPI}",
  type =         "Slide show.",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  pages =        "11",
  year =         "2001",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Kevin London and Shirley Moore and
                 Phil Mucci and Dan Terpstra",
  editor =       "????",
  booktitle =    "Linux Clusters: The {HPC} Revolution, June 25--27,
                 2001, National Center for Supercomputing Applications
                 {(NCSA)}, University of Illinois, Urbana, {IL}",
  title =        "Using {PAPI} For Hardware Performance Monitoring On
                 {Linux} Systems",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Antonin Bukovsky and Jack J.
                 Dongarra",
  title =        "Fault Tolerant {MPI} for the {HARNESS} Meta-computing
                 System",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2073",
  pages =        "355--??",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Feb 2 13:04:28 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Antonin Bukovsky and Jack J.
                 Dongarra",
  title =        "{HARNESS} and fault tolerant {MPI}",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "27",
  number =       "11",
  pages =        "1479--1495",
  month =        oct,
  year =         "2001",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Fri Feb 22 16:52:42 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Edgar Gabriel and Michael Resch and
                 Jack J. Dongarra",
  title =        "Parallel {IO} Support for Meta-computing Applications:
                 {MPI\_Connect IO} Applied to {PACX--MPI}",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2131",
  pages =        "135--??",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Feb 1 08:13:55 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ken Kennedy and Bradley Broom and Keith Cooper and
                 Jack Dongarra and Rob Fowler and Dennis Gannon and
                 Lennart Johnsson and John Mellor-Crummey and Linda
                 Torczon",
  title =        "Telescoping Languages: a Strategy for Automatic
                 Generation of Scientific Problem-Solving Systems from
                 Annotated Libraries",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "61",
  number =       "12",
  pages =        "1803--1826",
  day =          "1",
  month =        dec,
  year =         "2001",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Tue Feb 26 06:20:18 MST 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "K. London and J. Dongarra and S. Moore and P. Mucci
                 and K. Seymour and T. Spencer",
  title =        "End-user Tools for Application Performance Analysis
                 Using Hardware Counters",
  crossref =     "Sha:2001:PDC",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Michelle Miller and Christopher Moulding and Jack
                 Dongarra and Christopher Johnson",
  title =        "Grid-Enabling An Interactive Simulation\slash
                 Visualization Environment",
  crossref =     "Tentner:2001:PHP",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Michelle Miller and Christopher Moulding and Jack
                 Dongarra and Christopher Johnson",
  title =        "Grid-Enabling Problem Solving Environments: a Case
                 Study of {SCIRUN} and {NetSolve}",
  crossref =     "Tentner:2001:PHP",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Keith Moore and Jack Dongarra",
  title =        "{NetBuild}: Transparent Cross-Platform Access to
                 Computational Software Libraries",
  journal =      j-CCPE,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  year =         "2001",
  CODEN =        "CCPEBO",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Moore and David Cronk and Kevin London and
                 Jack Dongarra",
  title =        "Review of Performance Analysis Tools for {MPI}
                 Parallel Programs",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2131",
  pages =        "241--??",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Feb 1 08:13:55 MST 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Antoine Petitet and Susan Blackford and Jack Dongarra
                 and Brett Ellis and Graham Fagg and Kenneth Roche and
                 Sathish Vadhiyar",
  title =        "Numerical Libraries and the {Grid}: The {GrADS}
                 Experiments with {ScaLAPACK}",
  crossref =     "ACM:2001:SHP",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Sat Feb 10 14:28:55 2001",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "GrADS (Grid Application Development Software)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pagecount =    "17",

  author =       "Antoine Petitet and Susan Blackford and Jack Dongarra
                 and Brett Ellis and Graham Fagg and Kenneth Roche and
                 Sathish Vadhiyar",
  title =        "Numerical Libraries and the {Grid}",
  journal =      j-IJHPCA,
  volume =       "15",
  number =       "4",
  pages =        "359--374",
  month =        "Winter",
  year =         "2001",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Nov 03 06:28:41 2001",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Keith Seymour and Jack Dongarra",
  title =        "Automatic Translation of {Fortran} to {JVM} Bytecode",
  crossref =     "ACM:2001:PAJ",
  pages =        "126--133",
  year =         "2001",
  bibdate =      "Mon May 06 09:31:01 2002",
  bibsource =    "",
  URL =          ";
  acknowledgement = ack-nhfb,
  keywords =     "Java",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Graham E. Fagg and Jack J.
                 Dongarra",
  title =        "Performance Modeling for Self Adapting Collective
                 Communications for {MPI}",
  crossref =     "Oldehoeft:2002:SIS",
  pages =        "??--??",
  year =         "2001",
  bibdate =      "Tue Feb 26 06:44:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "Los Alamos Computer Science Institute (LASCI)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxbooktitle =  "LACSI Symposium 2001, October 15--18, Eldorado Hotel,
                 Santa Fe, NM",

  author =       "Sathish S. Vadhiyar and Graham E. Fagg and Jack J.
                 Dongarra",
  title =        "Towards an Accurate Model for Collective
                 Communications",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2073",
  pages =        "41--??",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Feb 2 13:04:28 MST 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aad J. van der Steen and Jack J. Dongarra",
  title =        "Overview of Recent Supercomputers",
  type =         "Technical report",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "2001",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "R. Clint Whaley and Antoine Petitet and Jack J.
                 Dongarra",
  title =        "Automated empirical optimizations of software and the
                 {ATLAS} project",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "27",
  number =       "1--2",
  pages =        "3--35",
  month =        jan,
  year =         "2001",
  CODEN =        "PACOEJ",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Wed Jul 18 06:31:14 MDT 2001",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dorian C. Arnold and Henri Casanova and Jack
                 Dongarra",
  title =        "Innovations of the {NetSolve Grid Computing System}",
  journal =      j-CCPE,
  volume =       "14",
  number =       "13--15",
  pages =        "1457--1479",
  month =        nov # "\slash " # dec,
  year =         "2002",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Jan 13 09:28:02 MST 2004",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "6 Jan 2003",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Micah Beck and Dorian Arnold and Alessandro Bassi and
                 Fran Berman and Henri Casanova and Jack Dongarra and
                 Terry Moore and Graziano Obertelli and James Plank and
                 Martin Swany",
  title =        "Middleware for the use of storage in communication",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "28",
  number =       "12",
  pages =        "1773--1787",
  month =        dec,
  year =         "2002",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Wed Dec 24 09:07:22 MST 2003",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "L. Susan Blackford and James Demmel and Jack Dongarra
                 and Iain Duff and Sven Hammarling and Greg Henry and
                 Michael Heroux and Linda Kaufman and Andrew Lumsdaine
                 and Antoine Petitet and Roldan Pozo and Karin Remington
                 and R. Clint Whaley",
  title =        "An updated set of {Basic Linear Algebra Subprograms
                 (BLAS)}",
  journal =      j-TOMS,
  volume =       "28",
  number =       "2",
  pages =        "135--151",
  month =        jun,
  year =         "2002",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Nov 9 11:16:50 MST 2002",
  bibsource =    ";
  URL =          "",
  abstract =     "This paper expands the specification of a set of
                 kernel routines for linear algebra, historically called
                 the Basic Linear Algebra Subprograms and commonly known
                 as the BLAS.\par

                 Numerical linear algebra, particularly the solution of
                 linear systems of equations, linear least squares
                 problems, eigenvalue problems and singular value
                 problems, is fundamental to most calculations in
                 scientific computing, and is often the computationally
                 intense part of such calculations. Designers of
                 computer programs involving linear algebraic operations
                 have frequently chosen to implement certain low level
                 operations, such as the dot product or the matrix
                 vector product, as separate subprograms. This may be
                 observed both in many published codes and in codes
                 written for specific applications at many computer
                 installations.\par

                 A major aim of the standards defined in this paper is
                 to enable linear algebra libraries (both public domain
                 and commercial) to interoperate efficiently, reliably
                 and easily.",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ronald F. Boisvert and Jack J. Dongarra",
  title =        "Preface to the special issue on the {Basic Linear
                 Algebra Subprograms (BLAS)}",
  journal =      j-TOMS,
  volume =       "28",
  number =       "2",
  pages =        "133--134",
  month =        jun,
  year =         "2002",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Nov 9 11:16:50 MST 2002",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Thomas Bartol and Francine Berman
                 and Adam Birnbaum and Jack Dongarra and Mark Ellisman
                 and Marcio Faerman and Erhan Gockay and Michelle Miller
                 and Graziano Obertelli and Stuart Pomerantz and Terry
                 Sejnowski and Joel Stiles and Rich Wolski",
  title =        "The {Virtual Instrument}: Support for {Grid}-enabled
                 Scientific Simulations",
  journal =      j-PARALLEL-DIST-COMP-PRACT,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  month =        "????",
  year =         "2002",
  CODEN =        "????",
  ISSN =         "1097-2803",
  bibdate =      "Tue Jan 13 18:52:33 2004",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "PDCP: Parallel and Distributed Computing Practices",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Javier Cuenca and Domingo Gim{\'e}nez and Jos{\'e}
                 Gonz{\'a}lez and Jack Dongarra and Kenneth Roche",
  title =        "Automatic Optimisation of Parallel Linear Algebra
                 Routines in Systems with Variable Load",
  crossref =     "Monien:2002:EPP",
  pages =        "??--??",
  year =         "2002",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "High Performance Computing, Computational {Grid}, and
                 Numerical Libraries",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2474",
  pages =        "1--??",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Nov 30 20:57:35 MST 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Preface: {Basic Linear Algebra Subprograms Technical
                 (Blast) Forum Standard I}",
  journal =      j-IJHPCA,
  volume =       "16",
  number =       "1",
  pages =        "1--111",
  month =        "Spring",
  year =         "2002",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Nov 28 06:52:13 2003",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Preface: {Basic Linear Algebra Subprograms Technical
                 (Blast) Forum Standard II}",
  journal =      j-IJHPCA,
  volume =       "16",
  number =       "2",
  pages =        "115--115",
  month =        "Summer",
  year =         "2002",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Nov 28 06:52:13 2003",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software ({Linpack} Benchmark Report)",
  type =         "Technical report",
  number =       "CS-89-85",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "2002",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout",
  title =        "Self-adapting Numerical Software for Next Generation
                 Applications",
  type =         "LAPACK Working Note",
  number =       "157",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "2002",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-02-484, August 2002",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Jack Dongarra and Ian Foster and Geoffrey Fox and
                 William Gropp and Ken Kennedy and Linda Torczon and
                 Andy White",
  title =        "The Sourcebook of Parallel Computing",
  publisher =    pub-MORGAN-KAUFMANN,
  address =      pub-MORGAN-KAUFMANN:adr,
  pages =        "xvi + 842 + 8",
  year =         "2002",
  ISBN =         "1-55860-871-0",
  ISBN-13 =      "978-1-55860-871-9",
  LCCN =         "QA76.58 S638 2003",
  bibdate =      "Tue Jun 17 13:39:32 2003",
  bibsource =    "",
  price =        "US\$59.95",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "Trends in high performance computing and using
                 numerical libraries on clusters",
  crossref =     "Gropp:2002:PII",
  pages =        "172--172",
  year =         "2002",
  bibdate =      "Fri May 27 10:30:39 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "Three tools to help with cluster and grid computing:
                 {SANS-Effort}, {PAPI}, and {NetSolve}",
  crossref =     "IEEE:2002:CIA",
  pages =        "2--2",
  year =         "2002",
  DOI =          "",
  bibdate =      "Fri May 27 10:33:02 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Antonin Bukovsky and Sathish
                 Vadhiyar and Jack J. Dongarra",
  title =        "Fault Tolerant {MPI} for the {HARNESS MetaComputing}
                 System",
  type =         "Technical report",
  number =       "????",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  pages =        "14",
  year =         "2002",
  bibdate =      "Tue Jan 13 18:41:26 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Jack J. Dongarra",
  title =        "{HARNESS} Fault Tolerant {MPI} Design, Usage and
                 Performance Issues",
  type =         "Technical report",
  number =       "????",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "2002",
  bibdate =      "Tue Jan 13 18:42:49 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Jack J. Dongarra",
  title =        "{HARNESS} fault tolerant {MPI} design, usage and
                 performance issues",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "18",
  number =       "8",
  pages =        "1127--1142",
  month =        oct,
  year =         "2002",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Jan 10 10:03:29 MST 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Greg Henry and David Watkins and Jack Dongarra",
  title =        "A Parallel Implementation of the Nonsymmetric {$ Q R
                 $} Algorithm for Distributed Memory Architectures",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "24",
  number =       "1",
  pages =        "284--311",
  month =        jan,
  year =         "2002",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  bibdate =      "Tue Oct 22 18:24:38 MDT 2002",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "T. Hiroyasu and M. Miki and H. Shimosaka and Y.
                 Tanimura and J. Dongarra",
  editor =       "????",
  booktitle =    "The Japan Society of Mechanical Engineers, Kyoto
                 University, Kyoto, Japan, October 12--13, 2002",
  title =        "Optimization System Using {Grid RPC}",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2002",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 18:45:45 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "T. Hiroyasu and M. Miki and H. Shimosaka and M. Sano
                 and Y. Tanimura and Y. Mimura and S. Yoshimura and J.
                 Dongarra",
  editor =       "????",
  booktitle =    "The Japan Society of Mechanical Engineers, Kyoto
                 University, Kyoto, Japan, October 12--13, 2002",
  title =        "Truss Structural Optimization Using {NetSolve}
                 System",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2002",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 18:46:58 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ken Kennedy and Mark Mazina and John Mellor-Crummey
                 and Keith Cooper and Linda Torczon and Fran Berman and
                 Andrew Chien and Holly Dail and Otto Sievert and Dave
                 Angulo and Ian Foster and Dennis Gannon and Lennart
                 Johnsson and Carl Kesselman and Ruth Aydt and Daniel
                 Reed and Jack Dongarra and Sathish Vadhiyar and Rich
                 Wolski",
  title =        "Toward a Framework for Preparing and Executing
                 Adaptive Grid Programs",
  crossref =     "IEEE:2002:PIP",
  pages =        "??--??",
  year =         "2002",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  note =         "To appear.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "DongWoo Lee and Jack J. Dongarra and R. S.
                 Ramakrishna",
  title =        "{visPerf}: Monitoring Tool for {Grid} Computing",
  crossref =     "Parashar:2002:GCG",
  pages =        "??--??",
  year =         "2002",
  bibdate =      "Tue Jan 13 18:48:26 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Shirley Moore and A. J. Baker and Jack Dongarra and
                 Christian Halloy and Chung Ng",
  title =        "{Active Netlib}: An Active Mathematical Software
                 Collection for Inquiry-based Computational Science and
                 Engineering Education",
  journal =      j-J-DIGITAL-INFO,
  volume =       "2",
  number =       "4",
  pages =        "??--??",
  month =        may,
  year =         "2002",
  CODEN =        "????",
  ISSN =         "1368-7506",
  bibdate =      "Fri Sep 10 11:19:19 MDT 2010",
  bibsource =    ";
  URL =          ";
  abstract =     "The efficient application of scientific computing
                 techniques requires specialized knowledge of numerical
                 methods and their implementation in mathematical
                 software libraries that many students, scientists and
                 engineers, working beyond the already strenuous demands
                 of their particular field, must struggle to achieve.
                 Active Netlib addresses this problem by creating an
                 active collection of executable mathematical software
                 deployed on computational servers and accessible over
                 the network from familiar desktop client interfaces.
                 The Netlib mathematical software collection is being
                 extended in a number of ways to support this project.
                 The NetSolve client-server system provides an active
                 interface to the contents of Netlib by constructing
                 network-accessible objects with executable content from
                 the software packages in Netlib. The NetSolve adaptive
                 solver interface guides the user in selecting
                 appropriate software, in setting parameters correctly,
                 and in interpreting numerical results. In addition,
                 Active Netlib provides mechanisms that enable resource
                 users to become resource providers by dynamically
                 uploading and deploying their own software
                 applications, which are reviewed before becoming part
                 of the moderated publicly available collection. It is
                 hoped that Active Netlib will grow to be a worldwide
                 collection of executable mathematical software, as well
                 as scientific and engineering applications, that is
                 both drawn upon and contributed to by researchers,
                 educators and students.",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Digital Information",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Keith Moore and Jack Dongarra",
  title =        "{NetBuild}: transparent cross-platform access to
                 computational software libraries",
  journal =      j-CCPE,
  volume =       "14",
  number =       "13--15",
  pages =        "1445--1456",
  month =        nov # "\slash " # dec,
  year =         "2002",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Jan 13 09:28:02 MST 2004",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "6 Jan 2003",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hidemoto Nakada and Satoshi Matsuoka and Keith Seymour
                 and Jack Dongarra and Craig Lee and Henri Casanova",
  title =        "{GridRPC}: a Remote Procedure Call {API} for Grid
                 Computing",
  crossref =     "Parashar:2002:GCG",
  year =         "2002",
  bibdate =      "Tue Jan 13 18:49:43 2004",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Kenneth J. Roche and Jack J. Dongarra",
  title =        "Deploying Parallel Numerical Library Routines to
                 Cluster Computing in a Self Adapting Fashion",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  year =         "2002",
  CODEN =        "PACOEJ",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Jan 13 18:54:15 2004",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Keith Seymour and Hidemoto Nakada and Satoshi Matsuoka
                 and Jack Dongarra and Craig Lee and Henri Casanova",
  title =        "Overview of {GridRPC}: a Remote Procedure Call {API}
                 for {Grid} Computing",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2536",
  pages =        "274--??",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Nov 30 20:58:10 MST 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Jack J. Dongarra",
  title =        "A Metascheduler for the Grid",
  crossref =     "IEEE:2002:PFA",
  bookpages =    "viii + 99",
  pages =        "??--??",
  year =         "2002",
  bibdate =      "Tue Jan 13 18:55:39 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "S. S. Vadhiyar and J. J. Dongarra",
  title =        "A metascheduler for the {Grid}",
  crossref =     "IEEE:2002:HPI",
  pages =        "343--351",
  year =         "2002",
  DOI =          "",
  bibdate =      "Fri May 27 10:31:49 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Graham E. Fagg and Jack J.
                 Dongarra",
  title =        "Performance Modeling for Self Adapting Collective
                 Communications for {MPI}",
  crossref =     "Oldehoeft:2002:SIS",
  pages =        "??--??",
  year =         "2002",
  bibdate =      "Tue Feb 26 06:44:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "Los Alamos Computer Science Institute (LASCI)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxbooktitle =  "LACSI Symposium 2001, October 15--18, Eldorado Hotel,
                 Santa Fe, NM",

  author =       "Sathish S. Vadhiyar and J. Dongarra",
  title =        "A Performance Oriented Migration Framework for the
                 {Grid}",
  type =         "Technical report",
  number =       "????",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  pages =        "9",
  year =         "2002",
  bibdate =      "Tue Jan 13 18:44:33 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aad van der Steen and Jack Dongarra",
  title =        "Overview of High Performance Computers",
  crossref =     "Abello:2002:HMD",
  pages =        "??--??",
  year =         "2002",
  bibdate =      "Tue Feb 26 10:10:44 2002",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Asim YarKhan and Jack J. Dongarra",
  title =        "Experiments with Scheduling Using Simulated Annealing
                 in a {Grid} Environment",
  journal =      j-LECT-NOTES-COMP-SCI,
  volume =       "2536",
  pages =        "232--??",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Sat Nov 30 20:58:10 MST 2002",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Lecture Notes in Computer Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sudesh Agrawal and Jack Dongarra and Keith Seymour and
                 Sathish Vadhiyar",
  editor =       "Fran Berman and Geoffrey Fox and Anthony J. G. Hey",
  booktitle =    "{Grid} Computing: Making the Global Infrastructure a
                 Reality",
  title =        "{NetSolve}: Past, Present, and Future --- a Look at a
                 {Grid} Enabled Server",
  publisher =    pub-WILEY,
  address =      pub-WILEY:adr,
  bookpages =    "xlvi + 1012",
  pages =        "??--??",
  year =         "2003",
  ISBN =         "0-470-85319-0",
  ISBN-13 =      "978-0-470-85319-1",
  LCCN =         "QA76.9.C58 G755 2003",
  bibdate =      "Tue Jan 13 18:12:34 2004",
  bibsource =    "",
  series =       "Wiley series in communications networking and
                 distributed systems",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Micah Beck and Jack Dongarra and Victor Eijkhout and
                 Mike Langston and Terry Moore and Jim Plank",
  editor =       "????",
  booktitle =    "{DOE/NSF} Workshop on New Directions in Cyber-Security
                 in Large-Scale Networks: Deployment Obstacles, National
                 Conference Center, Lansdowne, Virginia, March, 2003",
  title =        "Scalable, Trustworthy Network Computing Using
                 Untrusted Intermediaries: a Position Paper",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2003",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 17:57:54 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Zizhong Chen and Jack Dongarra and Piotr Luszczek and
                 Kenneth Roche",
  title =        "Self Adapting Software for Numerical Linear Algebra
                 and {LAPACK} for Clusters",
  type =         "LAPACK Working Note",
  number =       "160",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jan,
  year =         "2003",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-03-499, January 2003. Submitted to Parallel
                 Computing.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Z. Z. Chen and J. Dongarra and P. Luszczek and K.
                 Roche",
  title =        "Self-adapting software for numerical linear algebra
                 and {LAPACK} for clusters",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "29",
  number =       "11--12",
  pages =        "1723--1743",
  month =        "????",
  year =         "2003",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Cuenca and D. Gimenez and J. Gonzalez and J.
                 Dongarra and K. Roche",
  title =        "Automatic optimisation of parallel linear algebra
                 routines in systems with variable load",
  crossref =     "Clematis:2003:EEC",
  pages =        "409--416",
  year =         "2003",
  DOI =          "",
  bibdate =      "Fri May 27 10:38:56 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Holly Dail and Otto Sievert and Fran Berman and Henri
                 Casanova and Asim YarKhan and Sathish Vadhiyar and Jack
                 Dongarra and Chuang Liu and Lingyun Yang and Dave
                 Angulo and Ian Foster",
  title =        "Scheduling in the Grid Application Development
                 Software Project",
  crossref =     "Nabrzyski:2003:GRM",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:17:07 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Kevin London and Shirley Moore and
                 Philip Mucci and Daniel Terpstra and Haihang You and
                 Min Zhou",
  title =        "Experiences and Lessons Learned with a Portable
                 Interface to Hardware Performance Counters",
  crossref =     "IEEE:2003:PIP",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:23:28 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxbooktitle =  "PADTAD workshop, IPDPS2003 meeting, Nice France, April
                 26, 2003",

  author =       "J. Dongarra and K. London and S. Moore and P. Mucci
                 and D. Terpstra and Haihang You and Min Zhou",
  title =        "Experiences and lessons learned with a portable
                 interface to hardware performance counters",
  crossref =     "IEEE:2003:IPD",
  year =         "2003",
  DOI =          "",
  bibdate =      "Fri May 27 10:33:59 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pagecount =    "6",

  author =       "Jack Dongarra and Victor Eijkhout",
  title =        "Finite-choice algorithm optimization in {Conjugate
                 Gradients}",
  type =         "LAPACK Working Note",
  number =       "159",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jan,
  year =         "2003",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-03-502, January 2003",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Piotr Luszczek and Antoine
                 Petitet",
  title =        "The {LINPACK Benchmark}: past, present and future",
  journal =      j-CCPE,
  volume =       "15",
  number =       "9",
  pages =        "803--820",
  day =          "10",
  month =        aug,
  year =         "2003",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Jan 13 09:28:12 MST 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "14 Jul 2003",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Preface",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "13",
  number =       "2",
  pages =        "93--??",
  month =        jun,
  year =         "2003",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  bibdate =      "Sat Nov 6 18:06:29 MST 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Allen Malony and Shirley Moore and
                 Philip Mucci and Sameer Shende",
  title =        "Performance Instrumentation and Measurement for
                 Terascale Systems",
  crossref =     "Sloot:2003:CSIb",
  pages =        "53--62",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:35:22 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxbooktitle =  "ICCS 2003 meeting, Terascale workshop",

  author =       "Jack Dongarra and Victor Eijkhout",
  title =        "Self-Adapting Numerical Software and Automatic Tuning
                 of Heuristics",
  crossref =     "Sloot:2003:CSIa",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:20:06 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout",
  title =        "Self-Adapting Numerical Software for Next Generation
                 Applications",
  journal =      j-IJHPCA,
  volume =       "17",
  number =       "2",
  pages =        "125--131",
  month =        "Summer",
  year =         "2003",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Nov 28 06:52:13 2003",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Thomas Eidson and Jack Dongarra and Victor Eijkhout",
  editor =       "????",
  booktitle =    "Proceedings. International Parallel and Distributed
                 Processing Symposium, 2003. 22--26 April 2003",
  title =        "Applying Aspect-Orient Programming Concepts to a
                 Component-based Programming Model",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2003",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 18:34:18 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "International Parallel and Distributed Processing
                 Symposium (IPDPS)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pagecount =    "7",
  xxbooktitle =  "IPDPS Workshop on NSF-Next Generation Software",

  author =       "Graham E. Fagg and Edgar Gabriel and Zizhong Chen and
                 Thara Angskun and George Bosilca and Antonin Bukovsky
                 and Jack J. Dongarra",
  editor =       "????",
  booktitle =    "{Los Alamos Computer Science Institute} Symposium,
                 {Santa Fe, NM, October 27--29, 2003}",
  title =        "Fault Tolerant Communication Library and Applications
                 for High Performance Computing",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2003",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 17:55:53 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. Fox and J. J. Dongarra and D. Arnold and H.
                 Casanova and Ann C. Catlin and T. Haupt and E. N.
                 Houstis and J. R. Rice",
  title =        "Problem solving environments",
  crossref =     "Dongarra:2003:SPC",
  pages =        "409--442",
  year =         "2003",
  bibdate =      "Sat Dec 29 18:28:39 2007",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Edgar Gabriel and Graham Fagg and Jack Dongarra",
  title =        "Evaluating the Performance of {MPI-2} Dynamic
                 Communicators and One-Sided Communication",
  crossref =     "Dongarra:2003:RAP",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:15:48 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Edgar Gabriel and Graham E. Fagg and Antonin Bukovsky
                 and Thara Angskun and Jack J. Dongarra",
  editor =       "????",
  booktitle =    "17th Annual {ACM} International Conference on
                 Supercomputing {(ICS'03)} International Workshop on
                 Grid Computing and e-Science, June 21, 2003, San
                 Francisco",
  title =        "A Fault-Tolerant Communication Library for {Grid}
                 Environments",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2003",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 18:14:32 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxcrossref =   "ACM:2003:CPI",

  author =       "Tomoyuki Hiroyasu and Mitsunori Miki and Shinya Ogura
                 and Keiko Aoi and Takeshi Yoshida and Yuko Okamoto and
                 Jack Dongarra",
  title =        "Energy Minimization of Protein Tertiary Structure by
                 Parallel Simulated Annealing using Genetic Crossover",
  journal =      "Journal of Genetic Programming and Evolvable
                 Machines",
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  month =        "????",
  year =         "2003",
  CODEN =        "????",
  ISSN =         "1389-2576",
  bibdate =      "Wed Jan 14 07:51:16 2004",
  bibsource =    "",
  note =         "Special Issue on Biological Applications of Genetic
                 and Evolutionary Computation",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxnote =       "Issue has not appeared up to volume 4 number 4
                 December 2003.",

  author =       "Tomoyuki Hiroyasu and Mitsunori Miki and Hisashi
                 Shimosaka and Jack Dongarra",
  title =        "Optimization Problem Solving System using {Grid RPC}",
  crossref =     "IEEE:2003:PCI",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:21:03 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Tomoyuki Hiroyasu and Mitsunori Miki and Kenzo Kodama
                 and Junichi Uekawa and Jack Dongarra",
  editor =       "????",
  booktitle =    "{ClusterWorld} Conference and Expo, San Jose,
                 California, June 24--26, 2003",
  title =        "A Simple Installation and Administration Tool for the
                 Large-scaled {PC} Cluster System",
  publisher =    "????",
  address =      "????",
  pages =        "??--??",
  year =         "2003",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 18:22:18 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dieter Kranzlm{\"u}ller and Peter Kacsuk and Jack
                 Dongarra and Jens Volkert",
  title =        "Recent Advances in {Parallel Virtual Machine} and
                 {Message Passing Interface} (Select papers from the
                 {EuroPVMMPI 2002 Conference})",
  journal =      j-IJHPCA,
  volume =       "17",
  number =       "1",
  pages =        "3--5",
  month =        "Spring",
  year =         "2003",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Nov 28 06:52:13 2003",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "DongWoo Lee and Jack J. Dongarra and R. S.
                 Ramakrishna",
  title =        "{visP$ \! $ erf}: Monitoring Tool for Grid Computing",
  crossref =     "Sloot:2003:CSIc",
  pages =        "233--243",
  year =         "2003",
  bibdate =      "Wed Nov 17 16:33:34 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James S. Plank and Micah Beck and Jack Dongarra and
                 Rich Wolski and Henri Casanova",
  title =        "Optimizing Performance and Reliability in Distributed
                 Computing Systems Through Wide Spectrum Storage",
  crossref =     "Gerndt:2003:PEI",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:24:42 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pagecount =    "8",

  author =       "Keith Seymour and Jack Dongarra",
  title =        "Automatic translation of {Fortran} to {JVM} bytecode",
  journal =      j-CCPE,
  volume =       "15",
  number =       "3--5",
  pages =        "207--222",
  month =        mar # "\slash " # apr,
  year =         "2003",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Jan 13 09:28:08 MST 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "12 Feb 2003",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish Vadhiyar and Jack Dongarra",
  title =        "{GrADSolve} --- {A} {Grid}-based {RPC} system for
                 Remote Invocation of Parallel Software",
  journal =      j-PARALLEL-DIST-COMP-PRACT,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  year =         "2003",
  CODEN =        "????",
  ISSN =         "1097-2803",
  bibdate =      "Tue Jan 13 18:29:45 2004",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "PDCP: Parallel and Distributed Computing Practices",
  keywords =     "GrADS (Grid Application Development Software)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish Vadhiyar and Jack Dongarra",
  title =        "{GrADSolve} --- {RPC} for High Performance Computing
                 on the {Grid}",
  crossref =     "Kosch:2003:EPP",
  pages =        "??--??",
  year =         "2003",
  bibdate =      "Tue Jan 13 18:31:06 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "GrADS (Grid Application Development Software)",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "S. S. Vadhiyar and J. J. Dongarra",
  title =        "A performance oriented migration framework for the
                 grid",
  crossref =     "IEEE:2003:CIA",
  pages =        "130--137",
  year =         "2003",
  DOI =          "",
  bibdate =      "Fri May 27 10:38:01 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish Vadhiyar and Jack Dongarra",
  title =        "Self Adaptability in Grid Computing",
  journal =      j-CCPE,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  month =        "????",
  year =         "2003",
  CODEN =        "CCPEBO",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Jan 13 18:31:58 2004",
  bibsource =    "",
  note =         "Submitted.",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Jack J. Dongarra",
  title =        "{SRS} --- {A} Framework for Developing Malleable and
                 Migratable Parallel Applications for Distributed
                 Systems",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "13",
  number =       "2",
  pages =        "291--??",
  month =        jun,
  year =         "2003",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  bibdate =      "Thu Jan 06 09:46:07 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. Abramson and J. Dongarra and E. Meek and P. Roe and
                 Zhiao Shi",
  title =        "Simplified grid computing through spreadsheets and
                 {NetSolve}",
  crossref =     "IEEE:2004:SIC",
  pages =        "19--24",
  year =         "2004",
  DOI =          "",
  bibdate =      "Fri May 27 10:42:55 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Micah Beck and Jack Dongarra and Jian Huang and Terry
                 Moore and James S. Plank",
  title =        "Active Logistical State Management in {GridSolve/L}",
  crossref =     "IEEE:2004:CII",
  pages =        "??--??",
  year =         "2004",
  bibdate =      "Tue Jan 13 17:53:10 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Henri Casanova and Francine Berman and Thomas Bartol
                 and Erhan Gokcay and Terry Sejnowski and Adam Birnbaum
                 and Jack Dongarra and Michelle Miller and Mark Ellisman
                 and Marcio Faerman and Graziano Obertelli and Rich
                 Wolski and Stuart Pomerantz and Joel Stiles",
  title =        "The {Virtual Instrument}: Support for {Grid}-Enabled
                 {Mcell} Simulations",
  journal =      j-IJHPCA,
  volume =       "18",
  number =       "1",
  pages =        "3--17",
  month =        feb,
  year =         "2004",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:44 MDT 2010",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Zizhong Chen and Jack Dongarra and Piotr Luszczek and
                 Kenneth Roche",
  title =        "The {LAPACK for Clusters Project}: An Example of Self
                 Adapting Numerical Software",
  crossref =     "Sprague:2004:PAH",
  pages =        "282--291",
  year =         "2004",
  bibdate =      "Fri May 27 10:43:51 2005",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "K. Cooper and A. Dasgupta and K. Kennedy and C.
                 Koelbel and A. Mandal and G. Marin and M. Mazina and J.
                 Mellor-Crummey and F. Berman and H. Casanova and A.
                 Chien and H. Dail and X. Liu and A. Olugbile and O.
                 Sievert and H. Xia and L. Johnsson and B. Liu and M.
                 Patel and D. Reed and W. Deng and C. Mendes and Z. Shi
                 and A. YarKhan and J. Dongarra",
  title =        "New grid scheduling and rescheduling methods in the
                 {GrADS} project",
  crossref =     "IEEE:2004:IPD",
  pages =        "199--??",
  year =         "2004",
  DOI =          "",
  bibdate =      "Fri May 27 10:40:46 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Shirley Moore and Phil Mucci and
                 Keith Seymour and Haihang You",
  title =        "Accurate Cache and {TLB} Characterization Using
                 Hardware Counters",
  crossref =     "Bubak:2004:CSIa",
  pages =        "??--??",
  year =         "2004",
  bibdate =      "Tue Jan 13 17:48:09 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxnote =       "Which of the four volumes did this appear in??",

  author =       "Jack J. Dongarra",
  title =        "Performance of Various Computers Using Standard Linear
                 Equations Software, ({Linpack} Benchmark Report)",
  type =         "Technical report",
  number =       "CS-89-85",
  institution =  inst-UTK,
  address =      inst-UTK:adr,
  year =         "2004",
  bibdate =      "Tue Jan 13 17:47:01 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and B. Tourancheau",
  title =        "Preface: Workshop on clusters and computational grids
                 for scientific computing",
  journal =      j-IJHPCA,
  volume =       "18",
  number =       "3",
  pages =        "283--283",
  month =        "Fall",
  year =         "2004",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Kaj Madsen and Jerzy
                 Wa{\'s}niewski",
  title =        "Selected numerical algorithms",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "20",
  number =       "3",
  pages =        "349--351",
  day =          "1",
  month =        apr,
  year =         "2004",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Fri Jul 15 08:00:44 MDT 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "The {Boole Lecture}: Trends in High Performance
                 Computing",
  journal =      j-COMP-J,
  volume =       "47",
  number =       "4",
  pages =        "399--403",
  month =        jul,
  year =         "2004",
  CODEN =        "CMPJA6",
  DOI =          "",
  ISSN =         "0010-4620 (print), 1460-2067 (electronic)",
  ISSN-L =       "0010-4620",
  bibdate =      "Tue Jun 8 12:55:15 MDT 2004",
  bibsource =    "",
  URL =          "",
  abstract =     "The Annual Boole Lecture was established and is
                 sponsored by the Boole Centre for Research in
                 Informatics, the Cork Constraint Computation Centre,
                 the Department of Computer Science, and the School of
                 Mathematics, Applied Mathematics and Statistics at
                 University College Cork. The series is named in honour
                 of George Boole, the first professor of Mathematics at
                 UCC, whose seminal work on logic in the late 1800s is
                 central to modern digital computing. To mark this great
                 contribution, leaders in the fields of computing and
                 mathematics are invited to talk to the general public
                 on directions in science, on past achievements and on
                 visions for the future.",
  acknowledgement = ack-nhfb,
  fjournal =     "The Computer Journal",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "T. Eidson and V. Eijkhout and J. Dongarra",
  title =        "Improvements in the efficient composition of
                 applications built using a component-based programming
                 environment",
  crossref =     "IEEE:2004:IPD",
  pages =        "198--198",
  year =         "2004",
  DOI =          "",
  bibdate =      "Fri May 27 10:41:51 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Jack J. Dongarra",
  title =        "Building and Using a Fault-Tolerant {MPI}
                 Implementation",
  journal =      j-IJHPCA,
  volume =       "18",
  number =       "3",
  pages =        "353--361",
  month =        "Fall",
  year =         "2004",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Kevin Heinrich and Michael W. Berry and Jack J.
                 Dongarra and Sathish Vadhiyar",
  title =        "The Semantic Conference Organizer",
  crossref =     "Bozdogan:2004:EMP",
  year =         "2004",
  bibdate =      "Tue Jan 13 18:36:14 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Piotr Luszczek and Jack Dongarra",
  title =        "Design of Interactive Environment for Numerically
                 Intensive Parallel Linear Algebra Calculations",
  crossref =     "Bubak:2004:CSIa",
  pages =        "??--??",
  year =         "2004",
  bibdate =      "Tue Jan 13 17:48:09 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxnote =       "Which of the four volumes did this appear in??",

  author =       "F. Song and F. Wolf and N. Bhatia and J. Dongarra and
                 S. Moore",
  title =        "An algebra for cross-experiment performance analysis",
  crossref =     "Eigenmann:2004:IIC",
  pages =        "63--72",
  year =         "2004",
  bibdate =      "Fri May 27 10:15:33 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Y. Tanimura and K. Aoi and T. Hiroyasu and M. Miki and
                 Y. Okamoto and J. Dongarra",
  title =        "Implementation of protein tertiary structure
                 prediction system with {NetSolve}",
  crossref =     "IEEE:2004:SIC",
  pages =        "320--327",
  year =         "2004",
  DOI =          "",
  bibdate =      "Fri May 27 10:39:52 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Jack J. Dongarra",
  title =        "{GrADSolve} --- a grid-based {RPC} system for parallel
                 computing with application-level scheduling",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "64",
  number =       "6",
  pages =        "774--783",
  month =        jun,
  year =         "2004",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Sat Dec 4 15:15:09 MST 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Graham E. Fagg and Jack J.
                 Dongarra",
  title =        "Towards an Accurate Model for Collective
                 Communications",
  journal =      j-IJHPCA,
  volume =       "18",
  number =       "1",
  pages =        "159--167",
  month =        feb,
  year =         "2004",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:44 MDT 2010",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Asim YarKhan and Jack Dongarra",
  title =        "Biological Sequence Alignment on the {Computational
                 Grid} Using the {Grads Framework}",
  journal =      j-J-GRID-COMP,
  volume =       "1",
  number =       "1",
  pages =        "??--??",
  month =        "????",
  year =         "2004",
  ISSN =         "1570-7873 (print), 1572-9184 (electronic)",
  ISSN-L =       "1570-7873",
  bibdate =      "Tue Jan 13 17:59:18 2004",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Grid Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "M. Beck and J. Dongarra and J. S. Plank",
  title =        "{NetSolve/D}: a Massively Parallel Grid Execution
                 System for Scalable Data Intensive Collaboration",
  crossref =     "IEEE:2005:IPD",
  pages =        "223a--223a",
  year =         "2005",
  bibdate =      "Fri May 27 10:12:14 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "F. Berman and H. Casanova and A. Chien and K. Cooper
                 and H. Dail and A. Dasgupta and W. Deng and J. Dongarra
                 and L. Johnsson and K. Kennedy and C. Koelbel and B.
                 Liu and X. Liu and A. Mandal and G. Marin and M. Mazina
                 and J. Mellor-Crummey and C. Mendes and A. Olugbile and
                 M. Patel and D. Reed and Z. Shi and O. Sievert and H.
                 Xia and A. YarKhan",
  title =        "New {Grid} Scheduling and Rescheduling Methods in the
                 {GrADS Project}",
  journal =      j-INT-J-PARALLEL-PROG,
  volume =       "33",
  number =       "2--3",
  pages =        "209--229",
  month =        jun,
  year =         "2005",
  CODEN =        "IJPPE5",
  DOI =          "",
  ISSN =         "0885-7458 (print), 1573-7640 (electronic)",
  ISSN-L =       "0885-7458",
  bibdate =      "Wed Jul 9 16:05:27 MDT 2008",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Parallel Programming",
  journal-URL =  "",
  keywords =     "Grid computing; rescheduling; scheduling",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Zizhong Chen and Jack J. Dongarra",
  title =        "Condition Numbers of {Gaussian} Random Matrices",
  journal =      j-SIAM-J-MAT-ANA-APPL,
  volume =       "27",
  number =       "3",
  pages =        "603--620",
  month =        jul,
  year =         "2005",
  CODEN =        "SJMAEL",
  DOI =          "",
  ISSN =         "0895-4798 (print), 1095-7162 (electronic)",
  ISSN-L =       "0895-4798",
  bibdate =      "Thu Dec 29 16:33:57 MST 2005",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Matrix Analysis and Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jim Demmel and Jack Dongarra",
  title =        "{LAPACK 2005} Prospectus: Reliable and Scalable
                 Software for Linear Algebra Computations on High End
                 Computers",
  type =         "LAPACK Working Note",
  number =       "164",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        feb,
  year =         "2005",
  bibdate =      "Fri Apr 22 17:06:37 2005",
  bibsource =    "",
  note =         "UT-CS-05-546, February 2005.",
  URL =          ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Demmel and J. Dongarra and V. Eijkhout and E.
                 Fuentes and A. Petitet and R. Vuduc and R. C. Whaley
                 and K. Yelick",
  title =        "Self-adapting linear algebra algorithms and software",
  journal =      j-PROC-IEEE,
  volume =       "93",
  number =       "2",
  pages =        "293--312",
  month =        feb,
  year =         "2005",
  CODEN =        "IEEPAD",
  DOI =          "",
  ISSN =         "0018-9219 (print), 1558-2256 (electronic)",
  ISSN-L =       "0018-9219",
  bibdate =      "Fri May 27 10:03:49 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Proceedings of the IEEE",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Thomas Sterling and Horst Simon and
                 Erich Strohmaier",
  title =        "High-Performance Computing: Clusters, Constellations,
                 {MPPs}, and Future Directions",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "7",
  number =       "2",
  pages =        "51--59",
  month =        mar # "\slash " # apr,
  year =         "2005",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Sat May 14 13:11:45 MDT 2005",
  bibsource =    ";
  URL =          ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Victor Eijkhout and Erika Fuentes and Thomas Eidson
                 and Jack Dongarra",
  title =        "The Component Structure of a Self-Adapting Numerical
                 Software System",
  journal =      j-INT-J-PARALLEL-PROG,
  volume =       "33",
  number =       "2--3",
  pages =        "137--143",
  month =        jun,
  year =         "2005",
  CODEN =        "IJPPE5",
  DOI =          "",
  ISSN =         "0885-7458 (print), 1573-7640 (electronic)",
  ISSN-L =       "0885-7458",
  bibdate =      "Wed Jul 9 16:05:27 MDT 2008",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Parallel Programming",
  journal-URL =  "",
  keywords =     "adaptive systems; component frameworks; Linear system
                 solving",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Graham E. Fagg and Edgar Gabriel and Zizhong Chen and
                 Thara Angskun and George Bosilca and Jelena
                 Pjesivac-Grbovic and Jack J. Dongarra",
  title =        "Process Fault Tolerance: Semantics, Design and
                 Applications for High Performance Computing",
  journal =      j-IJHPCA,
  volume =       "19",
  number =       "4",
  pages =        "465--477",
  month =        "Winter",
  year =         "2005",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Edgar Gabriel and Graham E. Fagg and Jack J.
                 Dongarra",
  title =        "Evaluating Dynamic Communicators and One-Sided
                 Operations for Current {MPI} Libraries",
  journal =      j-IJHPCA,
  volume =       "19",
  number =       "1",
  pages =        "67--79",
  month =        "Spring",
  year =         "2005",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dieter Kranzlm{\"u}ller and Peter Kacsuk and Jack
                 Dongarra",
  title =        "Recent Advances in {Parallel Virtual Machine} and
                 {Message Passing Interface}",
  journal =      j-IJHPCA,
  volume =       "19",
  number =       "2",
  pages =        "99--101",
  month =        "Summer",
  year =         "2005",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. M. F. Moura and M. Puschel and D. Padua and J.
                 Dongarra",
  title =        "Scanning the Issue: Special Issue on Program
                 Generation, Optimization, and Platform Adaptation",
  journal =      j-PROC-IEEE,
  volume =       "93",
  number =       "2",
  pages =        "211--215",
  month =        feb,
  year =         "2005",
  CODEN =        "IEEPAD",
  DOI =          "",
  ISSN =         "0018-9219 (print), 1558-2256 (electronic)",
  ISSN-L =       "0018-9219",
  bibdate =      "Fri May 27 10:04:59 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Proceedings of the IEEE",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Manish Parashar and Rajeev Muralidhar and Wonsuck Lee
                 and Dorian Arnold and Jack Dongarra and Mary Wheeler",
  title =        "Enabling interactive and collaborative oil reservoir
                 simulations on the {Grid}",
  journal =      j-CCPE,
  volume =       "17",
  number =       "11",
  pages =        "1387--1414",
  month =        sep,
  year =         "2005",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Sat May 14 11:30:58 MDT 2005",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "8 Apr 2005",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Pjesivac-Grbovic and T. Angskun and G. Bosilca and
                 G. E. Fagg and E. Gabriel and J. J. Dongarra",
  title =        "Performance Analysis of {MPI} Collective Operations",
  crossref =     "IEEE:2005:IPD",
  pages =        "272a--272a",
  year =         "2005",
  bibdate =      "Fri May 27 10:13:34 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Erich Strohmaier and Jack J. Dongarra and Hans W.
                 Meuer and Horst D. Simon",
  title =        "Recent trends in the marketplace of high performance
                 computing",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "31",
  number =       "3--4",
  pages =        "261--273",
  month =        mar # "\slash " # apr,
  year =         "2005",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Thu Sep 2 17:51:03 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sathish S. Vadhiyar and Jack J. Dongarra",
  title =        "Self adaptivity in {Grid} computing",
  journal =      j-CCPE,
  volume =       "17",
  number =       "2--4",
  pages =        "235--257",
  month =        feb # "\slash " # apr,
  year =         "2005",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Sat May 14 11:30:56 MDT 2005",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "7 Feb 2005",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Asim YarKhan and Jack J. Dongarra",
  title =        "Biological sequence alignment on the computational
                 grid using the {GrADS} framework",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "21",
  number =       "6",
  pages =        "980--986",
  month =        jun,
  year =         "2005",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Fri Jul 15 08:00:46 MDT 2005",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Alfredo Buttari and Jack J. Dongarra and Jakub Kurzak
                 and Piotr Luszczek and Stanimire Tomov",
  title =        "Using Mixed Precision for Sparse Matrix Computations
                 to Enhance the Performance while Achieving 64-bit
                 Accuracy",
  type =         "LAPACK Working Note",
  number =       "180",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "22",
  month =        oct,
  year =         "2006",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "By using a combination of 32-bit and 64-bit floating
                 point arithmetic the performance of many sparse linear
                 algebra algorithms can be significantly enhanced while
                 maintaining the 64-bit accuracy of the resulting
                 solution. These ideas can be applied to sparse
                 multifrontal and supernodal direct techniques, and
                 sparse iterative techniques such as Krylov subspace
                 methods. The approach presented here can apply not only
                 to conventional processors but also to exotic
                 technologies such as Field Programmable Gate Arrays
                 (FPGA), Graphical Processing Units (GPU), and the Cell
                 BE processor.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-06-584",

  author =       "J. Dongarra and G. Bosilca and Z. Chen and V. Eijkhout
                 and G. E. Fagg and E. Fuentes and J. Langou and P.
                 Luszczek and J. Pjesivac-Grbovic and K. Seymour and H.
                 You and S. S. Vadhiyar",
  title =        "{Self-Adapting Numerical Software} ({SANS}) effort",
  journal =      j-IBM-JRD,
  volume =       "50",
  number =       "2/3",
  pages =        "223--238",
  month =        mar # " \slash " # may,
  year =         "2006",
  CODEN =        "IBMJAE",
  ISSN =         "0018-8646 (print), 2151-8556 (electronic)",
  ISSN-L =       "0018-8646",
  bibdate =      "Fri Feb 9 20:16:31 MST 2007",
  bibsource =    ";
  URL =          "",
  abstract =     "The challenge for the development of next-generation
                 software is the successful management of the complex
                 computational environment while delivering to the
                 scientist the full power of flexible compositions of
                 the available algorithmic alternatives. Self-adapting
                 numerical software (SANS) systems are intended to meet
                 this significant challenge. The process of arriving at
                 an efficient numerical solution of problems in
                 computational science involves numerous decisions by a
                 numerical expert. Attempts to automate such decisions
                 distinguish three levels: algorithmic decision,
                 management of the parallel environment, and
                 processor-specific tuning of kernels. Additionally, at
                 any of these levels we can decide to rearrange the
                 user's data. In this paper we look at a number of
                 efforts at the University of Tennessee to investigate
                 these areas.",
  acknowledgement = ack-nhfb,
  fjournal =     "IBM Journal of Research and Development",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  ordernumber =  "G322-0247-00",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Special Issue on Tools in the {ACTS Collection 2004}",
  journal =      j-IJHPCA,
  volume =       "20",
  number =       "3",
  pages =        "317--317",
  month =        "Fall",
  year =         "2006",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra",
  title =        "Trends in high-performance computing",
  journal =      "IEEE Circuits \& Devices",
  volume =       "22",
  number =       "1",
  pages =        "22--27",
  month =        "????",
  year =         "2006",
  DOI =          "",
  ISSN =         "8755-3996",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Nahid Emad and S.-A. Shahzadeh-Fazeli and Jack
                 Dongarra",
  title =        "An asynchronous algorithm on the {NetSolve} global
                 computing system",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "22",
  number =       "3",
  pages =        "279--290",
  month =        feb,
  year =         "2006",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Sep 11 13:08:05 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Jack Dongarra",
  title =        "Implementing Linear Algebra Routines on Multi-Core
                 Processors with Pipelining and a Look Ahead",
  type =         "LAPACK Working Note",
  number =       "178",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  pages =        "11",
  month =        sep,
  year =         "2006",
  bibdate =      "Mon Oct 09 12:05:43 2006",
  bibsource =    "",
  note =         "Also available as UT-CS-06-581.",
  URL =          ";
  abstract =     "Linear algebra algorithms commonly encapsulate
                 parallelism in Basic Linear Algebra Subroutines (BLAS).
                 This solution relies on the fork-join model of parallel
                 execution, which may result in suboptimal performance
                 on current and future generations of multi-core
                 processors. To overcome the shortcomings of this
                 approach a pipelined model of parallel execution is
                 presented, and the idea of the look ahead is utilized
                 in order to suppress the negative effects of sequential
                 formulation of the algorithms. Application to one-sided
                 matrix factorizations, LU, Cholesky and QR, is
                 described. Shared memory implementation using POSIX
                 threads is presented.",
  acknowledgement = ack-nhfb,
  keywords =     "linear algebra; look ahead; multi-core processors;
                 pipelining",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Jack Dongarra",
  title =        "Implementation of the Mixed-Precision High Performance
                 {LINPACK} Benchmark on the {CELL Processor}",
  type =         "LAPACK Working Note",
  number =       "177",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  pages =        "12",
  month =        sep,
  year =         "2006",
  bibdate =      "Mon Oct 09 12:05:43 2006",
  bibsource =    "",
  note =         "Also available as UT-CS-06-580.",
  URL =          ";
  abstract =     "This paper describes the design concepts behind
                 implementations of mixed-precision linear algebra
                 routines targeted for the Cell processor. It describes
                 in detail the implementation of code to solve linear
                 system of equations using Gaussian elimination in
                 single precision with iterative refinement of the
                 solution to the full double precision accuracy. By
                 utilizing this approach the algorithm achieves close to
                 an order of magnitude higher performance on the Cell
                 processor than the performance offered by the standard
                 double precision algorithm. Effectively the code is an
                 implementation of the high performance LINPACK
                 benchmark, since it meets all the requirements
                 concerning the problem being solved and the numerical
                 properties of the solution.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Julie Langou and Julien Langou and Piotr Luszczek and
                 Jakub Kurzak and Alfredo Buttari and Jack Dongarra",
  title =        "Exploiting the Performance of 32 bit Floating Point
                 Arithmetic in Obtaining 64 bit Accuracy (Revisiting
                 Iterative Refinement for Linear Systems)",
  type =         "LAPACK Working Note",
  number =       "175",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  pages =        "17",
  month =        jun,
  year =         "2006",
  bibdate =      "Mon Oct 09 12:05:43 2006",
  bibsource =    "",
  URL =          ";
  abstract =     "Recent versions of microprocessors exhibit performance
                 characteristics for 32 bit floating point arithmetic
                 (single precision) that is substantially higher than 64
                 bit floating point arithmetic (double precision).
                 Examples include the Intel's Pentium IV and M
                 processors, AMD's Opteron architectures and the IBM's
                 Cell Broad Engine processor. When working in single
                 precision, floating point operations can be performed
                 up to two times faster on the Pentium and up to ten
                 times faster on the Cell over double precision. The
                 performance enhancements in these architectures are
                 derived by accessing extensions to the basic
                 architecture, such as SSE2 in the case of the Pentium
                 and the vector functions on the IBM Cell. The
                 motivation for this paper is to exploit single
                 precision operations whenever possible and resort to
                 double precision at critical stages while attempting to
                 provide the full double precision results. The results
                 described here are fairly general and can be applied to
                 various problems in linear algebra such as solving
                 large sparse systems, using direct or iterative methods
                 and some eigenvalue problems. There are limitations to
                 the success of this process, such as when the
                 conditioning of the problem exceeds the reciprocal of
                 the accuracy of the single precision computations. In
                 that case the double precision algorithm should be
                 used.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Julie Langou and Julien Langou and Piotr Luszczek and
                 Jakub Kurzak and Alfredo Buttari and Jack Dongarra",
  title =        "Exploiting the performance of 32 bit floating point
                 arithmetic in obtaining 64 bit accuracy (revisiting
                 iterative refinement for linear systems)",
  crossref =     "ACM:2006:SCH",
  pages =        "??--??",
  year =         "2006",
  DOI =          "",
  bibdate =      "Thu Nov 08 20:00:17 2007",
  bibsource =    "",
  abstract =     "Recent versions of microprocessors exhibit performance
                 characteristics for 32 bit floating point arithmetic
                 (single precision) that is substantially higher than 64
                 bit floating point arithmetic (double precision).
                 Examples include the Intel's Pentium IV and M
                 processors, AMD's Opteron architectures and the IBM's
                 Cell Broad Engine processor. When working in single
                 precision, floating point operations can be performed
                 up to two times faster on the Pentium and up to ten
                 times faster on the Cell over double precision. The
                 performance enhancements in these architectures are
                 derived by accessing extensions to the basic
                 architecture, such as SSE2 in the case of the Pentium
                 and the vector functions on the IBM Cell. The
                 motivation for this paper is to exploit single
                 precision operations whenever possible and resort to
                 double precision at critical stages while attempting to
                 provide the full double precision results. The results
                 described here are fairly general and can be applied to
                 various problems in linear algebra such as solving
                 large sparse systems, using direct or iterative methods
                 and some eigenvalue problems. There are limitations to
                 the success of this process, such as when the
                 conditioning of the problem exceeds the reciprocal of
                 the accuracy of the single precision computations. In
                 that case the double precision algorithm should be
                 used.",
  acknowledgement = ack-nhfb,
  articleno =    "113",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Zhiao Shi and Jack J. Dongarra",
  title =        "Scheduling workflow applications on processors with
                 different capabilities",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "22",
  number =       "6",
  pages =        "665--675",
  month =        may,
  year =         "2006",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Sep 11 13:08:06 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Asim YarKhan and Keith Seymour and Kiran Sagi and
                 Zhiao Shi and Jack Dongarra",
  title =        "Recent Developments in {GridSolve}",
  journal =      j-IJHPCA,
  volume =       "20",
  number =       "1",
  pages =        "131--141",
  month =        "Spring",
  year =         "2006",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Jack J. Dongarra and Serge Gratton
                 and Julien Langou",
  title =        "Computing the Conditioning of the Components of a
                 Linear Least Squares Solution",
  type =         "LAPACK Working Note",
  number =       "193",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        sep,
  year =         "2007",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we address the accuracy of the results
                 for the overdetermined full rank linear least squares
                 problem. We recall theoretical results obtained in [2]
                 on conditioning of the least squares solution and the
                 components of the solution when the matrix
                 perturbations are measured in Frobenius or spectral
                 norms. Then we define computable estimates for these
                 condition numbers and we interpret them in terms of
                 statistical quantities. In particular, we show that, in
                 the classical linear statistical model, the ratio of
                 the variance of one component of the solution by the
                 variance of the right-hand side is exactly the
                 condition number of this solution component when
                 perturbations on the right-hand side are considered. We
                 also provide fragment codes using LAPACK [1] routines
                 to compute the variance-covariance matrix and the least
                 squares conditioning and we give the corresponding
                 computational cost. Finally we present a small
                 historical numerical example that was used by Laplace
                 [19] for computing the mass of Jupiter and experiments
                 from the space industry with real physical data.",
  acknowledgement = ack-nhfb,
  keywords =     "condition number; LAPACK; Linear least squares;
                 parameter estimation; ScaLAPACK; statistical linear
                 least squares; variance-covariance matrix",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-07-604",

  author =       "Alfredo Buttari and Julien Langou and Jakub Kurzak and
                 Jack J. Dongarra",
  title =        "A Class of Parallel Tiled Linear Algebra Algorithms
                 for Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "191",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        sep,
  year =         "2007",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "As multicore systems continue to gain ground in the
                 High Performance Computing world, linear algebra
                 algorithms have to be reformulated or new algorithms
                 have to be developed in order to take advantage of the
                 architectural features on these new processors. Fine
                 grain parallelism becomes a major requirement and
                 introduces the necessity of loose synchronization in
                 the parallel execution of an operation. This paper
                 presents an algorithm for the Cholesky, LU and QR
                 factorization where the operations can be represented
                 as a sequence of small tasks that operate on square
                 blocks of data. These tasks can be dynamically
                 scheduled for execution based on the dependencies among
                 them and on the availability of computational
                 resources. This may result in an out of order execution
                 of the tasks which will completely hide the presence of
                 intrinsically sequential tasks in the factorization.
                 Performance comparisons are presented with the LAPACK
                 algorithms where parallelism can only be exploited at
                 the level of the BLAS operations and vendor
                 implementations.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-07-600",

  author =       "Alfredo Buttari and Jack J. Dongarra and Jakub
                 Kurzak",
  title =        "Limitations of the {PlayStation 3} for High
                 Performance Cluster Computing",
  type =         "LAPACK Working Note",
  number =       "185",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "2007",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-07-597",

  author =       "Alfredo Buttari and Jack Dongarra and Julie Langou and
                 Julien Langou and Piotr Luszczek and Jakub Kurzak",
  title =        "Mixed Precision Iterative Refinement Techniques for
                 the Solution of Dense Linear Systems",
  journal =      j-IJHPCA,
  volume =       "21",
  number =       "4",
  pages =        "457--466",
  month =        nov,
  year =         "2007",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Alfredo Buttari and Julien Langou and Jakub Kurzak and
                 Jack J. Dongarra",
  title =        "Parallel Tiled {$ Q R $} Factorization for Multicore
                 Architectures",
  type =         "LAPACK Working Note",
  number =       "190",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jul,
  year =         "2007",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  note =         "Published in \cite{Buttari:2008:PTF}.",
  URL =          "",
  abstract =     "As multicore systems continue to gain ground in the
                 High Performance Computing world, linear algebra
                 algorithms have to be reformulated or new algorithms
                 have to be developed in order to take advantage of the
                 architectural features on these new processors. Fine
                 grain parallelism becomes a major requirement and
                 introduces the necessity of loose synchronization in
                 the parallel execution of an operation. This paper
                 presents an algorithm for the QR factorization where
                 the operations can be represented as a sequence of
                 small tasks that operate on square blocks of data.
                 These tasks can be dynamically scheduled for execution
                 based on the dependencies among them and on the
                 availability of computational resources. This may
                 result in an out of order execution of the tasks which
                 will completely hide the presence of intrinsically
                 sequential tasks in the factorization. Performance
                 comparisons are presented with the LAPACK algorithm for
                 QR factorization where parallelism can only be
                 exploited at the level of the BLAS operations.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-07-598",

  author =       "James W. Demmel and Jack J. Dongarra and Beresford N.
                 Parlett and William Kahan and Ming Gu and David S.
                 Bindel and Yozo Hida and Xiaoye S. Li and Osni A.
                 Marques and E. Jason Riedy and Christof V{\"o}mel and
                 Julien Langou and Piotr Luszczek and Jakub Kurzak and
                 Alfredo Buttari and Julie Langou and Stanimire Tomov",
  title =        "Prospectus for the Next {LAPACK} and {ScaLAPACK}
                 Libraries",
  type =         "LAPACK Working Note",
  number =       "181",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "11",
  month =        mar,
  year =         "2007",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-07-592",

  author =       "Beniamino {Di Martino} and Dieter Kranzlm{\"u}ller and
                 Jack Dongarra",
  title =        "Special issue on selected papers from the
                 {EuroPVM\slash MPI 2005 Conference, Sorrento, Italy,
                 18--21 September 2005} --- Preface",
  journal =      j-IJHPCA,
  volume =       "21",
  number =       "2",
  pages =        "129--131",
  month =        "Summer",
  year =         "2007",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Victor Eijkhout and Julien Langou",
  title =        "{BLAS}",
  crossref =     "Hogben:2007:HLA",
  pages =        "??--??",
  year =         "2007",
  bibdate =      "Mon Aug 23 08:59:55 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Piotr Luszczek",
  title =        "How Elegant Code Evolves With Hardware: The Case of
                 {Gaussian} Elimination",
  crossref =     "Oram:2007:BC",
  chapter =      "14",
  pages =        "229--252",
  year =         "2007",
  bibdate =      "Sat Nov 07 16:28:35 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Emmanuel Jeannot and Keith Seymour and Asym Yarkhan
                 and Jack J. Dongarra",
  title =        "Improved Runtime and Transfer Time Prediction
                 Mechanisms in a Network Enabled Servers Middleware",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "17",
  number =       "1",
  pages =        "47--59",
  month =        mar,
  year =         "2007",
  CODEN =        "PPLTEE",
  DOI =          "",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  MRnumber =     "2364277",
  bibdate =      "Mon Aug 23 18:27:04 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Jack Dongarra",
  title =        "Implementation of mixed precision in solving systems
                 of linear equations on the {Cell} processor",
  journal =      j-CCPE,
  volume =       "19",
  number =       "10",
  pages =        "1371--1385",
  month =        jul,
  year =         "2007",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Dec 5 10:08:14 MST 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "9 Jan 2007",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Alfredo Buttari and Jack J.
                 Dongarra",
  title =        "Solving Systems of Linear Equations on the {CELL}
                 Processor Using {Cholesky} Factorization",
  type =         "LAPACK Working Note",
  number =       "184",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "2007",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "The STI CELL processor introduces pioneering solutions
                 in processor architecture. At the same time it presents
                 new challenges for the development of numerical
                 algorithms. One is effective exploitation of the
                 differential between the speed of single and double
                 precision arithmetic; the other is efficient
                 parallelization between the short vector SIMD cores. In
                 this work, the first challenge is addressed by
                 utilizing a mixed-precision algorithm for the solution
                 of a dense symmetric positive definite system of linear
                 equations, which delivers double precision accuracy,
                 while performing the bulk of the work in single
                 precision. The second challenge is approached by
                 introducing much finer granularity of parallelization
                 than has been used for other architectures and using a
                 lightweight decentralized synchronization. The
                 implementation of the computationally intensive
                 sections gets within 90 percent of peak floating point
                 performance, while the implementation of the memory
                 intensive sections reaches within 90 percent of peak
                 memory bandwidth. On a single CELL processor, the
                 algorithm achieves over 170 Gflop/s when solving a
                 symmetric positive definite system of linear equation
                 in single precision and over 150 Gflop/s when
                 delivering the result in double precision accuracy.",
  acknowledgement = ack-nhfb,
  keywords =     "CELL BE; Cholesky factorization; iterative refinement;
                 mixed-precision algorithms",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-07-596",

  author =       "J. Langou and Z. Chen and G. Bosilca and J. Dongarra",
  title =        "Recovery Patterns for Iterative Methods in a Parallel
                 Unstable Environment",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "30",
  number =       "1",
  pages =        "102--116",
  year =         "2007",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F10 (68W10)",
  MRnumber =     "MR2377433 (2009b:65083)",
  MRreviewer =   "Olexander S. Babanin",
  bibdate =      "Wed May 19 10:43:59 MDT 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Piotr Luszczek and Jack Dongarra",
  title =        "High Performance Development for High End Computing
                 With {Python Language Wrapper (PLW)}",
  journal =      j-IJHPCA,
  volume =       "21",
  number =       "3",
  pages =        "360--369",
  month =        aug,
  year =         "2007",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Beniamino {Di Martino} and Dieter Kranzlm{\"u}ller and
                 Jack Dongarra",
  title =        "Preface",
  journal =      j-IJHPCA,
  volume =       "21",
  number =       "2",
  pages =        "129--131",
  month =        may,
  year =         "2007",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Bernd Mohr and Jesper Larsson Traff and Joachim
                 Worringen and Jack Dongarra",
  title =        "Selected papers from {EuroPVM\slash MPI 2006}",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "33",
  number =       "9",
  pages =        "593--594",
  month =        "????",
  year =         "2007",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jelena Pje{\v{s}}ivac-Grbovi{\'c} and George Bosilca
                 and Graham E. Fagg and Thara Angskun and Jack J.
                 Dongarra",
  title =        "{MPI} collective algorithm selection and quadtree
                 encoding",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "33",
  number =       "9",
  pages =        "613--623",
  month =        sep,
  year =         "2007",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Thu Sep 2 17:51:07 MDT 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jelena Pjesivac-Grbovic and Thara Angskun and George
                 Bosilca and Graham E. Fagg and Edgar Gabriel and Jack
                 J. Dongarra",
  title =        "Performance analysis of {MPI} collective operations",
  journal =      "The Journal of Networks, Software Tools, and Cluster
                 Computing",
  volume =       "10",
  number =       "2",
  pages =        "127--143",
  month =        "????",
  year =         "2007",
  DOI =          "",
  ISSN =         "1386-7857",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classification = "Denver, CO",
  conference-date = "Apr 03--08, 2005",
  conference-name = "4th International Workshop on Performance
                 Modelling, Evaluation, and Optimization of Parallel and
                 Distributed Systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Christof V{\"o}mel and Stanimire Z. Tomov and Lin-Wang
                 Wang and Osni A. Marques and Jack J. Dongarra",
  title =        "The use of bulk states to accelerate the band edge
                 state calculation of a semiconductor quantum dot",
  journal =      j-J-COMPUT-PHYS,
  volume =       "223",
  number =       "2",
  pages =        "774--782",
  day =          "1",
  month =        may,
  year =         "2007",
  CODEN =        "JCTPAH",
  DOI =          "",
  ISSN =         "0021-9991 (print), 1090-2716 (electronic)",
  ISSN-L =       "0021-9991",
  bibdate =      "Mon Jan 2 22:13:32 MST 2012",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Computational Physics",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jerzy Wa{\'s}niewski and Jack Dongarra and Kaj Madsen
                 and Sivan Toledo and Zahari Zlatev",
  title =        "Editorial introduction to the special issue on
                 computational linear algebra and sparse matrix
                 computations",
  volume =       "18",
  number =       "3",
  pages =        "205--207",
  year =         "2007",
  CODEN =        "AAECEW",
  DOI =          "",
  ISSN =         "0938-1279 (print), 1432-0622 (electronic)",
  ISSN-L =       "0938-1279",
  MRclass =      "15-06 (65-06)",
  MRnumber =     "2357727",
  bibdate =      "Mon Aug 23 18:27:26 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Applicable Algebra in Engineering, Communication and
                 Computing",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Felix Wolf and Bernd Mohr and Jack Dongarra and
                 Shirley Moore",
  title =        "Automatic analysis of inefficiency patterns in
                 parallel applications",
  journal =      j-CCPE,
  volume =       "19",
  number =       "11",
  pages =        "1481--1496",
  day =          "10",
  month =        aug,
  year =         "2007",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Dec 5 10:08:15 MST 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "24 Oct 2006",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Wesley Alvaro and Jakub Kurzak and Jack J. Dongarra",
  title =        "Fast and Small Short Vector {SIMD} Matrix
                 Multiplication Kernels for the {CELL} Processor",
  type =         "LAPACK Working Note",
  number =       "189",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jan,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "Matrix multiplication is one of the most common
                 numerical operations, especially in the area of dense
                 linear algebra, where it forms the core of many
                 important algorithms, including solvers of linear
                 systems of equations, least square problems, and
                 singular and eigenvalue computations. The STI CELL
                 processor exceeds the capabilities of any other
                 processor available today in terms of peak single
                 precision, floating point performance. In order to
                 fully exploit the potential of the CELL processor for a
                 wide range of numerical algorithms, fast implementation
                 of the matrix multiplication operation is essential.
                 The crucial component is the matrix multiplication
                 kernel crafted for the short vector Single Instruction
                 Multiple Data architecture of the Synergistic
                 Processing Element of the CELL processor. In this
                 paper, single precision matrix multiplication kernels
                 are presented implementing the {$ C = C - A \times B T
                 $} operation and the {$ C = C - A \times B $} operation
                 for matrices of size $ 64 \times 64 $ elements. For the
                 latter case, the performance of 25.55 Gflop/s is
                 reported, or 99.80 percent of the peak, using as little
                 as 5.9 KB of storage for code and auxiliary data
                 structures.",
  acknowledgement = ack-nhfb,
  keywords =     "CELL BE; matrix multiplication; SGEMM; short vector
                 SIMD; SPE",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-609",

  author =       "Marc Baboulin and Jack J. Dongarra and Stanimire
                 Tomov",
  title =        "Some Issues in Dense Linear Algebra for Multicore and
                 Special Purpose Architectures",
  type =         "LAPACK Working Note",
  number =       "200",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "We address some key issues in designing dense linear
                 algebra (DLA) algorithms that are common for both
                 multi/many-cores and special purpose architectures (in
                 particular GPUs). We present them in the context of an
                 LU factorization algorithm, where randomization
                 techniques are used as an alternative to pivoting. This
                 approach yields an algorithm based entirely on a
                 collection of small Level 3 BLAS type computational
                 tasks, which has emerged as a common goal in designing
                 DLA algorithms for new architectures. Other common
                 trends, also considered here, are block asynchronous
                 task execution and ``Block'' layouts for the data
                 associated with the separate tasks. We present
                 numerical results and other specific experiments with
                 DLA algorithms on NVIDIA GPUs using CUDA. The GPU
                 results are also of interest themselves as we show a
                 performance of up to 160 Gflop/s on a single Quadro FX
                 5600 card. Keywords: dense linear algebra, parallel
                 algorithms, LU factorization, multicore processors,
                 graphic process units.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-615",

  author =       "George Bosilca and Remi Delmas and Jack J. Dongarra
                 and Julien Langou",
  title =        "Algorithmic Based Fault Tolerance Applied to High
                 Performance Computing",
  type =         "LAPACK Working Note",
  number =       "205",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "23",
  month =        may,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "We present a new approach to fault tolerance for High
                 Performance Computing system. Our approach is based on
                 a careful adaptation of the Algorithmic Based Fault
                 Tolerance technique (Huang and Abraham, 1984) to the
                 need of parallel distributed computation. We obtain a
                 strongly scalable mechanism for fault tolerance. We can
                 also detect and correct errors (bit-flip) on the fly of
                 a computation. To assess the viability of our approach,
                 we have developed a fault tolerant matrix-matrix
                 multiplication subroutine and we propose some models to
                 predict its running time. Our parallel fault-tolerant
                 matrix-matrix multiplication scores 1.4 TFLOPS on 484
                 processors (cluster {\tt jacquard.nersc.gov}) and
                 returns a correct result while one process failure has
                 happened. This represents 65\% of the machine peak
                 efficiency and less than 12\% overhead with respect to
                 the fastest failure-free implementation. We predict
                 (and have observed) that, as we increase the processor
                 count, the overhead of the fault tolerance drops
                 significantly.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-620",

  author =       "Alfredo Buttari and Julien Langou and Jakub Kurzak and
                 Jack Dongarra",
  title =        "Parallel Tiled {$ Q R $} Factorization for Multicore
                 Architectures",
  journal =      j-CCPE,
  volume =       "20",
  number =       "13",
  pages =        "1573--1590",
  month =        SEP,
  year =         "2008",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "Journal publication of LAWN 190.",

  author =       "Alfredo Buttari and Julien Langou and Jakub Kurzak and
                 Jack Dongarra",
  title =        "Parallel tiled {QR} factorization for multicore
                 architectures",
  journal =      j-CCPE,
  volume =       "20",
  number =       "13",
  pages =        "1573--1590",
  day =          "10",
  month =        sep,
  year =         "2008",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Dec 5 10:08:26 MST 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "3 Jun 2008",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Alfredo Buttari and Jack Dongarra and Jakub Kurzak and
                 Piotr Luszczek and Stanimir Tomov",
  title =        "Using Mixed Precision for Sparse Matrix Computations
                 to Enhance the Performance while Achieving 64-bit
                 Accuracy",
  journal =      j-TOMS,
  volume =       "34",
  number =       "4",
  pages =        "17:1--17:22",
  month =        jul,
  year =         "2008",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65L50 (65F05 65F10 65G50)",
  MRnumber =     "MR2474523 (2009m:65120)",
  bibdate =      "Wed Jul 16 11:30:01 MDT 2008",
  bibsource =    "",
  abstract =     "By using a combination of 32-bit and 64-bit floating
                 point arithmetic, the performance of many sparse linear
                 algebra algorithms can be significantly enhanced while
                 maintaining the 64-bit accuracy of the resulting
                 solution. These ideas can be applied to sparse
                 multifrontal and supernodal direct techniques and
                 sparse iterative techniques such as Krylov subspace
                 methods. The approach presented here can apply not only
                 to conventional processors but also to exotic
                 technologies such as Field Programmable Gate Arrays
                 (FPGA), Graphical Processing Units (GPU), and the Cell
                 BE processor.",
  acknowledgement = ack-nhfb,
  articleno =    "17",
  fjournal =     "Association for Computing Machinery. Transactions on
                 Mathematical Software",
  journal-URL =  "",
  keywords =     "floating point; iterative refinement; linear systems;
                 precision",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Zizhong Chen and Jack Dongarra",
  title =        "Algorithm-Based Fault Tolerance for Fail-Stop
                 Failures",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "19",
  number =       "12",
  pages =        "1628--1641",
  month =        dec,
  year =         "2008",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu May 13 12:06:56 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Beniamino {Di Martino} and Dieter Kranzlm{\"u}ller and
                 Jack Dongarra",
  title =        "Special section: Grid computing and the message
                 passing interface",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "24",
  number =       "2",
  pages =        "119--120",
  month =        "????",
  year =         "2008",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ivan Dimov and Jack Dongarra and Kaj Madsen and Jerzy
                 Wasniewski and Zahari Zlatev",
  title =        "Special section: Applications of distributed and grid
                 computing",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "24",
  number =       "6",
  pages =        "582--584",
  month =        jun,
  year =         "2008",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Sep 11 13:08:12 MDT 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Thomas Haigh",
  title =        "Biographies",
  journal =      j-IEEE-ANN-HIST-COMPUT,
  volume =       "30",
  number =       "2",
  pages =        "74--81",
  month =        apr # "\slash " # jun,
  year =         "2008",
  CODEN =        "IAHCEX",
  DOI =          "",
  ISSN =         "1058-6180 (print), 1934-1547 (electronic)",
  ISSN-L =       "1058-6180",
  bibdate =      "Thu Jul 3 10:46:12 MDT 2008",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Annals of the History of Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Jean-Fran{\c{c}}ois Pineau and Yves
                 Robert and Fr{\'e}d{\'e}ric Vivien",
  editor =       "{ACM}",
  title =        "Matrix Product on Heterogeneous Master--Worker
                 Platforms",
  crossref =     "Chatterjee:2008:PPA",
  pages =        "53--62",
  year =         "2008",
  bibdate =      "Sat Dec 02 07:09:03 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Gene H. Golub and Eric Grosse and
                 Cleve Moler and Keith Moore",
  title =        "{Netlib} and {NA-Net}: Building a Scientific Computing
                 Community",
  journal =      j-IEEE-ANN-HIST-COMPUT,
  volume =       "30",
  number =       "2",
  pages =        "30--41",
  month =        apr # "\slash " # jun,
  year =         "2008",
  CODEN =        "IAHCEX",
  DOI =          "",
  ISSN =         "1058-6180 (print), 1934-1547 (electronic)",
  ISSN-L =       "1058-6180",
  bibdate =      "Thu Jul 3 10:46:12 MDT 2008",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Annals of the History of Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "Gene H. Golub, (Deceased 16 November 2007).",

  author =       "Jack J. Dongarra and Julien Langou",
  title =        "The Problem with the {Linpack} Benchmark Matrix
                 Generator",
  type =         "LAPACK Working Note",
  number =       "206",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "12",
  month =        jun,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  note =         "Version 1; version 2 is dated 18 September 2008.",
  URL =          "",
  abstract =     "We characterize the matrix sizes for which the Linpack
                 Benchmark 1.0 matrix generator constructs a matrix with
                 identical columns.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  ucdenvernumber = "UCD-CCM-271",

  author =       "Jack Dongarra and Jean-Fran{\c{c}}ois Pineau and Yves
                 Robert and Zhiao Shi and Fr{\'e}d{\'e}ric Vivien",
  title =        "Revisiting Matrix Product on Master-Worker Platforms",
  journal =      j-INT-J-FOUND-COMP-SCI,
  volume =       "19",
  number =       "6",
  pages =        "1317--1336",
  month =        dec,
  year =         "2008",
  CODEN =        "IFCSEN",
  DOI =          "",
  ISSN =         "0129-0541 (print), 1793-6373 (electronic)",
  ISSN-L =       "0129-0541",
  MRclass =      "65F30",
  MRnumber =     "MR2484316 (2009m:65073)",
  bibdate =      "Tue Aug 31 07:37:14 MDT 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Foundations of Computer
                 Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Special section: Cluster and computational grids for
                 scientific computing",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "24",
  number =       "1",
  pages =        "30--30",
  month =        jan,
  year =         "2008",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Sep 11 13:08:10 MDT 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fred G. Gustavson and Jerzy Wasniewski and Jack
                 J. Dongarra",
  title =        "Level-3 {Cholesky} kernel subroutine of a fully
                 portable High Performance minimal storage hybrid format
                 {Cholesky} algorithm",
  type =         "LAPACK Working Note",
  number =       "211",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        dec,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-634",

  author =       "Fred G. Gustavson and Jerzy Wasniewski and Jack J.
                 Dongarra and Julien Langou",
  title =        "Rectangular Full Packed Format for {Cholesky}'s
                 Algorithm: Factorization, Solution and Inversion",
  type =         "LAPACK Working Note",
  number =       "199",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        apr,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "We describe a new data format for storing triangular,
                 symmetric, and Hermitian matrices called RFPF
                 (Rectangular Full Packed Format). The standard two
                 dimensional arrays of Fortran and C (also known as full
                 format) that are used to represent triangular and
                 symmetric matrices waste nearly half of the storage
                 space but provide high performance via the use of Level
                 3 BLAS. Standard packed format arrays fully utilize
                 storage (array space) but provide low performance as
                 there is no Level 3 packed BLAS. We combine the good
                 features of packed and full storage using RFPF to
                 obtain high performance via using Level 3 BLAS as RFPF
                 is a standard full format representation. Also, RFPF
                 requires exactly the same minimal storage as packed
                 format. Each LAPACK full and/or packed triangular,
                 symmetric, and Hermitian routine becomes a single new
                 RFPF routine based on eight possible data layouts of
                 RFPF. This new RFPF routine usually consists of two
                 calls to the corresponding LAPACK full format routine
                 and two calls to Level 3 BLAS routines. This means no
                 new software is required. As examples, we present
                 LAPACK routines for Cholesky factorization, Cholesky
                 solution and Cholesky inverse computation in RFPF to
                 illustrate this new work and to describe its
                 performance on several commonly used computer
                 platforms. Performance of LAPACK full routines using
                 RFPF versus LAPACK full routines using standard format
                 for both serial and SMP parallel processing is about
                 the same while using half the storage. Performance
                 gains are roughly one to a factor of 43 for serial and
                 one to a factor of 97 for SMP parallel times faster
                 using vendor LAPACK full routines with RFPF than with
                 using vendor and/or reference packed routines.",
  acknowledgement = ack-nhfb,
  keywords =     "Algorithms; BLAS; Linear Algebra Libraries;
                 Performance",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "G.1.3 [Numerical Analysis]: Numerical Linear Algebra -
                 Linear Systems (symmetric and Hermitian); G.4
                 [Mathematics of Computing]: Mathematical Software",
  utknumber =    "UT-CS-08-614",

  author =       "Jakub Kurzak and Jack J. Dongarra",
  title =        "{$ Q R $} Factorization for the {CELL} Processor",
  type =         "LAPACK Working Note",
  number =       "201",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "The QR factorization is one of the most important
                 operations in dense linear algebra, offering a
                 numerically stable method for solving linear systems of
                 equations including overdetermined and underdetermined
                 systems. Classic implementation of the QR factorization
                 suffers from performance limitations due to the use of
                 matrix-vector type operations in the phase of panel
                 factorization. These limitations can be remedied by
                 using the idea of updating of QR factorization,
                 rendering an algorithm, which is much more scalable and
                 much more suitable for implementation on a multi-core
                 processor. It is demonstrated how the potential of the
                 CELL processor can be utilized to the fullest by
                 employing the new algorithmic approach and successfully
                 exploiting the capabilities of the CELL processor in
                 terms of Instruction Level Parallelism and Thread-Level
  acknowledgement = ack-nhfb,
  keywords =     "CELL processor; linear algebra; matrix factorization;
                 multi-core; numerical algorithms",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-616",

  author =       "Jakub Kurzak and Alfredo Buttari and Piotr Luszczek
                 and Jack Dongarra",
  title =        "The {PlayStation 3} for High-Performance Scientific
  journal =      j-COMPUT-SCI-ENG,
  volume =       "10",
  number =       "3",
  pages =        "84--87",
  month =        may # "\slash " # jun,
  year =         "2008",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Thu Jul 3 11:24:19 MDT 2008",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Alfredo Buttari and Jack Dongarra",
  title =        "Solving Systems of Linear Equations on the {CELL}
                 Processor Using {Cholesky} Factorization",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "19",
  number =       "9",
  pages =        "1175--1186",
  month =        sep,
  year =         "2008",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu May 13 12:06:56 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hatem Ltaief and Jakub Kurzak and Jack Dongarra",
  title =        "Parallel Block {Hessenberg} Reduction using
                 Algorithms-By-Tiles for Multicore Architectures
  type =         "LAPACK Working Note",
  number =       "208",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        aug,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "The objective of this paper is to extend and redesign
                 the block matrix reduction applied for the family of
                 two-sided factorizations, introduced by Dongarra et al.
                 [9], to the context of multicore architectures using
                 algorithms-by-tiles. In particular, the Block
                 Hessenberg Reduction is very often used as a
                 pre-processing step in solving dense linear algebra
                 problems, such as the standard eigenvalue problem.
                 Although expensive, orthogonal transformations are
                 commonly used for this reduction because they guarantee
                 stability, as opposed to Gaussian Elimination. Two
                 versions of the Block Hessenberg Reduction are
                 presented in this paper, the first one with Householder
                 reflectors and the second one with Givens rotations. A
                 short investigation on variants of Fast Givens
                 Rotations is also mentioned. Furthermore, in the last
                 Top500 list from June 2008, 98\% of the fastest
                 parallel systems in the world are based on multicores.
                 The emerging petascale systems consisting of hundreds
                 of thousands of cores have exacerbated the problem even
                 more and it becomes judicious to efficiently integrate
                 existing or new numerical linear algebra algorithms
                 suitable for such hardwares. By exploiting the concepts
                 of algorithms-by-tiles in the multicore environment
                 (i.e., high level of parallelism with fine granularity
                 and high performance data representation combined with
                 a dynamic data driven execution), the Block Hessenberg
                 Reduction presented here achieves 72\% of the DGEMM
                 peak on a $ 12000 \times 12000 $ matrix with 16 Intel
                 Tigerton 2.4 GHz processors.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-624",

  author =       "Hatem Ltaief and Jakub Kurzak and Jack Dongarra",
  title =        "Parallel Band Two-Sided Matrix Bidiagonalization for
                 Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "209",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "The objective of this paper is to extend, in the
                 context of multicore architectures, the concepts of
                 algorithms-by-tiles [Buttari et al., 2007] for
                 Cholesky, LU, QR factorizations to the family of
                 two-sided factorizations. In particular, the bidiagonal
                 reduction of a general, dense matrix is very often used
                 as a pre-processing step for calculating the singular
                 value decomposition. Furthermore, in the last Top500
                 list from June 2008, 98\% of the fastest parallel
                 systems in the world were based on multicores. The
                 manycore trend has increasingly exacerbated the
                 problem, and it becomes critical to efficiently
                 integrate existing or new numerical linear algebra
                 algorithms suitable for such hardware. By exploiting
                 the concept of algorithms-by-tiles in the multicore
                 environment (i.e., high level of parallelism with fine
                 granularity and high performance data representation
                 combined with a dynamic data driven execution), the
                 band bidiagonal reduction presented here achieves 94
                 Gflop/s on a $ 12000 \times 12000 $ matrix with 16 Intel
                 Tigerton 2.4 GHz processors.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-631",

  author =       "Beniamino {Di Martino} and Dieter Kranzlm{\"u}ller and
                 Jack Dongarra",
  title =        "Special section: {Grid} computing and the {Message
                 Passing Interface}",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "24",
  number =       "2",
  pages =        "119--120",
  month =        feb,
  year =         "2008",
  CODEN =        "FGSEVI",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Sep 11 13:08:11 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Stanimire Tomov and Jack Dongarra and Marc Baboulin",
  title =        "Towards Dense Linear Algebra for Hybrid {GPU}
                 Accelerated Manycore Systems",
  type =         "LAPACK Working Note",
  number =       "210",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "2008",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "If multicore is a disruptive technology, try to
                 imagine hybrid multicore systems enhanced with
                 accelerators! This is happening today as accelerators,
                 in particular Graphics Processing Units (GPUs), are
                 steadily making their way into the high performance
                 computing (HPC) world. We highlight the trends leading
                 to the idea of hybrid manycore/GPU systems, and we
                 present a set of techniques that can be used to
                 efficiently program them. The presentation is in the
                 context of Dense Linear Algebra (DLA), a major building
                 block for many scientific computing applications. We
                 motivate the need for new algorithms that would split
                 the computation in a way that would fully exploit the
                 power that each of the hybrid components offers. As the
                 area of hybrid multicore/GPU computing is still in its
                 infancy, we also argue for its importance in view of
                 what future architectures may look like. We therefore
                 envision the need for a DLA library similar to LAPACK
                 but for hybrid manycore/GPU systems. We illustrate the
                 main ideas with an LU-factorization algorithm where
                 particular techniques are used to reduce the amount of
                 pivoting, resulting in an algorithm achieving up to 388
                 GFlop/s for single and up to 99.4 GFlop/s for double
                 precision factorization on a hybrid Intel Xeon (2x4
                 cores @ 2.33 GHz) --- NVIDIA GeForce GTX 280 (240
                 cores @ 1.30 GHz) system.",
  acknowledgement = ack-nhfb,
  keywords =     "dense linear algebra; graphics processing units;
                 hybrid computing; LU factorization; multicore
                 processors; parallel algorithms",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-08-632",

  author =       "Christof V{\"o}mel and Stanimire Z. Tomov and Osni A.
                 Marques and A. Canning and Lin-Wang Wang and Jack J.
                 Dongarra",
  title =        "State-of-the-art eigensolvers for electronic structure
                 calculations of large scale nano-systems",
  journal =      j-J-COMPUT-PHYS,
  volume =       "227",
  number =       "15",
  pages =        "7113--7124",
  year =         "2008",
  CODEN =        "JCTPAH",
  DOI =          "",
  ISSN =         "0021-9991 (print), 1090-2716 (electronic)",
  ISSN-L =       "0021-9991",
  bibdate =      "Sat Dec 31 18:11:58 2011",
  bibsource =    ";
  ZMnumber =     "1141.82346",
  abstract =     "The band edge states determine optical and electronic
                 properties of semiconductor nano-structures which can
                 be computed from an interior eigenproblem. We study the
                 reliability and performance of state-of-the-art
                 iterative eigensolvers on large quantum dots and wires,
                 focusing on variants of preconditioned CG, Lanczos, and
                 Davidson methods. One Davidson variant, the {$ G D + k
                 $} (Olsen) method, is identified to be as reliable as
                 the commonly used preconditioned CG while consistently
                 being between two and three times faster.",
  acknowledgement = ack-nhfb,
  classmath =    "*82D37 (Semiconductors) 65F15 (Eigenvalues (numerical
                 linear algebra))",
  fjournal =     "Journal of Computational Physics",
  journal-URL =  "",
  keywords =     "computational nano-technology; Davidson's method;
                 electronic structure; implicitly restarted Arnoldi;
                 preconditioned conjugate gradients",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Emmanuel Agullo and Bilel Hadri and Hatem Ltaief and
                 Jack Dongarra",
  title =        "Comparative Study of One-Sided Factorizations with
                 Multiple Software Packages on Multi-Core Hardware",
  type =         "LAPACK Working Note",
  number =       "217",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "28",
  month =        apr,
  year =         "2009",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-640.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Alfredo Buttari and Jack Dongarra
                 and Jakub Kurzak and Julie Langou and Julien Langou and
                 Piotr Luszczek and Stanimire Tomov",
  title =        "Accelerating scientific computations with mixed
                 precision algorithms",
  journal =      j-COMP-PHYS-COMM,
  volume =       "180",
  number =       "12",
  pages =        "2526--2533",
  month =        dec,
  year =         "2009",
  CODEN =        "CPHCBZ",
  DOI =          "",
  ISSN =         "0010-4655 (print), 1879-2944 (electronic)",
  ISSN-L =       "0010-4655",
  bibdate =      "Mon Feb 13 23:42:47 MST 2012",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computer Physics Communications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Jack Dongarra and Serge Gratton and
                 Julien Langou",
  title =        "Computing the conditioning of the components of a
                 linear least-squares solution",
  journal =      j-NUM-LIN-ALG-APPL,
  volume =       "16",
  number =       "7",
  pages =        "517--533",
  year =         "2009",
  CODEN =        "NLAAEM",
  DOI =          "",
  ISSN =         "1070-5325 (print), 1099-1506 (electronic)",
  ISSN-L =       "1070-5325",
  MRclass =      "65F20 (62J05 65F35)",
  MRnumber =     "MR2537606 (2010f:65089)",
  MRreviewer =   "Ninoslav Truhar",
  bibdate =      "Sat Aug 21 14:31:35 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Numerical Linear Algebra with Applications",
  journal-URL =  "",
  onlinedate =   "26 Nov 2008",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and R{\'e}mi Delmas and Jack Dongarra
                 and Julien Langou",
  title =        "Algorithm-based fault tolerance applied to high
                 performance computing",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "69",
  number =       "4",
  pages =        "410--416",
  month =        apr,
  year =         "2009",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Wed Sep 1 16:27:24 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Alfredo Buttari and Julien Langou and Jakub Kurzak and
                 Jack Dongarra",
  title =        "A class of parallel tiled linear algebra algorithms
                 for multicore architectures",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "35",
  number =       "1",
  pages =        "38--53",
  month =        jan,
  year =         "2009",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65Y05 (65F99)",
  MRnumber =     "MR2492567 (2010c:65265)",
  bibdate =      "Thu Sep 2 17:51:10 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing. Systems \& Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Franck Cappello and Thomas Herault and Jack Dongarra",
  title =        "Foreword [Special issue: selected papers from the
                 {14th European PVM\slash MPI Users Group Meeting,
                 Paris, September 30--October 3, 2007}]",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "35",
  number =       "12",
  pages =        "571--571",
  month =        dec,
  year =         "2009",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "68-06 (68M10 68M12)",
  MRnumber =     "MR2596831",
  bibdate =      "Sat Sep 4 17:11:07 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing. Systems \& Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Zizhong Chen and J. Dongarra",
  title =        "Highly Scalable Self-Healing Algorithms for High
                 Performance Scientific Computing",
  journal =      j-IEEE-TRANS-COMPUT,
  volume =       "58",
  number =       "11",
  pages =        "1512--1524",
  month =        nov,
  year =         "2009",
  CODEN =        "ITCOB4",
  DOI =          "",
  ISSN =         "0018-9340 (print), 1557-9956 (electronic)",
  ISSN-L =       "0018-9340",
  MRnumber =     "2751573",
  bibdate =      "Mon Jul 4 11:37:44 MDT 2011",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Computers",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Editorial",
  journal =      j-IJHPCA,
  volume =       "23",
  number =       "3",
  pages =        "195--195",
  month =        aug,
  year =         "2009",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Guest editor's note: special issue on clusters and
                 computational grids for scientific computing",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "19",
  number =       "3",
  pages =        "379",
  year =         "2009",
  CODEN =        "PPLTEE",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  MRnumber =     "2750909",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Pete Beckman and Patrick Aerts and
                 Frank Cappello and Thomas Lippert and Satoshi Matsuoka
                 and Paul Messina and Terry Moore and Rick Stevens and
                 Anne Trefethen and Mateo Valero",
  title =        "The {International Exascale Software Project}: a Call
                 To Cooperative Action By the Global High-Performance
  journal =      j-IJHPCA,
  volume =       "23",
  number =       "4",
  pages =        "309--322",
  month =        nov,
  year =         "2009",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Julien Langou",
  title =        "The Problem With the {LINPACK Benchmark 1.0 Matrix
  journal =      j-IJHPCA,
  volume =       "23",
  number =       "1",
  pages =        "5--13",
  month =        feb,
  year =         "2009",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Aug 31 09:59:45 MDT 2010",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Bilel Hadri and Hatem Ltaief and Emmanuel Agullo and
                 Jack Dongarra",
  title =        "Enhancing Parallelism of Tile {$ Q R $} Factorization
                 for Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "222",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "4",
  month =        sep,
  year =         "2009",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-645.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Jack Dongarra",
  title =        "{$ Q R $} factorization for the {Cell Broadband
  journal =      j-SCI-PROG,
  volume =       "17",
  number =       "1--2",
  pages =        "31--42",
  month =        "????",
  year =         "2009",
  CODEN =        "SCIPEV",
  DOI =          "",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Wed Sep 1 14:50:29 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Jack Dongarra",
  title =        "Fully Dynamic Scheduler for Numerical Computing on
                 Multicore Processors",
  type =         "LAPACK Working Note",
  number =       "220",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "4",
  month =        jun,
  year =         "2009",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-643.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Wesley Alvaro and Jack Dongarra",
  title =        "Optimizing matrix multiplication for a short-vector
                 {SIMD} architecture --- {CELL} processor",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "35",
  number =       "3",
  pages =        "138--150",
  month =        mar,
  year =         "2009",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Thu Sep 2 17:51:10 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Hatem Ltaief and Jack Dongarra and
                 Rosa M. Badia",
  title =        "Scheduling Linear Algebra Operations on Multicore
  type =         "LAPACK Working Note",
  number =       "213",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        feb,
  year =         "2009",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "We present performance results for dense linear
                 algebra using the 8-series NVIDIA GPUs. Our
                 matrix-matrix multiply routine (GEMM) runs 60\% faster
                 than the vendor implementation in CUBLAS 1.1 and
                 approaches the peak of hardware capabilities. Our LU,
                 QR and Cholesky factorizations achieve up to 80--90\%
                 of the peak GEMM rate. Our parallel LU running on two
                 GPUs achieves up to $ \approx $300 Gflop/s. These
                 results are accomplished by challenging the accepted
                 view of the GPU architecture and
                 programming guidelines. We argue that modern GPUs
                 should be viewed as multithreaded multicore vector
                 units. We exploit blocking similarly to vector
                 computers and heterogeneity of the system by computing
                 both on GPU and CPU. This study includes detailed
                 benchmarking of the GPU memory system that reveals
                 sizes and latencies of caches and TLB. We present a
                 couple of algorithmic optimizations aimed at increasing
                 parallelism and regularity in the problem that provide
                 us with slightly higher performance.",
  acknowledgement = ack-nhfb,
  keywords =     "Cholesky; factorization; linear algebra; LU;
                 multicore; QR; scheduling; task graph",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-09-636",

  author =       "Jakub Kurzak and Hatem Ltaief and Jack Dongarra",
  title =        "Scheduling Two-sided Transformations using
                 Algorithms-by-Tiles on Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "214",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        feb,
  year =         "2009",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "The objective of this paper is to describe, in the
                 context of multicore architectures, different scheduler
                 implementations for the two-sided linear algebra
                 transformations, in particular the Hessenberg and
                 Bidiagonal reductions which are the first steps for the
                 standard eigenvalue problems and the singular value
                 decompositions respectively. State-of-the-art dense
                 linear algebra softwares, such as the LAPACK and
                 ScaLAPACK libraries, suffer performance losses on
                 multicore processors due to their inability to fully
                 exploit thread-level parallelism. At the same time the
                 coarse-grain dataflow model gains popularity as a
                 paradigm for programming multicore architectures. By
                 using the concepts of algorithms-by-tiles [Buttari et
                 al., 2007] along with efficient mechanisms for
                 data-driven execution, these two-sided reductions
                 achieve high performance computing. The main drawback
                 of the algorithms-by-tiles approach for two-sided
                 transformations is that the full reduction can not be
                 obtained in one stage. Other methods have to be
                 considered to further reduce the band matrices to the
                 required forms.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-09-637",

  author =       "Alexey Lastovetsky and J. J. Dongarra",
  title =        "High-Performance Heterogeneous Computing",
  publisher =    pub-WILEY,
  address =      pub-WILEY:adr,
  pages =        "xii + 267 + 2",
  year =         "2009",
  ISBN =         "0-470-04039-4 (cloth)",
  ISBN-13 =      "978-0-470-04039-3 (cloth)",
  LCCN =         "QA76.88 .L38 2009",
  bibdate =      "Fri Mar 26 11:41:01 MDT 2010",
  bibsource =    ";
  series =       "Wiley series on parallel and distributed computing",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "High performance computing; Heterogeneous computing;
                 Computer networks",

  author =       "Yinan Li and Jack Dongarra and Stanimire Tomov",
  title =        "A Note on Auto-tuning {GEMM} for {GPUs}",
  type =         "LAPACK Working Note",
  number =       "212",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jan,
  year =         "2009",
  bibdate =      "Fri Apr 24 12:25:43 2009",
  bibsource =    "",
  URL =          "",
  abstract =     "The development of high performance dense linear
                 algebra (DLA) critically depends on highly optimized
                 BLAS, and especially on the matrix multiplication
                 routine (GEMM). This is especially true for Graphics
                 Processing Units (GPUs), as evidenced by recently
                 published results on DLA for GPUs that rely on highly
                 optimized GEMM [13, 11]. However, the current best GEMM
                 performance, e.g. of up to 375 GFlop/s in single
                 precision and of up to 75 GFlop/s in double precision
                 arithmetic on NVIDIA's GTX 280, is difficult to
                 achieve. The development involves extensive GPU
                 knowledge and even backward engineering to understand
                 some undocumented insides about the architecture that
                 have been of key importance in the development [12]. In
                 this paper, we describe some GPU GEMM auto-tuning
                 optimization techniques that allow us to keep up with
                 changing hardware by rapidly reusing, rather than
                 reinventing, the existing ideas. Auto-tuning, as we
                 show in this paper, is a very practical solution where
                 in addition to getting an easy portability, we can
                 often get substantial speedups even on current GPUs
                 (e.g. up to 27\% in certain cases for both single and
                 double precision GEMMs on the GTX 280).",
  acknowledgement = ack-nhfb,
  keywords =     "Auto-tuning; dense linear algebra; GPUs; matrix
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  utknumber =    "UT-CS-09-635",

  author =       "Hatem Ltaief and Stanimire Tomov and Rajib Nath and
                 Peng Du and Jack Dongarra",
  title =        "A Scalable High Performant {Cholesky} Factorization
                 for Multicore with {GPU} Accelerators",
  type =         "LAPACK Working Note",
  number =       "223",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "25",
  month =        nov,
  year =         "2009",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-646.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fengguang Song and Asim YarKhan and Jack Dongarra",
  title =        "Dynamic Task Scheduling for Linear Algebra Algorithms
                 on Distributed-Memory Multicore Systems",
  type =         "LAPACK Working Note",
  number =       "221",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "13",
  month =        apr,
  year =         "2009",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-638.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Stanimire Tomov and Jack Dongarra",
  title =        "Accelerating the reduction to upper {Hessenberg} form
                 through hybrid {GPU}-based computing",
  type =         "LAPACK Working Note",
  number =       "219",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "24",
  month =        may,
  year =         "2009",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-642.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Lamia Youseff and Keith Seymour and Haihang You and
                 Dmitrii Zagorodnov and Jack Dongarra and Rich Wolski",
  title =        "Paravirtualization effect on single- and multi-threaded
                 memory-intensive linear algebra software",
  journal =      "The Journal of Networks, Software Tools, and Cluster
  volume =       "12",
  number =       "2",
  pages =        "101--122",
  month =        "????",
  year =         "2009",
  DOI =          "",
  ISSN =         "1386-7857",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Emmanuel Agullo and Cedric Augonnet and Jack Dongarra
                 and Hatem Ltaief and Raymond Namyst and Samuel Thibault
                 and Stanimire Tomov",
  title =        "Faster, Cheaper, Better --- a Hybridization
                 Methodology to Develop Linear Algebra Software for
  type =         "LAPACK Working Note",
  number =       "230",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "15",
  month =        sep,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-658. To appear in GPU Computing GEMs, vol.
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "E. Agullo and C. Augonnet and J. Dongarra and M.
                 Faverge and H. Ltaief and S. Thibault and S. Tomov",
  title =        "{$ Q R $} Factorization on a Multicore Node Enhanced
                 with Multiple {GPU} Accelerators",
  type =         "LAPACK Working Note",
  number =       "233",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-XXX, published in Proceedings of IPDPS
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Emmanuel Agullo and Camille Coti and Jack Dongarra and
                 Thomas Herault and Julien Langou",
  title =        "{$ Q R $} Factorization of Tall and Skinny Matrices in
                 a Grid Computing Environment",
  type =         "LAPACK Working Note",
  number =       "224",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "6",
  month =        apr,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-651. Published in the Proceedings of IPDPS
                 2010: 24th IEEE International Parallel and Distributed
                 Processing Symposium Atlanta GA April 2010.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Thara Angskun and Graham Fagg and George Bosilca and
                 Jelena Pje{\v{s}}ivac-Grbovi{\'c} and Jack Dongarra",
  title =        "Self-healing network for scalable fault-tolerant
                 runtime environments",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "26",
  number =       "3",
  pages =        "479--485",
  month =        mar,
  year =         "2010",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Sat Sep 11 13:08:16 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. Bosilca and A. Bouteiller and A. Danalis and T.
                 Herault and P. Lemarinier and J. Dongarra",
  title =        "{DAGuE}: a generic distributed {DAG} engine for high
                 performance computing",
  type =         "LAPACK Working Note",
  number =       "231",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "15",
  month =        sep,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-659.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "G. Bosilca and A. Bouteiller and A. Danalis and M.
                 Faverge and H. Haidar and T. Herault and J. Kurzak and
                 J. Langou and P. Lemarinier and H. Ltaief and P.
                 Luszczek and A. YarKhan and J. Dongarra",
  title =        "Distributed-Memory Task Execution and Dependence
                 Tracking within {DAGuE} and the {DPLASMA Project}",
  type =         "LAPACK Working Note",
  number =       "232",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "15",
  month =        sep,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-660.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aurelien Bouteiller and George Bosilca and Jack
                 Dongarra",
  title =        "Redesigning the message logging model for high
                 performance",
  journal =      j-CCPE,
  volume =       "22",
  number =       "16",
  pages =        "2196--2211",
  month =        nov,
  year =         "2010",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Dec 5 10:08:49 MST 2011",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "27 Jun 2010",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Thomas Brady and Jack Dongarra and Michele Guidolin
                 and Alexey Lastovetsky and Keith Seymour",
  title =        "{SmartGridRPC}: {The} new {RPC} model for high
                 performance {Grid} computing",
  journal =      j-CCPE,
  volume =       "22",
  number =       "18",
  pages =        "2467--2487",
  day =          "25",
  month =        dec,
  year =         "2010",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Dec 5 10:08:51 MST 2011",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "12 Nov 2010",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  key =          "CUDA",
  title =        "Foreword",
  crossref =     "Sanders:2010:CEI",
  pages =        "xiii--xiv",
  year =         "2010",
  bibdate =      "Sun Sep 05 06:40:55 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra and Hans W. Meuer and Horst D. Simon
                 and Erich Strohmaier",
  title =        "Recent trends in high performance computing",
  crossref =     "Bultheel:2010:BNA",
  pages =        "93--107",
  year =         "2010",
  MRclass =      "65Y10 (68M99)",
  MRnumber =     "2604143",
  bibdate =      "Mon Aug 23 18:26:52 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Piotr Luszczek",
  title =        "Reducing the time to tune parallel dense linear
                 algebra routines with partial execution and performance
  type =         "LAPACK Working Note",
  number =       "235",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "8",
  month =        oct,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-661.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Rick Weber and Piotr Luszczek and
                 Stanimire Tomov and Gregory Peterson and Jack
                 Dongarra",
  title =        "From {CUDA} to {OpenCL}: Towards a
                 Performance-portable Solution for Multi-platform {GPU}
  type =         "LAPACK Working Note",
  number =       "228",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "6",
  month =        sep,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-656.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fred G. Gustavson and Jerzy Wa{\'s}niewski and Jack J.
                 Dongarra and Julien Langou",
  title =        "Rectangular full packed format for {Cholesky}'s
                 algorithm: factorization, solution, and inversion",
  journal =      j-TOMS,
  volume =       "37",
  number =       "2",
  pages =        "18:1--18:21",
  month =        apr,
  year =         "2010",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65F05 (65Y15)",
  MRnumber =     "2738225",
  bibdate =      "Wed Apr 21 11:39:57 MDT 2010",
  bibsource =    ";
  abstract =     "We describe a new data format for storing triangular,
                 symmetric, and Hermitian matrices called {\em
                 Rectangular Full Packed Format\/} (RFPF). The standard
                 two-dimensional arrays of Fortran and C (also known as
                 {\em full format\/}) that are used to represent
                 triangular and symmetric matrices waste nearly half of
                 the storage space but provide high performance via the
                 use of Level 3 BLAS. Standard packed format arrays
                 fully utilize storage (array space) but provide low
                 performance as there is no Level 3 packed BLAS. We
                 combine the good features of packed and full storage
                 using RFPF to obtain high performance via using Level 3
                 BLAS as RFPF is a standard full-format representation.
                 Also, RFPF requires exactly the same minimal storage as
                 the packed format. Each LAPACK full and/or packed
                 triangular, symmetric, and Hermitian routine becomes a
                 single new RFPF routine based on eight possible data
                 layouts of RFPF. This new RFPF routine usually consists
                 of two calls to the corresponding LAPACK full-format
                 routine and two calls to Level 3 BLAS routines. This
                 means {\em no\/} new software is required. As examples,
                 we present LAPACK routines for Cholesky factorization,
                 Cholesky solution, and Cholesky inverse computation in
                 RFPF to illustrate this new work and to describe its
                 performance on several commonly used computer
                 platforms. Performance of LAPACK full routines using
                 RFPF versus LAPACK full routines using the standard
                 format for both serial and SMP parallel processing is
                 about the same while using half the storage.
                 Performance gains are roughly one to a factor of 43 for
                 serial and one to a factor of 97 for SMP parallel times
                 faster using vendor LAPACK full routines with RFPF than
                 with using vendor and/or reference packed routines.",
  acknowledgement = ack-nhfb,
  articleno =    "18",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  keywords =     "BLAS; Cholesky factorization and solution; complex
                 Hermitian matrices; LAPACK; linear algebra libraries;
                 novel packed matrix data structures; positive definite
                 matrices; Real symmetric matrices; Rectangular Full
                 Packed Format; recursive algorithms",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  pagecount =    "21",

  author =       "Jakub Kurzak and Rajib Nath and Peng Du and Jack
                 Dongarra",
  title =        "An Implementation of the Tile {$ Q R $} Factorization
                 for a {GPU} and Multiple {CPUs}",
  type =         "LAPACK Working Note",
  number =       "229",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "15",
  month =        sep,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-657. Submitted to PARA'10",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Jakub Kurzak and David A. Bader and J. J. Dongarra",
  title =        "Scientific computing with multicore and accelerators",
  volume =       "10",
  publisher =    pub-CRC,
  address =      pub-CRC:adr,
  pages =        "xxxiii + 480",
  year =         "2010",
  ISBN =         "1-4398-2536-X (hardback)",
  ISBN-13 =      "978-1-4398-2536-5 (hardback)",
  LCCN =         "Q183.9 .S325 2010",
  bibdate =      "Fri Nov 16 06:29:59 MST 2012",
  bibsource =    ";
  series =       "Chapman and Hall/CRC computational science",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  subject =      "Science; Data processing; Engineering; High
                 performance computing; Multiprocessors; MATHEMATICS /
                 General; MATHEMATICS / Advanced; MATHEMATICS / Number

  author =       "Jakub Kurzak and Hatem Ltaief and Jack Dongarra and
                 Rosa M. Badia",
  title =        "Scheduling dense linear algebra operations on
                 multicore processors",
  journal =      j-CCPE,
  volume =       "22",
  number =       "1",
  pages =        "15--44",
  month =        jan,
  year =         "2010",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Dec 5 10:08:40 MST 2011",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "11 Aug 2009",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hatem Ltaief and Jakub Kurzak and Jack Dongarra",
  title =        "Parallel Two-Sided Matrix Reduction to Band Bidiagonal
                 Form on Multicore Architectures",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "21",
  number =       "4",
  pages =        "417--423",
  month =        apr,
  year =         "2010",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu May 13 12:06:56 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hatem Ltaief and Jakub Kurzak and Jack Dongarra and
                 Rosa M. Badia",
  title =        "Scheduling two-sided transformations using tile
                 algorithms on multicore architectures",
  journal =      j-SCI-PROG,
  volume =       "18",
  number =       "1",
  pages =        "35--50",
  month =        "????",
  year =         "2010",
  CODEN =        "SCIPEV",
  DOI =          "",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Wed Sep 1 14:50:29 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Rajib Nath and Stanimire Tomov and Jack Dongarra",
  title =        "An Improved {MAGMA GEMM} for {Fermi GPUs}",
  type =         "LAPACK Working Note",
  number =       "227",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "29",
  month =        jul,
  year =         "2010",
  DOI =          "",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-655.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peter Sloot and Peter Coveney and Jack Dongarra",
  title =        "Preface",
  journal =      j-J-COMPUT-SCI,
  volume =       "1",
  number =       "1",
  pages =        "3--4",
  month =        may,
  year =         "2010",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:53:01 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Stanimire Tomov and Rajib Nath and Jack Dongarra",
  title =        "Accelerating the reduction to upper {Hessenberg},
                 tridiagonal, and bidiagonal forms through hybrid
                 {GPU}-based computing",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "36",
  number =       "12",
  pages =        "645--654",
  month =        dec,
  year =         "2010",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F30 (15A23 65F25 65Y05)",
  MRnumber =     "2762590 (2011i:65067)",
  bibdate =      "Mon Nov 1 10:18:30 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing. Systems \& Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Stanimire Tomov and Rajib Nath and Hatem Ltaief and
                 Jack Dongarra",
  booktitle =    "{2010 IEEE International Symposium on Parallel \&
                 Distributed Processing, Workshops and Phd Forum
  title =        "Dense linear algebra solvers for multicore with {GPU}
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  month =        apr,
  year =         "2010",
  DOI =          "",
  bibdate =      "Thu Nov 7 16:56:45 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Stanimire Tomov and Rajib Nath and Hatem Ltaief and
                 Jack Dongarra",
  title =        "Dense Linear Algebra Solvers for Multicore with {GPU}
  type =         "LAPACK Working Note",
  number =       "225",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "18",
  month =        apr,
  year =         "2010",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-09-649. Published in the Proceedings of IPDPS
                 2010: 24th IEEE International Parallel and Distributed
                 Processing Symposium Atlanta GA April 2010.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Stanimire Tomov and Jack Dongarra and Marc Baboulin",
  title =        "Towards dense linear algebra for hybrid {GPU}
                 accelerated manycore systems",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "36",
  number =       "5--6",
  pages =        "232--240",
  month =        jun,
  year =         "2010",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Thu Sep 2 17:51:12 MDT 2010",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Emmanuel Agullo and Jack Dongarra and Rajib Nath and
                 Stanimire Tomov",
  title =        "A Fully Empirical Autotuned Dense {$ Q R $}
                 Factorization For Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "242",
  institution =  "INRIA",
  address =      "????",
  day =          "9",
  month =        mar,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "INRIA-7526.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Emmanuel Agullo and Camille Coti and Thomas Herault
                 and Julien Langou and Sylvain Peyronnet and Ala
                 Rezmerita and Franck Cappello and Jack Dongarra",
  title =        "{QCG-OMPI}: {MPI} applications on grids",
  journal =      j-FUT-GEN-COMP-SYS,
  volume =       "27",
  number =       "4",
  pages =        "357--369",
  month =        apr,
  year =         "2011",
  CODEN =        "FGSEVI",
  DOI =          "",
  ISSN =         "0167-739X (print), 1872-7115 (electronic)",
  ISSN-L =       "0167-739X",
  bibdate =      "Tue Aug 30 11:43:29 MDT 2011",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Future Generation Computer Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Stanimire Tomov and Jack Dongarra and
                 Vincent Heuveline",
  title =        "A Block-Asynchronous Relaxation Method for Graphics
                 Processing Units",
  type =         "LAPACK Working Note",
  number =       "258",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        dec,
  year =         "2011",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "UT-CS-11-687.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Piotr Luszczek and Jack Dongarra and
                 Vincent Heuveline",
  title =        "{GPU}-Accelerated Asynchronous Error Correction for
                 Mixed Precision Iterative Refinement",
  type =         "LAPACK Working Note",
  number =       "260",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        dec,
  year =         "2011",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "UT-CS-11-690.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Jack Dongarra and Julien Herrmann
                 and Stanimire Tomov",
  title =        "Accelerating linear system solutions using
                 randomization techniques",
  type =         "LAPACK Working Note",
  number =       "246",
  institution =  "INRIA",
  address =      "????",
  day =          "15",
  month =        may,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "INRIA RR-7616.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Dulceneia Becker and Jack Dongarra",
  title =        "A parallel tiled solver for dense symmetric indefinite
                 systems on multicore architectures",
  type =         "LAPACK Working Note",
  number =       "261",
  institution =  inst-INRIA,
  address =      inst-INRIA:adr,
  month =        dec,
  year =         "2011",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "INRIA-7762.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mathieu Faverge and Hatem Ltaief and
                 Piotr Luszczek",
  title =        "Achieving Numerical Accuracy and High Performance
                 using Recursive Tile {$ L U $} Factorization",
  type =         "LAPACK Working Note",
  number =       "259",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        dec,
  year =         "2011",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "UT-CS-11-688.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  title =        "Foreword",
  crossref =     "Hager:2011:IHP",
  pages =        "??--??",
  year =         "2011",
  bibdate =      "Sun Sep 05 06:40:55 2010",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "{Guest Editors}' note: special issue on clusters,
                 clouds and grids for scientific computing",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "21",
  number =       "2",
  pages =        "109--109",
  month =        jun,
  year =         "2011",
  CODEN =        "PPLTEE",
  DOI =          "",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  MRclass =      "Indexed",
  MRnumber =     "2811996",
  bibdate =      "Tue Feb 28 11:32:07 MST 2012",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mathieu Faverge and Thomas Herault
                 and Julien Langou and Yves Robert",
  title =        "Hierarchical {$ Q R $} factorization algorithms for
                 multi-core cluster systems",
  type =         "LAPACK Working Note",
  number =       "257",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        oct,
  year =         "2011",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "UT-CS-11-684.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Pete Beckman and Terry Moore and
                 Patrick Aerts and Giovanni Aloisio and Jean-Claude
                 Andre and David Barkai and Jean-Yves Berthou and
                 Taisuke Boku and Bertrand Braunschweig and Franck
                 Cappello and Barbara Chapman and Xuebin Chi and Alok
                 Choudhary and Sudip Dosanjh and Thom Dunning and Sandro
                 Fiore and Al Geist and Bill Gropp and Robert Harrison
                 and Mark Hereld and Michael Heroux and Adolfy Hoisie
                 and Koh Hotta and Zhong Jin and Yutaka Ishikawa and
                 Fred Johnson and Sanjay Kale and Richard Kenway and
                 David Keyes and Bill Kramer and Jesus Labarta and Alain
                 Lichnewsky and Thomas Lippert and Bob Lucas and Barney
                 Maccabe and Satoshi Matsuoka and Paul Messina and Peter
                 Michielse and Bernd Mohr and Matthias S. Mueller and
                 Wolfgang E. Nagel and Hiroshi Nakashima and Michael E.
                 Papka and Dan Reed and Mitsuhisa Sato and Ed Seidel and
                 John Shalf and David Skinner and Marc Snir and Thomas
                 Sterling and Rick Stevens and Fred Streitz and Bob
                 Sugar and Shinji Sumimoto and William Tang and John
                 Taylor and Rajeev Thakur and Anne Trefethen and Mateo
                 Valero and Aad van der Steen and Jeffrey Vetter and Peg
                 Williams and Robert Wisniewski and Kathy Yelick",
  title =        "The {International Exascale Software Project}
  journal =      j-IJHPCA,
  volume =       "25",
  number =       "1",
  pages =        "3--60",
  month =        feb,
  year =         "2011",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Sep 6 15:14:36 MDT 2011",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  onlinedate =   "January 6, 2011",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Selected papers of the {Workshop on Clusters, Clouds
                 and Grids for Scientific Computing (CCGSC)}",
  journal =      j-IJHPCA,
  volume =       "25",
  number =       "3",
  pages =        "259--260",
  month =        aug,
  year =         "2011",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Sep 6 15:14:38 MDT 2011",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Aurelien Bouteiller and George Bosilca and
                 Thomas Herault and Jack Dongarra",
  title =        "Algorithm-based Fault Tolerance for Dense Matrix
  type =         "LAPACK Working Note",
  number =       "253",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "5",
  month =        aug,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-676.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Piotr Luszczek and Jack Dongarra",
  title =        "High Performance Linear System Solver with Resilience
                 to Multiple Soft Errors",
  type =         "LAPACK Working Note",
  number =       "256",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        oct,
  year =         "2011",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "UT-CS-11-683.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Piotr Luszczek and Stanimire Tomov and
                 Jack Dongarra",
  title =        "Soft Error Resilient {$ Q R $} Factorization for
                 Hybrid System",
  type =         "LAPACK Working Note",
  number =       "252",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "1",
  month =        jul,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-675.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fred G. Gustavson and Jerzy Wa{\'s}niewski and Jack J.
                 Dongarra and Jos{\'e} R. Herrero and Julien Langou",
  title =        "Level-3 {Cholesky} Factorization Routines as Part of
                 Many {Cholesky} Algorithms",
  type =         "LAPACK Working Note",
  number =       "249",
  institution =  "????",
  address =      "????",
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "DTU/IMM-Technical-Report-2011-11, submitted at TOMS.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Hatem Ltaief and Asim YarKhan and
                 Jack Dongarra",
  title =        "Analysis of Dynamically Scheduled Tile Algorithms for
                 Dense Linear Algebra on Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "243",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "10",
  month =        mar,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-666. Submitted at Concurrency and
                 Computation: Practice and Experience.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Hatem Ltaief and Jack Dongarra",
  title =        "Parallel Reduction to Condensed Forms for Symmetric
                 Eigenvalue Problems using Aggregated Fine-Grained and
                 Memory-Aware Kernels",
  type =         "LAPACK Working Note",
  number =       "254",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "5",
  month =        aug,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-677 Aug 5 2011.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Hatem Ltaief and Jack Dongarra",
  title =        "Parallel reduction to condensed forms for symmetric
                 eigenvalue problems using aggregated fine-grained and
                 memory-aware kernels",
  crossref =     "Lathrop:2011:SPI",
  pages =        "8:1--8:11",
  year =         "2011",
  DOI =          "",
  bibdate =      "Fri Dec 16 11:05:47 MST 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  articleno =    "8",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Heike Jagode and Andreas Kn{\"u}pfer and Jack Dongarra
                 and Matthias Jurenz and Matthias S. M{\"u}ller and
                 Wolfgang E. Nagel",
  title =        "Trace-based performance analysis for the petascale
                 simulation code {FLASH}",
  journal =      j-IJHPCA,
  volume =       "25",
  number =       "4",
  pages =        "428--439",
  month =        nov,
  year =         "2011",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  onlinedate =   "December 29, 2010",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Stanimire Tomov and Jack Dongarra",
  title =        "Autotuning {GEMMs} for {Fermi}",
  type =         "LAPACK Working Note",
  number =       "245",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "18",
  month =        apr,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-671. Submitted at SC11 November 12-18, 2011,
                 Seattle, Washington, USA.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hatem Ltaief and Piotr Luszczek and Jack Dongarra",
  title =        "High Performance Bidiagonal Reduction using Tile
                 Algorithms on Homogeneous Multicore Architectures",
  type =         "LAPACK Working Note",
  number =       "247",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "18",
  month =        may,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-673. Submitted at TOMS.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hatem Ltaief and Piotr Luszczek and Jack Dongarra",
  title =        "Profiling High Performance Dense Linear Algebra
                 Algorithms on Multicore Architectures for Power and
                 Energy Efficiency",
  type =         "LAPACK Working Note",
  number =       "251",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "21",
  month =        jun,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-674.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Piotr Luszczek and Hatem Ltaief and Jack Dongarra",
  title =        "Two-Stage Tridiagonal Reduction for Dense Symmetric
                 Matrices using Tile Algorithms on Multicore
                 Architectures",
  type =         "LAPACK Working Note",
  number =       "244",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "18",
  month =        apr,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-670.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Rajib Nath and Stanimire Tomov and Tingxing ``Tim''
                 Dong and Jack Dongarra",
  title =        "Optimizing symmetric dense matrix-vector
                 multiplication on {GPUs}",
  crossref =     "Lathrop:2011:SPI",
  pages =        "6:1--6:10",
  year =         "2011",
  DOI =          "",
  bibdate =      "Fri Dec 16 11:05:47 MST 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  articleno =    "6",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fengguang Song and Stanimire Tomov and Jack Dongarra",
  title =        "Efficient Support for Matrix Computations on
                 Heterogeneous Multi-core and Multi-{GPU}
                 Architectures",
  type =         "LAPACK Working Note",
  number =       "250",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "16",
  month =        jun,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-11-668.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fengguang Song and Hatem Ltaief and Bilel Hadri and
                 Jack Dongarra",
  title =        "Scalable Tile Communication-Avoiding {$ Q R $}
                 Factorization on Multicore Cluster Systems",
  type =         "LAPACK Working Note",
  number =       "241",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  day =          "4",
  month =        mar,
  year =         "2011",
  bibdate =      "Wed Aug 24 12:36:41 MDT 2011",
  bibsource =    "",
  note =         "UT-CS-10-653. Published at SC'10",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jeffrey S. Vetter and Richard Glassbrook and Jack
                 Dongarra and Karsten Schwan and Bruce Loftis and
                 Stephen McNally and Jeremy Meredith and James Rogers
                 and Philip Roth and Kyle Spafford and Sudhakar
                 Yalamanchili",
  title =        "{Keeneland}: Bringing Heterogeneous {GPU} Computing to
                 the Computational Science Community",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "13",
  number =       "5",
  pages =        "90--95",
  month =        sep # "\slash " # oct,
  year =         "2011",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Wed Aug 31 18:09:32 2011",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "David S. Watkins",
  title =        "{Francis}'s Algorithm",
  journal =      j-AMER-MATH-MONTHLY,
  volume =       "118",
  number =       "5",
  pages =        "387--403",
  month =        may,
  year =         "2011",
  CODEN =        "AMMYAE",
  ISSN =         "0002-9890 (print), 1930-0972 (electronic)",
  ISSN-L =       "0002-9890",
  bibdate =      "Thu May 26 16:28:05 2011",
  bibsource =    "",
  URL =          "",
  abstract =     "John Francis's implicitly shifted QR algorithm turned
                 the problem of matrix eigenvalue computation from
                 difficult to routine almost overnight about fifty years
                 ago. It was named one of the top ten algorithms of the
                 twentieth century by Dongarra and Sullivan, and it
                 deserves to be more widely known and understood by the
                 general mathematical community. This article provides
                 an efficient introduction to Francis's algorithm that
                 follows a novel path. Efficiency is gained by omitting
                 the traditional but wholly unnecessary detour through
                 the basic QR algorithm. A brief history of the
                 algorithm is also included. It was not a one-man show;
                 some other important names are Rutishauser, Wilkinson,
                 and Kublanovskaya. Francis was never a specialist in
                 matrix computations. He was employed in the early
                 computer industry, spent some time on the problem of
                 eigenvalue computation and did amazing work, and then
                 moved on to other things. He never looked back, and he
                 remained unaware of the huge impact of his work until
                 many years later.",
  acknowledgement = ack-nhfb,
  fjournal =     "American Mathematical Monthly",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. B. {White III} and J. J. Dongarra",
  title =        "High-performance high-resolution semi-{Lagrangian}
                 tracer transport on a sphere",
  journal =      j-J-COMPUT-PHYS,
  volume =       "230",
  number =       "17",
  pages =        "6778--6799",
  day =          "20",
  month =        jul,
  year =         "2011",
  CODEN =        "JCTPAH",
  DOI =          "",
  ISSN =         "0021-9991 (print), 1090-2716 (electronic)",
  ISSN-L =       "0021-9991",
  bibdate =      "Sat Dec 31 11:59:34 MST 2011",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Computational Physics",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and Aurelien Bouteiller and Anthony
                 Danalis and Thomas Herault and Pierre Lemarinier and
                 Jack Dongarra",
  title =        "{DAGuE}: a generic distributed {DAG} engine for {High
                 Performance Computing}",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "38",
  number =       "1--2",
  pages =        "37--51",
  month =        jan # "\slash " # feb,
  year =         "2012",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Sat Feb 4 15:17:36 MST 2012",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and Aurelien Bouteiller and Anthony
                 Danalis and Thomas Herault and Piotr Luszczek and Jack
                 J. Dongarra",
  title =        "Dense Linear Algebra on Distributed Heterogeneous
                 Hardware with a Symbolic {DAG} Approach",
  type =         "LAPACK Working Note",
  number =       "264",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        jan,
  year =         "2012",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and Aurelien Bouteiller and Elisabeth
                 Brunet and Franck Cappello and Jack Dongarra and Amina
                 Guermouche and Thomas Herault and Yves Robert and
                 Frederic Vivien and Dounia Zaidouni",
  title =        "Unified Model for Assessing Checkpointing Protocols at
                 Extreme-Scale",
  type =         "LAPACK Working Note",
  number =       "269",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        jun,
  year =         "2012",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    "",
  note =         "UT-CS-12-697.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Anthony Danalis and Piotr Luszczek and Gabriel Marin
                 and Jeffrey S. Vetter and Jack Dongarra",
  title =        "{BlackjackBench}: portable hardware characterization",
  journal =      j-SIGMETRICS,
  volume =       "40",
  number =       "2",
  pages =        "74--79",
  month =        sep,
  year =         "2012",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "0163-5999 (print), 1557-9484 (electronic)",
  ISSN-L =       "0163-5999",
  bibdate =      "Fri Nov 9 11:06:40 MST 2012",
  bibsource =    "",
  abstract =     "DARPA's AACE project aimed to develop Architecture
                 Aware Compiler Environments that automatically
                 characterizes the hardware and optimizes the
                 application codes accordingly. We present the
                 BlackjackBench --- a suite of portable benchmarks that
                 automate system characterization, plus statistical
                 analysis techniques for interpreting the results. The
                 BlackjackBench discovers the effective sizes and speeds
                 of the hardware environment rather than the often
                 unattainable peak values. We aim at hardware
                 characteristics that can be observed by running
                 standard C codes. We characterize the memory hierarchy,
                 including cache sharing and NUMA characteristics of the
                 system, properties of the processing cores affecting
                 instruction execution speed, and the length of the OS
                 scheduler time slot. We show how they all could
                 potentially interfere with each other and how
                 established classification and statistical analysis
                 techniques reduce experimental noise and aid automatic
                 interpretation of results.",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGMETRICS Performance Evaluation Review",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra",
  editor =       "????",
  booktitle =    "{ATIP '12: Proceedings of the ATIP\slash A*CRC
                 Workshop on Accelerator Technologies for
                 High-Performance Computing: Does Asia Lead the Way?}",
  title =        "Algorithmic and software challenges when moving
                 towards exascale",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "??--??",
  year =         "2012",
  ISBN =         "1-4503-1644-1",
  ISBN-13 =      "978-1-4503-1644-6",
  LCCN =         "????",
  bibdate =      "Wed Nov 14 10:44:01 2012",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  articleno =    "17",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "Publisher has only PDF file of 35 lecture slides.",

  author =       "J. J. Dongarra and A. J. van der Steen",
  title =        "High-performance computing systems: Status and
                 outlook",
  journal =      j-ACTA-NUMERICA,
  volume =       "21",
  pages =        "379--474",
  year =         "2012",
  CODEN =        "ANUMFU",
  DOI =          "",
  ISSN =         "0962-4929 (print), 1474-0508 (electronic)",
  ISSN-L =       "0962-4929",
  MRclass =      "65Y05",
  MRnumber =     "2916384",
  bibdate =      "Mon Nov 5 18:59:17 MST 2012",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ajournal =     "Acta Numer.",
  fjournal =     "Acta Numerica",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and James Demmel and Michael Heroux and
                 Jakub Kurzak",
  title =        "Linear Algebra Libraries for High-Performance
                 Computing: Scientific Computing with Multicore and
                 Accelerators",
  crossref =     "Hollingsworth:2012:SPI",
  howpublished = "Supercomputer '2012 conference tutorial",
  day =          "10--16",
  month =        nov,
  year =         "2012",
  bibdate =      "Tue Nov 20 18:23:12 2012",
  bibsource =    "",
  note =         "PDF with 76 lecture slides.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Thomas Herault and Yves Robert",
  title =        "Revisiting the double checkpointing algorithm",
  type =         "LAPACK Working Note",
  number =       "274",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        dec,
  year =         "2012",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    "",
  note =         "UT-CS-13-705.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Aurelien Bouteiller and George Bosilca and
                 Thomas Herault and Jack Dongarra",
  title =        "Algorithm-based fault tolerance for dense matrix
                 factorizations",
  journal =      j-SIGPLAN,
  volume =       "47",
  number =       "8",
  pages =        "225--234",
  month =        aug,
  year =         "2012",
  CODEN =        "SINODQ",
  DOI =          "",
  ISSN =         "0362-1340 (print), 1523-2867 (print), 1558-1160
                 (electronic)",
  ISSN-L =       "0362-1340",
  bibdate =      "Wed Sep 12 12:11:57 MDT 2012",
  bibsource =    "",
  note =         "PPOPP '12 conference proceedings.",
  abstract =     "Dense matrix factorizations, such as LU, Cholesky and
                 QR, are widely used for scientific applications that
                 require solving systems of linear equations,
                 eigenvalues and linear least squares problems. Such
                 computations are normally carried out on
                 supercomputers, whose ever-growing scale induces a fast
                 decline of the Mean Time To Failure (MTTF). This paper
                 proposes a new hybrid approach, based on
                 Algorithm-Based Fault Tolerance (ABFT), to help matrix
                 factorizations algorithms survive fail-stop failures.
                 We consider extreme conditions, such as the absence of
                 any reliable component and the possibility of loosing
                 both data and checksum from a single failure. We will
                 present a generic solution for protecting the right
                 factor, where the updates are applied, of all above
                 mentioned factorizations. For the left factor, where
                 the panel has been applied, we propose a scalable
                 checkpointing algorithm. This algorithm features high
                 degree of checkpointing parallelism and cooperatively
                 utilizes the checksum storage leftover from the right
                 factor protection. The fault-tolerant algorithms
                 derived from this hybrid solution is applicable to a
                 wide range of dense matrix factorizations, with minor
                 modifications. Theoretical analysis shows that the
                 fault tolerance overhead sharply decreases with the
                 scaling in the number of computing units and the
                 problem size. Experimental results of LU and QR
                 factorization on the Kraken (Cray XT5) supercomputer
                 validate the theoretical evaluation and confirm
                 negligible overhead, with- and without-errors.",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGPLAN Notices",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Rick Weber and Piotr Luszczek and
                 Stanimire Tomov and Gregory Peterson and Jack
                 Dongarra",
  title =        "From {CUDA} to {OpenCL}: Towards a
                 performance-portable solution for multi-platform {GPU}
                 programming",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "38",
  number =       "8",
  pages =        "391--407",
  month =        aug,
  year =         "2012",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Wed Jun 20 17:04:05 MDT 2012",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Stanimire Tomov and Jack Dongarra",
  title =        "Providing {GPU} Capability to {$ L U $} and {$ Q R $}
                 within the {ScaLAPACK} Framework",
  type =         "LAPACK Working Note",
  number =       "272",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        sep,
  year =         "2012",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    "",
  note =         "UT-CS-12-699.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Hatem Ltaief and Asim YarKhan and
                 Jack Dongarra",
  title =        "Analysis of dynamically scheduled tile algorithms for
                 dense linear algebra on multicore architectures",
  journal =      j-CCPE,
  volume =       "24",
  number =       "3",
  pages =        "305--321",
  day =          "10",
  month =        mar,
  year =         "2012",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Wed Apr 4 09:18:01 MDT 2012",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "22 Aug 2011",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Hatem Ltaief and Jack Dongarra",
  title =        "Toward a High Performance Tile Divide and Conquer
                 Algorithm for the Dense Symmetric Eigenvalue Problem",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "34",
  number =       "6",
  pages =        "C249--C274",
  month =        "????",
  year =         "2012",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F15 (15A18 65Y05 65Y20 68W10)",
  MRnumber =     "3029833",
  MRreviewer =   "Aaron Melman",
  bibdate =      "Fri Jul 19 07:43:33 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  onlinedate =   "January 2012",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Yulu Jia and Piotr Luszczek and Jack Dongarra",
  editor =       "????",
  booktitle =    "{ATIP '12: Proceedings of the ATIP\slash A*CRC
                 Workshop on Accelerator Technologies for
                 High-Performance Computing: Does Asia Lead the Way?}",
  title =        "Hybrid {$ L U $} factorization on multi-{GPU}
                 multi-core heterogeneous platforms",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "??--??",
  year =         "2012",
  ISBN =         "1-4503-1644-1",
  ISBN-13 =      "978-1-4503-1644-6",
  LCCN =         "????",
  bibdate =      "Wed Nov 14 10:44:01 2012",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  articleno =    "34",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "Publisher has only 1-page poster PDF file.",

  author =       "Jakub Kurzak and Stanimire Tomov and Jack Dongarra",
  title =        "Autotuning {GEMM} Kernels for the {Fermi GPU}",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "23",
  number =       "11",
  pages =        "2045--2057",
  month =        nov,
  year =         "2012",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Mon Oct 22 08:15:38 2012",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Piotr Luszczek and Mathieu Faverge
                 and Jack Dongarra",
  title =        "{$ L U $} Factorization with Partial Pivoting for a
                 Multi-{CPU}, Multi-{GPU} Shared Memory System",
  type =         "LAPACK Working Note",
  number =       "266",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        apr,
  year =         "2012",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Piotr Luszczek and Stanimire Tomov
                 and Jack Dongarra",
  title =        "Preliminary Results of Autotuning {GEMM} Kernels for
                 the {NVIDIA Kepler Architecture GeForce GTX 680}",
  type =         "LAPACK Working Note",
  number =       "267",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        apr,
  year =         "2012",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Horst Simon and Jack Dongarra and Hemant Shukla",
  title =        "Introduction to the {Special Issue}",
  journal =      j-IJHPCA,
  volume =       "26",
  number =       "4",
  pages =        "335--336",
  month =        nov,
  year =         "2012",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Thu Nov 8 11:31:16 MST 2012",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Christof V{\"o}mel and Stanimire Tomov and Jack
                 Dongarra",
  title =        "Divide and Conquer on Hybrid {GPU}-Accelerated
                 Multicore Systems",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "34",
  number =       "2",
  pages =        "C70--C82",
  month =        "????",
  year =         "2012",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F15 (65Y10)",
  MRnumber =     "2914328",
  MRreviewer =   "Thomas K. Huckle",
  bibdate =      "Tue Oct 30 14:48:54 MDT 2012",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  onlinedate =   "January 2012",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Anonymous",
  title =        "A Conversation with {ISC Fellow Jack Dongarra}",
  journal =      j-SCI-COMPUT,
  day =          "10",
  month =        apr,
  year =         "2013",
  CODEN =        "SCHRCU",
  ISSN =         "1930-5753 (print), 1930-6156 (electronic)",
  ISSN-L =       "1930-5753",
  bibdate =      "Wed Apr 17 08:42:31 2013",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Stanimire Tomov and Jack Dongarra and
                 Vincent Heuveline",
  title =        "A block-asynchronous relaxation method for graphics
                 processing units",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "73",
  number =       "12",
  pages =        "1613--1626",
  month =        dec,
  year =         "2013",
  CODEN =        "JPDCER",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Fri Nov 29 09:55:28 MST 2013",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Guillaume Aupy and Anne Benoit and Thomas H{\'e}rault
                 and Yves Robert and Fr{\'e}d{\'e}ric Vivien and Dounia
                 Zaidouni",
  title =        "On the Combination of Silent Error Detection and
                 Checkpointing",
  type =         "LAPACK Working Note",
  number =       "278",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jun,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    "",
  note =         "UT-CS-13-710.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Guillaume Aupy and Mathieu Faverge and Yves Robert and
                 Jakub Kurzak and Piotr Luszczek and Jack Dongarra",
  title =        "Implementing a systolic algorithm for {$ Q R $}
                 factorization on multicore clusters with {PaRSEC}",
  type =         "LAPACK Working Note",
  number =       "277",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        may,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    "",
  note =         "UT-CS-13-709.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Guillaume Aupy and Anne Benoit and Thomas Herault and
                 Yves Robert and Jack Dongarra",
  title =        "Optimal Checkpointing Period: Time vs. Energy",
  type =         "LAPACK Working Note",
  number =       "281",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    "",
  note =         "UT-EECS-13-718.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Jack Dongarra and Julien Herrmann
                 and Stanimire Tomov",
  title =        "Accelerating Linear System Solutions Using
                 Randomization Techniques",
  journal =      j-TOMS,
  volume =       "39",
  number =       "2",
  pages =        "8:1--8:13",
  month =        feb,
  year =         "2013",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65F05 (65Y05)",
  MRnumber =     "3031627",
  MRreviewer =   "Pierluigi Maponi",
  bibdate =      "Wed Feb 20 16:46:13 MST 2013",
  bibsource =    "",
  abstract =     "We illustrate how linear algebra calculations can be
                 enhanced by statistical techniques in the case of a
                 square linear system {$ A x = b $}. We study a random
                 transformation of {$A$} that enables us to avoid
                 pivoting and then to reduce the amount of
                 communication. Numerical experiments show that this
                 randomization can be performed at a very affordable
                 computational price while providing us with a
                 satisfying accuracy when compared to partial pivoting.
                 This random transformation called Partial Random
                 Butterfly Transformation (PRBT) is optimized in terms
                 of data storage and flops count. We propose a solver
                 where PRBT and the LU factorization with no pivoting
                 take advantage of the current hybrid multicore\slash
                 GPU machines and we compare its Gflop/s performance
                 with a solver implemented in a current parallel
                 library.",
  acknowledgement = ack-nhfb,
  articleno =    "8",
  fjournal =     "ACM Transactions on Mathematical Software (TOMS)",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Wesley Bland and Aurelien Bouteiller and Thomas
                 Herault and George Bosilca and Jack Dongarra",
  title =        "Post-failure recovery of {MPI} communication
                 capability: Design and rationale",
  journal =      j-IJHPCA,
  volume =       "27",
  number =       "3",
  pages =        "244--254",
  month =        aug,
  year =         "2013",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Mar 14 15:39:55 MDT 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  onlinedate =   "June 3, 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Wesley Bland and Peng Du and Aurelien Bouteiller and
                 Thomas Herault and George Bosilca and Jack J.
                 Dongarra",
  title =        "Special Issue Papers: Extending the scope of the
                 {Checkpoint-on-Failure} protocol for forward recovery
                 in standard {MPI}",
  journal =      j-CCPE,
  volume =       "25",
  number =       "17",
  pages =        "2381--2393",
  day =          "10",
  month =        dec,
  year =         "2013",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Dec 3 10:37:48 MST 2013",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "23 Jul 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and Aurelien Bouteiller and Anthony
                 Danalis and Mathieu Faverge and Thomas Herault and Jack
                 J. Dongarra",
  title =        "{PaRSEC}: Exploiting Heterogeneity to Enhance
                 Scalability",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "15",
  number =       "6",
  pages =        "36--45",
  month =        nov # "\slash " # dec,
  year =         "2013",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366x (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Sat Apr 19 10:17:39 2014",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aurelien Bouteiller and Thomas Herault and George
                 Bosilca and Jack J. Dongarra",
  title =        "Correlated set coordination in fault tolerant message
                 logging protocols for many-core clusters",
  journal =      j-CCPE,
  volume =       "25",
  number =       "4",
  pages =        "572--585",
  month =        "????",
  year =         "2013",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Thu Mar 7 08:39:04 MST 2013",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Prac\-tice and
                 Experience",
  journal-URL =  "",
  onlinedate =   "11 Jul 2012",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Chongxiao Cao and Jack Dongarra and Peng Du and Mark
                 Gates and Piotr Luszczek and Stanimire Tomov",
  title =        "{clMAGMA}: High Performance Dense Linear Algebra with
                 {OpenCL}",
  type =         "LAPACK Working Note",
  number =       "275",
  institution =  inst-CS-U-Tenn,
  address =      inst-CS-U-Tenn:adr,
  month =        mar,
  year =         "2013",
  bibdate =      "Sun May 5 11:20:19 2013",
  bibsource =    ";
  note =         "UT-CS-13-706.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Simplice Donfack and Jack Dongarra and Mathieu Faverge
                 and Mark Gates and Jakub Kurzak and Piotr Luszczek and
                 Ichitaro Yamazaki",
  title =        "On Algorithmic Variants of Parallel {Gaussian}
                 Elimination: Comparison of Implementations in Terms of
                 Performance and Numerical Properties",
  type =         "LAPACK Working Note",
  number =       "280",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jul,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    ";
  note =         "UT-CS-13-715",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "{Guest Editors}' Note: Special Issue on Clusters,
                 Clouds, and Data for Scientific Computing",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "23",
  number =       "2",
  pages =        "1302001, 1",
  month =        jun,
  year =         "2013",
  CODEN =        "PPLTEE",
  DOI =          "",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  ISSN-L =       "0129-6264",
  MRclass =      "Indexed",
  MRnumber =     "3080369",
  bibdate =      "Sat Mar 15 08:51:02 MDT 2014",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mathieu Faverge and Thomas
                 H{\'e}rault and Mathias Jacquelin and Julien Langou and
                 Yves Robert",
  title =        "Hierarchical {QR} factorization algorithms for
                 multi-core clusters",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "39",
  number =       "4--5",
  pages =        "212--232",
  month =        apr # "\slash " # may,
  year =         "2013",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F25 (65Y05)",
  MRnumber =     "3053976",
  bibdate =      "Thu Apr 18 13:00:52 MDT 2013",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing. Systems \& Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Introduction for {August} Special Issue {CCDSC}",
  journal =      j-IJHPCA,
  volume =       "27",
  number =       "3",
  pages =        "231--231",
  month =        aug,
  year =         "2013",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Mar 14 15:39:55 MDT 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Peng Du and Piotr Luszczek and Stan Tomov and Jack
                 Dongarra",
  title =        "Soft error resilient {$ Q R $} factorization for
                 hybrid system with {GPGPU}",
  journal =      j-J-COMPUT-SCI,
  volume =       "4",
  number =       "6",
  pages =        "457--464",
  month =        nov,
  year =         "2013",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:53:30 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Mathieu Faverge and Julien Herrmann and Julien Langou
                 and Bradley Lowery and Yves Robert and Jack Dongarra",
  title =        "Designing {$ L U $--$ Q R $} hybrid solvers for
                 performance and stability",
  type =         "LAPACK Working Note",
  number =       "282",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    ";
  note =         "UT-EECS-13-719.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fred G. Gustavson and Jerzy Wa{\'s}niewski and Jack J.
                 Dongarra and Jos{\'e} R. Herrero and Julien Langou",
  title =        "Level-3 {Cholesky} Factorization Routines Improve
                 Performance of Many {Cholesky} Algorithms",
  journal =      j-TOMS,
  volume =       "39",
  number =       "2",
  pages =        "9:1--9:10",
  month =        feb,
  year =         "2013",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65F05 (65Y15)",
  MRnumber =     "3031628",
  bibdate =      "Wed Feb 20 16:46:13 MST 2013",
  bibsource =    ";
  abstract =     "Four routines called DPOTF3i, $ i = a, b, c, d $, are
                 presented. DPOTF3i are a novel type of level-3 BLAS for
                 use by BPF (Blocked Packed Format) Cholesky
                 factorization and LAPACK routine DPOTRF. Performance of
                 routines DPOTF3i are still increasing when the
                 performance of Level-2 routine DPOTF2 of LAPACK starts
                 decreasing. This is our main result and it implies, due
                 to the use of larger block size $ n_b $, that DGEMM,
                 DSYRK, and DTRSM performance also increases! The four
                 DPOTF3i routines use simple register blocking.
                 Different platforms have different numbers of
                 registers. Thus, our four routines have different
                 register blocking sizes. BPF is introduced. LAPACK
                 routines for POTRF and PPTRF using BPF instead of full
                 and packed format are shown to be trivial modifications
                 of LAPACK POTRF source codes. We call these codes
                 BPTRF. There are two variants of BPF: lower and upper.
                 Upper BPF is ``identical'' to Square Block Packed
                 Format (SBPF). ``LAPACK'' implementations on multicore
                 processors use SBPF. Lower BPF is less efficient than
                 upper BPF. Vector inplace transposition converts lower
                 BPF to upper BPF very efficiently. Corroborating
                 performance results for DPOTF3i versus DPOTF2 on a
                 variety of common platforms are given for $ n \approx
                 n_b $ as well as results for large $n$ comparing DBPTRF
                 versus DPOTRF.",
  acknowledgement = ack-nhfb,
  articleno =    "9",
  fjournal =     "ACM Transactions on Mathematical Software (TOMS)",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Piotr Luszczek and Jakub Kurzak and
                 Jack Dongarra",
  title =        "An Improved Parallel Singular Value Algorithm and Its
                 Implementation for Multicore Hardware",
  type =         "LAPACK Working Note",
  number =       "283",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        oct,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    ";
  note =         "UT-EECS-13-720.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Yulu Jia and Piotr Luszczek and Jack Dongarra",
  title =        "Transient Error Resilient {Hessenberg} Reduction on
                 {GPU}-based Hybrid Architectures",
  type =         "LAPACK Working Note",
  number =       "279",
  institution =  inst-UTK-CS,
  address =      inst-UTK-CS:adr,
  month =        jun,
  year =         "2013",
  bibdate =      "Sat Mar 15 07:08:58 2014",
  bibsource =    ";
  note =         "UT-CS-13-712.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Piotr Luszczek and Mathieu Faverge
                 and Jack Dongarra",
  title =        "{$ L U $} Factorization with Partial Pivoting for a
                 Multicore System with Accelerators",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "24",
  number =       "8",
  pages =        "1613--1621",
  month =        aug,
  year =         "2013",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Mon Aug 12 11:15:20 2013",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Yinan Li and Asim YarKhan and Jack Dongarra and Keith
                 Seymour and Aur{\`e}lie Hurault",
  title =        "Enabling workflows in {GridSolve}: request sequencing
                 and service trading",
  journal =      j-J-SUPERCOMPUTING,
  volume =       "64",
  number =       "3",
  pages =        "1133--1152",
  month =        jun,
  year =         "2013",
  CODEN =        "JOSUED",
  DOI =          "",
  ISSN =         "0920-8542 (print), 1573-0484 (electronic)",
  ISSN-L =       "0920-8542",
  bibdate =      "Sat Feb 8 11:30:45 MST 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "The Journal of Supercomputing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hatem Ltaief and Piotr Luszczek and Jack Dongarra",
  title =        "High-performance bidiagonal reduction using tile
                 algorithms on homogeneous multicore architectures",
  journal =      j-TOMS,
  volume =       "39",
  number =       "3",
  pages =        "16:1--16:22",
  month =        apr,
  year =         "2013",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65F15 (65Y05)",
  MRnumber =     "3094972",
  bibdate =      "Tue Apr 30 18:50:55 MDT 2013",
  bibsource =    ";
  abstract =     "This article presents a new high-performance
                 bidiagonal reduction (BRD) for homogeneous multicore
                 architectures. This article is an extension of the
                 high-performance tridiagonal reduction implemented by
                 the same authors [Luszczek et al., IPDPS 2011] to the
                 BRD case. The BRD is the first step toward computing
                 the singular value decomposition of a matrix, which is
                 one of the most important algorithms in numerical
                 linear algebra due to its broad impact in computational
                 science. The high performance of the BRD described in
                 this article comes from the combination of four
                 important features: (1) tile algorithms with tile data
                 layout, which provide an efficient data representation
                 in main memory; (2) a two-stage reduction approach that
                 allows to cast most of the computation during the first
                 stage (reduction to band form) into calls to Level 3
                 BLAS and reduces the memory traffic during the second
                 stage (reduction from band to bidiagonal form) by using
                 high-performance kernels optimized for cache reuse; (3)
                 a data dependence translation layer that maps the
                 general algorithm with column-major data layout into
                 the tile data layout; and (4) a dynamic runtime system
                 that efficiently schedules the newly implemented
                 kernels across the processing units and ensures that
                 the data dependencies are not violated. A detailed
                 analysis is provided to understand the critical impact
                 of the tile size on the total execution time, which
                 also corresponds to the matrix bandwidth size after the
                 reduction of the first stage. The performance results
                 show a significant improvement over currently
                 established alternatives. The new high-performance BRD
                 achieves up to a 30-fold speedup on a 16-core Intel
                 Xeon machine with a 12000$ \times $ 12000 matrix size
                 against the state-of-the-art open source and commercial
                 numerical software packages, namely LAPACK, compiled
                 with optimized and multithreaded BLAS from MKL as well
                 as Intel MKL version 10.2.",
  acknowledgement = ack-nhfb,
  articleno =    "16",
  fjournal =     "ACM Transactions on Mathematical Software (TOMS)",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Teng Ma and George Bosilca and Aurelien Bouteiller and
                 Jack J. Dongarra",
  title =        "Kernel-assisted and topology-aware {MPI} collective
                 communications on multicore/many-core platforms",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "73",
  number =       "7",
  pages =        "1000--1010",
  month =        jul,
  year =         "2013",
  CODEN =        "JPDCER",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Mon Aug 26 16:44:35 MDT 2013",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Dulceneia Becker and George Bosilca
                 and Anthony Danalis and Jack Dongarra",
  title =        "An efficient distributed randomized algorithm for
                 solving large dense symmetric indefinite linear
                 systems",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "40",
  number =       "7",
  pages =        "213--223",
  month =        jul,
  year =         "2014",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F05 (65Y05)",
  MRnumber =     "3225341",
  bibdate =      "Sat Aug 16 11:23:28 MDT 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing. Systems \& Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Grey Ballard and Dulceneia Becker and James Demmel and
                 Jack Dongarra and Alex Druinsky and Inon Peled and Oded
                 Schwartz and Sivan Toledo and Ichitaro Yamazaki",
  title =        "Communication-Avoiding Symmetric-Indefinite
                 Factorization",
  journal =      j-SIAM-J-MAT-ANA-APPL,
  volume =       "35",
  number =       "4",
  pages =        "1364--1406",
  month =        "????",
  year =         "2014",
  CODEN =        "SJMAEL",
  DOI =          "",
  ISSN =         "0895-4798 (print), 1095-7162 (electronic)",
  ISSN-L =       "0895-4798",
  MRclass =      "65F05 (15A23 65Y20)",
  MRnumber =     "3277218",
  bibdate =      "Thu Feb 12 08:43:50 MST 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Matrix Analysis and Applications",
  journal-URL =  "",
  onlinedate =   "January 2014",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and Aur{\'e}lien Bouteiller and
                 Elisabeth Brunet and Franck Cappello and Jack Dongarra
                 and Amina Guermouche and Thomas Herault and Yves Robert
                 and Fr{\'e}d{\'e}ric Vivien and Dounia Zaidouni",
  title =        "Unified model for assessing checkpointing protocols at
                 extreme-scale",
  journal =      j-CCPE,
  volume =       "26",
  number =       "17",
  pages =        "2772--2791",
  day =          "10",
  month =        dec,
  year =         "2014",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Wed Feb 11 22:34:11 MST 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "4 Nov 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Anthony Danalis and Piotr Luszczek and Gabriel Marin
                 and Jeffrey S. Vetter and Jack Dongarra",
  title =        "{BlackjackBench}: Portable Hardware Characterization
                 with Automated Results' Analysis",
  journal =      j-COMP-J,
  volume =       "57",
  number =       "7",
  pages =        "1002--1016",
  month =        jul,
  year =         "2014",
  CODEN =        "CMPJA6",
  DOI =          "",
  ISSN =         "0010-4620 (print), 1460-2067 (electronic)",
  ISSN-L =       "0010-4620",
  bibdate =      "Fri Jun 20 08:41:22 MDT 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computer Journal",
  journal-URL =  "",
  onlinedate =   "June 28, 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mathieu Faverge and Hatem Ltaief and
                 Piotr Luszczek",
  title =        "Achieving numerical accuracy and high performance
                 using recursive tile {$ L U $} factorization with
                 partial pivoting",
  journal =      j-CCPE,
  volume =       "26",
  number =       "7",
  pages =        "1408--1431",
  month =        may,
  year =         "2014",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Fri May 30 08:55:40 MDT 2014",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "18 Sep 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mark Gates and Azzam Haidar and
                 Jakub Kurzak and Piotr Luszczek and Stanimire Tomov and
                 Ichitaro Yamazaki",
  booktitle =    "Numerical Computations with {GPUs}",
  title =        "Accelerating Numerical Dense Linear Algebra
                 Calculations with {GPUs}",
  publisher =    "Springer International Publishing",
  address =      "Cham, Switzerland",
  pages =        "3--28",
  year =         "2014",
  DOI =          "",
  bibdate =      "Thu Nov 7 16:48:33 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Azzam Haidar and Jakub Kurzak and
                 Piotr Luszczek and Stanimire Tomov and Asim YarKhan",
  title =        "Model-Driven One-Sided Factorizations on Multicore
                 Accelerated Systems",
  journal =      j-SUPERFRI,
  volume =       "1",
  number =       "1",
  pages =        "85--115",
  month =        "????",
  year =         "2014",
  CODEN =        "????",
  ISSN =         "2409-6008 (print), 2313-8734 (electronic)",
  bibdate =      "Sat Nov 11 07:15:27 MST 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputing Frontiers and Innovations",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mark Gates and Azzam Haidar and Yulu
                 Jia and Khairul Kabir and Piotr Luszczek and Stanimire
                 Tomov",
  booktitle =    "Parallel processing and applied mathematics. {Part
                 I}",
  title =        "Portable {HPC} programming on {Intel}
                 many-integrated-core hardware with {MAGMA} port to
                 {Xeon Phi}",
  volume =       "8384",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "571--581",
  year =         "2014",
  DOI =          "",
  MRclass =      "65Y10",
  MRnumber =     "3218407",
  bibdate =      "Tue Apr 4 18:55:47 2017",
  bibsource =    "",
  series =       j-LECT-NOTES-COMP-SCI,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Stanimire Tomov and Jack Dongarra and
                 Raffaele Solc{\`a} and Thomas Schulthess",
  title =        "A novel hybrid {CPU-GPU} generalized eigensolver for
                 electronic structure calculations based on fine-grained
                 memory aware tasks",
  journal =      j-IJHPCA,
  volume =       "28",
  number =       "2",
  pages =        "196--209",
  month =        may,
  year =         "2014",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Sep 9 12:27:17 MDT 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  onlinedate =   "August 30, 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Piotr Luszczek and Jakub Kurzak and Jack Dongarra",
  title =        "Looking back at dense linear algebra software",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "74",
  number =       "7",
  pages =        "2548--2560",
  month =        jul,
  year =         "2014",
  CODEN =        "JPDCER",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Mon May 26 16:27:22 MDT 2014",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Jakub Kurzak and Piotr Luszczek
                 and Jack Dongarra",
  title =        "Design and Implementation of a Large Scale Tree-Based
                 {QR} Decomposition Using a {$3$D} Virtual Systolic
                 Array and a Lightweight Runtime",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "24",
  number =       "4",
  pages =        "1442004, 23",
  month =        dec,
  year =         "2014",
  CODEN =        "PPLTEE",
  DOI =          "",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  ISSN-L =       "0129-6264",
  MRclass =      "Indexed",
  MRnumber =     "3294500",
  bibdate =      "Fri Feb 13 13:51:16 MST 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Tingxing Dong and Raffaele
                 Solc{\`a} and Stanimire Tomov and Jack Dongarra and
                 Thomas Schulthess",
  title =        "Tridiagonalization of a dense symmetric matrix on
                 multiple {GPUs} and its application to symmetric
                 eigenvalue problems",
  journal =      j-CCPE,
  volume =       "26",
  number =       "16",
  pages =        "2652--2666",
  month =        nov,
  year =         "2014",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Wed Feb 11 22:34:10 MST 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "3 Oct 2013",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Stanimire Tomov and Piotr Luszczek
                 and William Sawyer and Jack Dongarra",
  title =        "Acceleration of {GPU}-based {Krylov} solvers via data
                 transfer reduction",
  journal =      j-IJHPCA,
  volume =       "29",
  number =       "3",
  pages =        "366--383",
  month =        aug,
  year =         "2015",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Apr 4 14:51:30 MDT 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Blake Haugen and Jakub Kurzak and
                 Piotr Luszczek and Jack Dongarra",
  title =        "Experiences in autotuning matrix multiplication for
                 energy minimization on {GPUs}",
  journal =      j-CCPE,
  volume =       "27",
  number =       "17",
  pages =        "5096--5113",
  day =          "10",
  month =        dec,
  year =         "2015",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Feb 9 06:13:20 MST 2016",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "20 May 2015",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Aurelien Bouteiller and Thomas Herault and George
                 Bosilca and Peng Du and Jack Dongarra",
  title =        "Algorithm-Based Fault Tolerance for Dense Matrix
                 Factorizations, Multiple Failures and Accuracy",
  journal =      j-TOPC,
  volume =       "1",
  number =       "2",
  pages =        "10:1--10:??",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-4949 (print), 2329-4957 (electronic)",
  ISSN-L =       "2329-4949",
  bibdate =      "Wed Feb 18 16:46:00 MST 2015",
  bibsource =    ";
  abstract =     "Dense matrix factorizations, such as LU, Cholesky and
                 QR, are widely used for scientific applications that
                 require solving systems of linear equations,
                 eigenvalues and linear least squares problems. Such
                 computations are normally carried out on
                 supercomputers, whose ever-growing scale induces a fast
                 decline of the Mean Time To Failure (MTTF). This
                 article proposes a new hybrid approach, based on
                 Algorithm-Based Fault Tolerance (ABFT), to help matrix
                 factorizations algorithms survive fail-stop failures.
                 We consider extreme conditions, such as the absence of
                 any reliable node and the possibility of losing both
                 data and checksum from a single failure. We will
                 present a generic solution for protecting the right
                 factor, where the updates are applied, of all above
                 mentioned factorizations. For the left factor, where
                 the panel has been applied, we propose a scalable
                 checkpointing algorithm. This algorithm features high
                 degree of checkpointing parallelism and cooperatively
                 utilizes the checksum storage leftover from the right
                 factor protection. The fault-tolerant algorithms
                 derived from this hybrid solution are applicable to a
                 wide range of dense matrix factorizations, with minor
                 modifications. Theoretical analysis shows that the
                 fault tolerance overhead decreases inversely to the
                 scaling in the number of computing units and the
                 problem size. Experimental results of LU and QR
                 factorization on the Kraken (Cray XT5) supercomputer
                 validate the theoretical evaluation and confirm
                 negligible overhead, with- and without-errors.
                 Applicability to tolerate multiple failures and
                 accuracy after multiple recovery is also considered.",
  acknowledgement = ack-nhfb,
  articleno =    "10",
  fjournal =     "ACM Transactions on Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Simplice Donfack and Jack Dongarra and Mathieu Faverge
                 and Mark Gates and Jakub Kurzak and Piotr Luszczek and
                 Ichitaro Yamazaki",
  title =        "A survey of recent developments in parallel
                 implementations of {Gaussian} elimination",
  journal =      j-CCPE,
  volume =       "27",
  number =       "5",
  pages =        "1292--1309",
  day =          "10",
  month =        apr,
  year =         "2015",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Sat Jul 25 19:54:07 MDT 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "2 Jun 2014",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Tingxing Tim Dong and Stanimire Z. Tomov and Piotr R.
                 Luszczek and Jack J. Dongarra",
  title =        "A Framework for Batched and {GPU}-Resident
                 Factorization Algorithms Applied to Block {Householder}
  type =         "Technical Report",
  institution =  inst-ORNL,
  address =      inst-ORNL:adr,
  day =          "1",
  month =        jan,
  year =         "2015",
  bibdate =      "Fri Dec 21 07:37:30 2018",
  bibsource =    ";
  URL =          "",
  abstract =     "As modern hardware keeps evolving, an increasingly
                 effective approach to developing energy efficient and
                 high-performance solvers is to design them to work on
                 many small size and independent problems. Many
                 applications already need this functionality,
                 especially for GPUs, which are currently known to be
                 about four to five times more energy efficient than
                 multicore CPUs. We describe the development of
                 one-sided factorizations that work for a set of small
                 dense matrices in parallel, and we illustrate our
                 techniques on the QR factorization based on Householder
                 transformations. We refer to this mode of operation as
                 a batched factorization. Our approach is based on
                 representing the algorithms as a sequence of batched
                 BLAS routines for GPU-only execution. This is in
                 contrast to the hybrid CPU-GPU algorithms that rely
                 heavily on using the multicore CPU for specific parts
                 of the workload. But for a system to benefit fully from
                 the GPU's significantly higher energy efficiency,
                 avoiding the use of the multicore CPU must be a primary
                 design goal, so the system can rely more heavily on the
                 more efficient GPU. Additionally, this will result in
                 the removal of the costly CPU-to-GPU communication.
                 Furthermore, we do not use a single symmetric
                 multiprocessor (on the GPU) to factorize a single
                 problem at a time. We illustrate how our performance
                 analysis, and the use of profiling and tracing tools,
                 guided the development and optimization of our batched
                 factorization to achieve up to a 2-fold speedup and a
                 3-fold energy efficiency improvement compared to our
                 highly optimized batched CPU implementations based on
                 the MKL library (when using two sockets of Intel Sandy
                 Bridge CPUs). Compared to a batched QR factorization
                 featured in the CUBLAS library for GPUs, we achieved up
                 to $ 5 \times $ speedup on the K40 GPU.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "{Guest Editors}' Note: Special Issue on Clusters,
                 Clouds and Data for Scientific Computing",
  journal =      j-PARALLEL-PROCESS-LETT,
  volume =       "25",
  number =       "3",
  pages =        "1502002:1--1502002:2",
  month =        sep,
  year =         "2015",
  CODEN =        "PPLTEE",
  DOI =          "",
  ISSN =         "0129-6264 (print), 1793-642X (electronic)",
  ISSN-L =       "0129-6264",
  MRclass =      "68-06",
  MRnumber =     "3402373",
  bibdate =      "Tue Apr 4 18:57:22 2017",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Processing Letters",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mark Gates and Azzam Haidar and Yulu
                 Jia and Khairul Kabir and Piotr Luszczek and Stanimire
  title =        "{HPC} Programming on {Intel Many-Integrated-Core}
                 Hardware with {MAGMA} Port to {Xeon Phi}",
  journal =      j-SCI-PROG,
  volume =       "2015",
  number =       "??",
  pages =        "502593:1--502593:11",
  month =        "????",
  year =         "2015",
  CODEN =        "SCIPEV",
  DOI =          "",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Tue Sep 20 07:53:46 MDT 2016",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  journalabr =   "Sci. Prog",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and M. Abalenkovs and A. Abdelfattah and
                 M. Gates and A. Haidar and J. Kurzak and P. Luszczek
                 and S. Tomov and I. Yamazaki and A. YarKhan",
  title =        "Parallel Programming Models for Dense Linear Algebra
                 on Heterogeneous Systems",
  journal =      j-SUPERFRI,
  volume =       "2",
  number =       "4",
  pages =        "67--86",
  month =        "????",
  year =         "2015",
  CODEN =        "????",
  ISSN =         "2409-6008 (print), 2313-8734 (electronic)",
  bibdate =      "Sat Nov 11 07:15:27 MST 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputing Frontiers and Innovations",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Mathieu Faverge and Julien Herrmann and Julien Langou
                 and Bradley Lowery and Yves Robert and Jack Dongarra",
  title =        "Mixing {$ L U $} and {$ Q R $} factorization
                 algorithms to design high-performance dense linear
                 algebra solvers",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "85",
  number =       "??",
  pages =        "32--46",
  month =        nov,
  year =         "2015",
  CODEN =        "JPDCER",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Sat Sep 26 07:40:06 MDT 2015",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Tingxing Dong and Piotr Luszczek and
                 Stanimire Tomov and Jack Dongarra",
  title =        "Batched matrix computations on hardware accelerators
                 based on {GPUs}",
  journal =      j-IJHPCA,
  volume =       "29",
  number =       "2",
  pages =        "193--208",
  month =        may,
  year =         "2015",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Apr 4 14:50:50 MDT 2017",
  bibsource =    ";
  note =         "See retraction notice \cite{Anonymous:2024:RNA}.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "Int. J. High Perform. Comput. Appl.",
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Tingxing Tim Dong and Stanimire Tomov
                 and Piotr Luszczek and Jack Dongarra",
  booktitle =    "{High Performance Computing. ISC High Performance
  title =        "A Framework for Batched and {GPU}-Resident
                 Factorization Algorithms Applied to Block {Householder}
  publisher =    "Springer International Publishing",
  address =      "Cham, Switzerland",
  pages =        "31--47",
  year =         "2015",
  DOI =          "",
  bibdate =      "Fri Dec 21 15:19:09 2018",
  bibsource =    ";
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Tingxing Dong and Piotr Luszczek and
                 Stanimire Tomov and Jack Dongarra",
  title =        "Towards batched linear solvers on accelerated hardware
  journal =      j-SIGPLAN,
  volume =       "50",
  number =       "8",
  pages =        "261--262",
  month =        aug,
  year =         "2015",
  CODEN =        "SINODQ",
  DOI =          "",
  ISSN =         "0362-1340 (print), 1523-2867 (print), 1558-1160
  ISSN-L =       "0362-1340",
  bibdate =      "Tue Feb 16 12:01:42 MST 2016",
  bibsource =    ";
  abstract =     "As hardware evolves, an increasingly effective
                 approach to develop energy efficient, high-performance
                 solvers, is to design them to work on many small and
                 independent problems. Indeed, many applications already
                 need this functionality, especially for GPUs, which are
                 known to be currently about four to five times more
                 energy efficient than multicore CPUs for every
                 floating-point operation. In this paper, we describe
                 the development of the main one-sided factorizations:
                 LU, QR, and Cholesky; that are needed for a set of
                 small dense matrices to work in parallel. We refer to
                 such algorithms as batched factorizations. Our approach
                 is based on representing the algorithms as a sequence
                 of batched BLAS routines for GPU-contained execution.
                 Note that this is similar in functionality to the
                 LAPACK and the hybrid MAGMA algorithms for large-matrix
                 factorizations. But it is different from a
                 straightforward approach, whereby each of GPU's
                 symmetric multiprocessors factorizes a single problem
                 at a time. We illustrate how our performance analysis
                 together with the profiling and tracing tools guided
                 the development of batched factorizations to achieve up
                 to 2-fold speedup and 3-fold better energy efficiency
                 compared to our highly optimized batched CPU
                 implementations based on the MKL library on a
                 two-sockets, Intel Sandy Bridge server. Compared to a
                 batched LU factorization featured in the NVIDIA's
                 CUBLAS library for GPUs, we achieve up to 2.5-fold
                 speedup on the K40 GPU.",
  acknowledgement = ack-nhfb,
  fjournal =     "ACM SIGPLAN Notices",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "PPoPP '15 conference proceedings.",

  author =       "Daniel A. Reed and Jack Dongarra",
  title =        "Exascale computing and big data",
  journal =      j-CACM,
  volume =       "58",
  number =       "7",
  pages =        "56--68",
  month =        jul,
  year =         "2015",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Tue Jul 28 10:56:51 MDT 2015",
  bibsource =    ";
  URL =          "",
  abstract =     "Scientific discovery and engineering innovation
                 requires unifying traditionally separated
                 high-performance computing and big data analytics.",
  acknowledgement = ack-nhfb,
  fjournal =     "Communications of the ACM",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Fengguang Song and Jack Dongarra",
  title =        "A scalable approach to solving dense linear algebra
                 problems on hybrid {CPU--GPU} systems",
  journal =      j-CCPE,
  volume =       "27",
  number =       "14",
  pages =        "3702--3723",
  day =          "25",
  month =        sep,
  year =         "2015",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Sep 28 09:32:54 MDT 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "1 Oct 2014",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Erich Strohmaier and Hans W. Meuer and Jack Dongarra
                 and Horst D. Simon",
  title =        "The {TOP500} List and Progress in High-Performance
  journal =      j-COMPUTER,
  volume =       "48",
  number =       "11",
  pages =        "42--49",
  month =        nov,
  year =         "2015",
  CODEN =        "CPTRB4",
  DOI =          "",
  ISSN =         "0018-9162 (print), 1558-0814 (electronic)",
  ISSN-L =       "0018-9162",
  bibdate =      "Mon Jan 4 18:58:36 MST 2016",
  bibsource =    ";
  URL =          "",
  abstract-URL = "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computer",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Vladimir V. Voevodin and Alexander S. Antonov and Jack
  title =        "{AlgoWiki}: an Open Encyclopedia of Parallel
                 Algorithmic Features",
  journal =      j-SUPERFRI,
  volume =       "2",
  number =       "1",
  pages =        "4--18",
  month =        "????",
  year =         "2015",
  CODEN =        "????",
  ISSN =         "2409-6008 (print), 2313-8734 (electronic)",
  bibdate =      "Sat Nov 11 07:15:27 MST 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputing Frontiers and Innovations",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Stanimire Tomov and Jack
  title =        "Computing Low-Rank Approximation of a Dense Matrix on
                 Multicore {CPUs} with a {GPU} and Its Application to
                 Solving a Hierarchically Semiseparable Linear System of
  journal =      j-SCI-PROG,
  volume =       "2015",
  number =       "??",
  pages =        "246019:1--246019:17",
  month =        "????",
  year =         "2015",
  CODEN =        "SCIPEV",
  DOI =          "",
  ISSN =         "1058-9244 (print), 1875-919X (electronic)",
  ISSN-L =       "1058-9244",
  bibdate =      "Tue Sep 20 07:53:48 MDT 2016",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Scientific Programming",
  journal-URL =  "",
  journalabr =   "Sci. Prog",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Stanimire Tomov and Jack
  title =        "Mixed-Precision {Cholesky} {$ Q R $} Factorization and
                 Its Case Studies on Multicore {CPU} with Multiple
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "37",
  number =       "3",
  pages =        "C307--C330",
  month =        "????",
  year =         "2015",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F05 (65F20 65F25 65Y05 65Y10)",
  MRnumber =     "3345351",
  MRreviewer =   "Jos{\'e}-Javier Mart{\'\i}nez",
  bibdate =      "Sat Aug 8 06:48:44 MDT 2015",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  onlinedate =   "January 2015",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "A. Abdelfattah and H. Anzt and J. Dongarra and M.
                 Gates and A. Haidar and J. Kurzak and P. Luszczek and
                 S. Tomov and I. Yamazaki and A. YarKhan",
  title =        "Linear algebra software for large-scale accelerated
                 multicore computing",
  journal =      j-ACTA-NUMERICA,
  volume =       "25",
  pages =        "1--160",
  year =         "2016",
  CODEN =        "ANUMFU",
  DOI =          "",
  ISSN =         "0962-4929 (print), 1474-0508 (electronic)",
  ISSN-L =       "0962-4929",
  MRclass =      "65-02 (65Fxx 65Y05)",
  MRnumber =     "3509208",
  MRreviewer =   "Michael J. Carley",
  bibdate =      "Tue May 24 12:29:05 MDT 2016",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ajournal =     "Acta Numer.",
  fjournal =     "Acta Numerica",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Hatem Ltaief and David Keyes and
                 Jack Dongarra",
  title =        "Performance optimization of Sparse Matrix-Vector
                 Multiplication for multi-component {PDE}-based
                 applications using {GPUs}",
  journal =      j-CCPE,
  volume =       "28",
  number =       "12",
  pages =        "3447--3465",
  day =          "25",
  month =        aug,
  year =         "2016",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Tue Sep 13 08:30:12 MDT 2016",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Edmond Chow and Daniel B. Szyld and
                 Jack Dongarra",
  booktitle =    "Software for exascale computing---{SPPEXA}
  title =        "Domain overlap for iterative sparse triangular solves
                 on {GPUs}",
  volume =       "113",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "527--545",
  year =         "2016",
  MRclass =      "65F50 (65Y10)",
  MRnumber =     "3706434",
  bibdate =      "Tue May 8 15:32:28 2018",
  bibsource =    "",
  series =       "Lect. Notes Comput. Sci. Eng.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Edmond Chow and Jens Saak and Jack
  title =        "Updating incomplete factorization preconditioners for
                 model order reduction",
  journal =      j-NUMER-ALGORITHMS,
  volume =       "73",
  number =       "3",
  pages =        "611--630",
  month =        nov,
  year =         "2016",
  CODEN =        "NUALEG",
  DOI =          "",
  ISSN =         "1017-1398 (print), 1572-9265 (electronic)",
  ISSN-L =       "1017-1398",
  MRclass =      "65F08",
  MRnumber =     "3564862",
  MRreviewer =   "Bruno Carpentieri",
  bibdate =      "Wed Mar 1 09:12:13 MST 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Numerical Algorithms",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Jack Dongarra and Adrien R{\'e}my
                 and Stanimire Tomov and Ichitaro Yamazaki",
  booktitle =    "Parallel processing and applied mathematics. {Part
  title =        "Dense symmetric indefinite factorization on {GPU}
                 accelerated architectures",
  volume =       "9573",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "86--95",
  year =         "2016",
  DOI =          "",
  MRclass =      "65F99 (65Y10 68W20)",
  MRnumber =     "3492296",
  bibdate =      "Thu Jun 29 09:17:17 2017",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Michael A. Heroux and Piotr
  title =        "High-performance conjugate-gradient benchmark: a new
                 metric for ranking high-performance computing systems",
  journal =      j-IJHPCA,
  volume =       "30",
  number =       "1",
  pages =        "3--10",
  month =        feb,
  year =         "2016",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Apr 4 14:51:30 MDT 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Michael A. Heroux and Piotr
  title =        "A new metric for ranking high performance computing
  journal =      j-NATL-SCI-REV,
  volume =       "??",
  number =       "??",
  pages =        "??--??",
  day =          "6",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2053-714X (print), 2095-5138 (electronic)",
  ISSN-L =       "2053-714X",
  bibdate =      "Mon Jan 11 09:14:33 2016",
  bibsource =    "",
  URL =          "",
  abstract =     "We present the HPCG benchmark: High Performance
                 Conjugate Gradients that is aimed at providing more
                 application-oriented measurement of system performance
                 when compared with the High Performance LINPACK
                 benchmark. We show the model partial differential
                 equation and its discretization as well as the
                 algorithm for iteratively solving it. The performance
                 results show how HPCG ranks large supercomputing
                 installations and delivers a richer view of important
                 system characteristics.",
  acknowledgement = ack-nhfb,
  fjournal =     "National Science Review",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  remark =       "In-progress publication: no volume/number/pages yet

  author =       "Julien Herrmann and George Bosilca and Thomas
                 H{\'e}rault and Loris Marchal and Yves Robert and Jack
  title =        "Assessing the cost of redistribution followed by a
                 computational kernel: Complexity and performance
  journal =      j-PARALLEL-COMPUTING,
  volume =       "52",
  number =       "??",
  pages =        "22--41",
  month =        feb,
  year =         "2016",
  CODEN =        "PACOEJ",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Fri Feb 12 18:56:20 MST 2016",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Heike Jagode and Anthony Danalis and George Bosilca
                 and Jack Dongarra",
  booktitle =    "Parallel processing and applied mathematics. {Part
  title =        "Accelerating {NWChem} coupled cluster through
                 dataflow-based execution",
  volume =       "9573",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "366--376",
  year =         "2016",
  DOI =          "",
  MRclass =      "80A50 (65Y05 92E10)",
  MRnumber =     "3492322",
  bibdate =      "Thu Jun 29 09:18:26 2017",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Hartwig Anzt and Mark Gates and Jack
  title =        "Implementation and Tuning of Batched {Cholesky}
                 Factorization and Solve for {NVIDIA} {GPUs}",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "27",
  number =       "7",
  pages =        "2036--2048",
  month =        jul,
  year =         "2016",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Tue Jun 14 09:25:28 MDT 2016",
  bibsource =    ";
  URL =          "",
  abstract-URL = "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ian Masliah and Ahmad Abdelfattah and A. Haidar and S.
                 Tomov and Marc Baboulin and J. Falcou and J. Dongarra",
  booktitle =    "{Euro-Par 2016}: parallel processing",
  title =        "High-performance matrix--matrix multiplications of
                 very small matrices",
  volume =       "9833",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "659--671",
  year =         "2016",
  DOI =          "",
  MRclass =      "65F99 (65Y99 68M07)",
  MRnumber =     "3568397",
  bibdate =      "Thu Jun 29 09:18:56 2017",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Stanimire Tomov and Jack
  title =        "Stability and Performance of Various Singular Value {$
                 Q R $} Implementations on Multicore {CPU} with a
  journal =      j-TOMS,
  volume =       "43",
  number =       "2",
  pages =        "10:1--10:18",
  month =        sep,
  year =         "2016",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65F15 (65Y10)",
  MRnumber =     "3550008",
  bibdate =      "Tue Nov 22 17:45:25 MST 2016",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  articleno =    "10",
  fjournal =     "ACM Transactions on Mathematical Software",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Azzam Haidar and Stanimire Tomov
                 and Jack Dongarra",
  title =        "Fast {Cholesky} factorization on {GPUs} for batch and
                 native modes in {MAGMA}",
  journal =      j-J-COMPUT-SCI,
  volume =       "20",
  pages =        "85--93",
  month =        may,
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:54:22 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Stanimire Tomov and Jack Dongarra",
  title =        "On the performance and energy efficiency of sparse
                 linear algebra on {GPUs}",
  journal =      j-IJHPCA,
  volume =       "31",
  number =       "5",
  pages =        "375--390",
  month =        sep,
  year =         "2017",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Jan 6 10:31:59 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Mark Gates and Jack Dongarra and
                 Moritz Kreutzer and Gerhard Wellein and Martin
  title =        "Preconditioned {Krylov} solvers on {GPUs}",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "68",
  number =       "??",
  pages =        "32--44",
  month =        oct,
  year =         "2017",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F10 (65F08 65Y05 65Y10 65Y20 68W10)",
  MRnumber =     "3689686",
  bibdate =      "Thu Aug 24 15:19:06 MDT 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Marc Baboulin and Jack Dongarra and Adrien R{\'e}my
                 and Stanimire Tomov and Ichitaro Yamazaki",
  title =        "Solving dense symmetric indefinite systems using
  journal =      j-CCPE,
  volume =       "29",
  number =       "9",
  pages =        "??--??",
  day =          "10",
  month =        may,
  year =         "2017",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Mon Jul 24 08:22:36 MDT 2017",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Gordon Bell and David H. Bailey and Jack Dongarra and
                 Alan H. Karp and Kevin Walsh",
  title =        "A look back on 30 years of the {Gordon Bell Prize}",
  journal =      j-IJHPCA,
  volume =       "31",
  number =       "6",
  pages =        "469--484",
  month =        nov,
  year =         "2017",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Jan 6 10:31:59 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Stanimire Tomov and Piotr Luszczek
                 and Jakub Kurzak and Mark Gates and Ichitaro Yamazaki
                 and Hartwig Anzt and Azzam Haidar and Ahmad
  title =        "With Extreme Computing, the Rules Have Changed",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "19",
  number =       "3",
  pages =        "52--62",
  month =        may # "\slash " # jun,
  year =         "2017",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Thu Aug 24 06:23:55 MDT 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "{Guest Editor}'s Note: Special Issue on Clusters,
                 Clouds and Data for Scientific Computing",
  journal =      j-IJHPCA,
  volume =       "31",
  number =       "1",
  pages =        "3--3",
  month =        jan,
  year =         "2017",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue Apr 4 14:51:30 MDT 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Panruo Wu and Stanimire Tomov and
                 Jack Dongarra",
  booktitle =    "Proceedings of the {8th Workshop on Latest Advances in
                 Scalable Algorithms for Large-Scale Systems ---
  title =        "Investigating half precision arithmetic to accelerate
                 dense linear system solvers",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  year =         "2017",
  DOI =          "",
  ISBN =         "1-4503-5125-5 (hardcover)",
  ISBN-13 =      "978-1-4503-5125-6 (hardcover)",
  LCCN =         "????",
  bibdate =      "Thu Nov 7 16:51:39 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sergey V. Kovalchuk and Tesfamariam M. Abuhay and
                 Ilkay Altintas and Michael L. Norman and Michael H.
                 Lees and Valeria V. Krzhizhanovskaya and Jack Dongarra
                 and Peter M. A. Sloot",
  title =        "Data through the {Computational Lens}",
  journal =      j-J-COMPUT-SCI,
  volume =       "20",
  pages =        "81--84",
  month =        may,
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:54:22 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jakub Kurzak and Piotr Luszczek and Ichitaro Yamazaki
                 and Yves Robert and Jack Dongarra",
  title =        "Design and Implementation of the {PULSAR} Programming
                 System for Large Scale Computing",
  journal =      j-SUPERFRI,
  volume =       "4",
  number =       "1",
  pages =        "4--26",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  ISSN =         "2409-6008 (print), 2313-8734 (electronic)",
  bibdate =      "Sat Nov 11 07:15:27 MST 2017",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Supercomputing Frontiers and Innovations",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Stanimire Tomov and Jack
                 Dongarra",
  title =        "Non-{GPU}-resident symmetric indefinite
                 factorization",
  journal =      j-CCPE,
  volume =       "29",
  number =       "5",
  pages =        "??--??",
  day =          "10",
  month =        mar,
  year =         "2017",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Sat Feb 18 10:07:19 MST 2017",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Asim YarKhan and Jakub Kurzak and Piotr Luszczek and
                 Jack Dongarra",
  title =        "Porting the {PLASMA} Numerical Library to the {OpenMP}
                 Standard",
  journal =      j-INT-J-PARALLEL-PROG,
  volume =       "45",
  number =       "3",
  pages =        "612--633",
  month =        jun,
  year =         "2017",
  CODEN =        "IJPPE5",
  DOI =          "",
  ISSN =         "0885-7458 (print), 1573-7640 (electronic)",
  ISSN-L =       "0885-7458",
  bibdate =      "Sat Jun 24 11:37:59 MDT 2017",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of Parallel Programming",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Azzam Haidar and Stanimire Tomov
                 and Jack Dongarra",
  title =        "Analysis and Design Techniques towards
                 High-Performance and Energy-Efficient Dense Linear
                 Solvers on {GPUs}",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "29",
  number =       "12",
  pages =        "2700--2712",
  month =        dec,
  year =         "2018",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu Nov 15 10:36:45 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Azzam Haidar and Stanimire Tomov
                 and Jack Dongarra",
  title =        "Batched one-sided factorizations of tiny matrices
                 using {GPUs}: Challenges and countermeasures",
  journal =      j-J-COMPUT-SCI,
  volume =       "26",
  pages =        "226--236",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:54:46 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Thomas K. Huckle and J{\"u}rgen
                 Br{\"a}ckle and Jack Dongarra",
  title =        "Incomplete Sparse Approximate Inverses for Parallel
                 Preconditioning",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "71",
  number =       "??",
  pages =        "1--22",
  month =        jan,
  year =         "2018",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F08 (65Y05)",
  MRnumber =     "3735016",
  bibdate =      "Tue Nov 6 11:59:37 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Moritz Kreutzer and Eduardo Ponce and
                 Gregory D. Peterson and Gerhard Wellein and Jack
                 Dongarra",
  title =        "Optimization and performance evaluation of the {IDR}
                 iterative {Krylov} solver on {GPUs}",
  journal =      j-IJHPCA,
  volume =       "32",
  number =       "2",
  pages =        "220--230",
  month =        mar,
  year =         "2018",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Mon Nov 5 17:34:16 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Edmond Chow and Jack Dongarra",
  title =        "{ParILUT} --- A New Parallel Threshold {$ I L U $}
                 Factorization",
  journal =      j-SIAM-J-SCI-COMP,
  volume =       "40",
  number =       "4",
  pages =        "C503--C519",
  month =        "????",
  year =         "2018",
  CODEN =        "SJOCE3",
  DOI =          "",
  ISSN =         "1064-8275 (print), 1095-7197 (electronic)",
  ISSN-L =       "1064-8275",
  MRclass =      "65F08 (65F50 65Y05 68W10)",
  MRnumber =     "3827194",
  MRreviewer =   "Atanaska Tencheva Georgieva",
  bibdate =      "Tue Nov 6 11:59:37 2018",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Journal on Scientific Computing",
  journal-URL =  "",
  onlinedate =   "January 2018",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "M. Asch and T. Moore and R. Badia and M. Beck and P.
                 Beckman and T. Bidot and F. Bodin and F. Cappello and
                 A. Choudhary and B. de Supinski and E. Deelman and J.
                 Dongarra and A. Dubey and G. Fox and H. Fu and S.
                 Girona and W. Gropp and M. Heroux and Y. Ishikawa and
                 K. Keahey and D. Keyes and W. Kramer and J-F Lavignon
                 and Y. Lu and S. Matsuoka and B. Mohr and D. Reed and
                 S. Requena and J. Saltz and T. Schulthess and R.
                 Stevens and M. Swany and A. Szalay and W. Tang and G.
                 Varoquaux and J.-P. Vilotte and R. Wisniewski and Z. Xu
                 and I. Zacharov",
  title =        "Big data and extreme-scale computing",
  journal =      j-IJHPCA,
  volume =       "32",
  number =       "4",
  pages =        "435--479",
  month =        jul,
  year =         "2018",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Mon Nov 5 17:34:17 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "George Bosilca and Aurelien Bouteiller and Amina
                 Guermouche and Thomas Herault and Yves Robert and
                 Pierre Sens and Jack Dongarra",
  title =        "A failure detector for {HPC} platforms",
  journal =      j-IJHPCA,
  volume =       "32",
  number =       "1",
  pages =        "139--158",
  month =        jan,
  year =         "2018",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Jan 6 10:32:00 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Edmond Chow and Hartwig Anzt and Jennifer Scott and
                 Jack Dongarra",
  title =        "Using {Jacobi} iterations and blocking for solving
                 sparse triangular systems in incomplete factorization
                 preconditioning",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "119",
  number =       "??",
  pages =        "219--230",
  month =        sep,
  year =         "2018",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Thu May 31 06:49:57 MDT 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Tingxing Dong and Azzam Haidar and Stanimire Tomov and
                 Jack Dongarra",
  title =        "Accelerating the {SVD} bi-diagonalization of a batch
                 of small matrices using {GPUs}",
  journal =      j-J-COMPUT-SCI,
  volume =       "26",
  pages =        "237--245",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:54:46 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Guest editors' note",
  journal =      j-IJHPCA,
  volume =       "32",
  number =       "1",
  pages =        "3--3",
  month =        jan,
  year =         "2018",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Jan 6 10:32:00 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Michael A. Heroux and Piotr
                 Luszczek",
  title =        "The high-performance conjugate gradients benchmark",
  journal =      j-SIAM-NEWS,
  volume =       "51",
  number =       "1",
  pages =        "12",
  year =         "2018",
  ISSN =         "1557-9573",
  MRclass =      "65F10 (68M14 68W10)",
  MRnumber =     "3823058",
  bibdate =      "Tue Jan 8 09:16:53 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM News",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mark Gates and Azzam Haidar and
                 Jakub Kurzak and Piotr Luszczek and Stanimire Tomov and
                 Ichitaro Yamazaki",
  title =        "The singular value decomposition: anatomy of
                 optimizing an algorithm for extreme scale",
  journal =      j-SIAM-REVIEW,
  volume =       "60",
  number =       "4",
  pages =        "808--865",
  year =         "2018",
  CODEN =        "SIREAD",
  DOI =          "",
  ISSN =         "0036-1445 (print), 1095-7200 (electronic)",
  ISSN-L =       "0036-1445",
  MRclass =      "65F15 (15A18 15A23 65Y05)",
  MRnumber =     "3873018",
  MRreviewer =   "Andreas Frommer",
  bibdate =      "Tue Jan 8 09:17:10 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "SIAM Review",
  journal-URL =  "",
  onlinedate =   "January 2018",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Mark Gates and Stanimire Tomov and Jack Dongarra",
  title =        "Accelerating the {SVD} two stage bidiagonal reduction
                 and divide and conquer using {GPUs}",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "74",
  pages =        "3--18",
  year =         "2018",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F15 (65Y10)",
  MRnumber =     "3771320",
  bibdate =      "Tue Nov 6 11:59:37 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Ahmad Abdelfattah and Mawussi Zounon
                 and Panruo Wu and Srikara Pranesh and Stanimire Tomov
                 and Jack Dongarra",
  booktitle =    "Computational science---{ICCS 2018}. {Part I}",
  title =        "The design of fast and energy-efficient linear
                 solvers: on the potential of half-precision arithmetic
                 and iterative refinement techniques",
  volume =       "10860",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "586--600",
  year =         "2018",
  DOI =          "",
  ISBN =         "3-319-93698-0; 3-319-93697-2",
  ISBN-13 =      "978-3-319-93698-7; 978-3-319-93697-0",
  MRclass =      "65Fxx (65Y10)",
  MRnumber =     "3815810",
  bibdate =      "Tue Jan 8 09:18:00 2019",
  bibsource =    ";
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Ahmad Abdelfattah and Mawussi Zounon
                 and Stanimire Tomov and Jack Dongarra",
  title =        "A Guide for Achieving High Performance with Very Small
                 Matrices on {GPU}: A Case Study of Batched {$ L U $}
                 and {Cholesky} Factorizations",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "29",
  number =       "5",
  pages =        "973--984",
  month =        may,
  year =         "2018",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu Apr 12 07:16:29 MDT 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Stanimire Tomov and Jack Dongarra and
                 Nicholas J. Higham",
  editor =       "{IEEE}",
  booktitle =    "{SC '18 Proceedings of the International Conference
                 for High Performance Computing, Networking, Storage,
                 and Analysis, Dallas, Texas, November 11--16, 2018}",
  title =        "Harnessing {GPU} tensor cores for fast {FP16}
                 arithmetic to speed up mixed-precision iterative
                 refinement solvers",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "47:1--47:11",
  year =         "2018",
  DOI =          "",
  ISBN =         "1-5386-8384-9",
  ISBN-13 =      "978-1-5386-8384-2",
  LCCN =         "????",
  bibdate =      "Sat Jan 19 18:51:19 2019",
  bibsource =    ";
  URL =          ";
  abstract =     "Low-precision floating-point arithmetic is a powerful
                 tool for accelerating scientific computing
                 applications, especially those in artificial
                 intelligence. Here, we present an investigation showing
                 that other high-performance computing (HPC)
                 applications can also harness this power. Specifically,
                 we use the general HPC problem, Ax = b, where A is a
                 large dense matrix, and a double precision (FP64)
                 solution is needed for accuracy. Our approach is based
                 on mixed-precision (FP16 $ \to $ FP64) iterative
                 refinement, and we generalize and extend prior advances
                 into a framework, for which we develop
                 architecture-specific algorithms and highly tuned
                 implementations. These new methods show how using
                 half-precision Tensor Cores (FP16-TC) for the
                 arithmetic can provide up to 4X speedup. This is due to
                 the performance boost that the FP16-TC provide as well
                 as to the improved accuracy over the classical FP16
                 arithmetic that is obtained because the GEMM
                 accumulation occurs in FP32 arithmetic.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Heike Jagode and Anthony Danalis and Jack Dongarra",
  title =        "Accelerating {NWChem Coupled Cluster} through
                 dataflow-based execution",
  journal =      j-IJHPCA,
  volume =       "32",
  number =       "4",
  pages =        "540--551",
  month =        jul,
  year =         "2018",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Mon Nov 5 17:34:17 MST 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Heike Jagode and Anthony Danalis and Reazul Hoque and
                 Mathieu Faverge and Jack Dongarra",
  title =        "Evaluation of dataflow programming models for
                 electronic structure theory",
  journal =      j-CCPE,
  volume =       "30",
  number =       "17",
  pages =        "e4490:1--e4490:??",
  day =          "10",
  month =        sep,
  year =         "2018",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Thu Mar 28 08:07:51 MDT 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "24 April 2018",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sergey V. Kovalchuk and Valeria V. Krzhizhanovskaya
                 and Petros Koumoutsakos and Eleni Chatzi and Michael H.
                 Lees and Jack Dongarra and Peter M. A. Sloot",
  title =        "The art of computational science: Bridging gaps ---
                 forming alloys",
  journal =      j-J-COMPUT-SCI,
  volume =       "26",
  pages =        "190--192",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:54:46 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Jakub Kurzak and Panruo Wu and
                 Mawussi Zounon and Jack Dongarra",
  title =        "Symmetric Indefinite Linear Solver Using {OpenMP} Task
                 on Multicore Architectures",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "29",
  number =       "8",
  pages =        "1879--1892",
  month =        aug,
  year =         "2018",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Wed Jul 25 09:07:14 MDT 2018",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
                 Systems",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Jack Dongarra and Goran Flegar and
                 Nicholas J. Higham and Enrique S. Quintana-Ort{\'\i}",
  title =        "Adaptive precision in block-{Jacobi} preconditioning
                 for iterative sparse linear system solvers",
  journal =      j-CCPE,
  volume =       "31",
  number =       "6",
  pages =        "e4460:1--e4460:??",
  day =          "25",
  month =        mar,
  year =         "2019",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Thu Mar 28 08:07:56 MDT 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "12 March 2018",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Jack Dongarra and Enrique S.
                 Quintana-Ort{\'\i}",
  title =        "Fine-grained bit-flip protection for relaxation
                 methods",
  journal =      j-J-COMPUT-SCI,
  volume =       "36",
  pages =        "??--??",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  MRclass =      "15A06 (65F10)",
  MRnumber =     "4017508",
  bibdate =      "Tue Sep 19 13:55:19 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "100583",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Jack Dongarra and Goran Flegar and
                 Enrique S. Quintana-Ort{\'\i}",
  title =        "Variable-size batched {Gauss--Jordan} elimination for
                 block-{Jacobi} preconditioning on graphics processors",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "81",
  pages =        "131--146",
  month =        jan,
  year =         "2019",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F08 (65Y10)",
  MRnumber =     "3913128",
  bibdate =      "Mon Jan 7 15:25:21 MST 2019",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Guest editors' note: Special issue on clusters,
                 clouds, and data for scientific computing",
  journal =      j-IJHPCA,
  volume =       "33",
  number =       "6",
  pages =        "1067--1068",
  day =          "1",
  month =        nov,
  year =         "2019",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Wed Oct 9 14:35:54 MDT 2019",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Piotr Luszczek and Yaohung (Mike)
                 Tsai",
  title =        "{HPL-AI} Mixed-Precision Benchmark",
  howpublished = "Web site",
  month =        dec,
  year =         "2019",
  bibdate =      "Thu Dec 05 10:09:59 2019",
  bibsource =    "",
  URL =          ";
  abstract =     "The HPL-AI benchmark seeks to highlight the emerging
                 convergence of high-performance computing (HPC) and
                 artificial intelligence (AI) workloads. While
                 traditional HPC focused on simulation runs for modeling
                 phenomena in physics, chemistry, biology, and so on,
                 the mathematical models that drive these computations
                 require, for the most part, 64-bit accuracy. On the
                 other hand, the machine learning methods that fuel
                 advances in AI achieve desired results at 32-bit and
                 even lower floating-point precision formats. This
                 lesser demand for accuracy fueled a resurgence of
                 interest in new hardware platforms that deliver a mix
                 of unprecedented performance levels and energy savings
                 to achieve the classification and recognition fidelity
                 afforded by higher-accuracy formats.\par

                 HPL-AI strives to unite these two realms by delivering
                 a blend of modern algorithms and contemporary hardware
                 while simultaneously connecting to the solver
                 formulation of the decades-old HPL framework of
                 benchmarking the largest supercomputing installations
                 in the world. The solver method of choice is a
                 combination of $ L U $ factorization and iterative
                 refinement performed afterwards to bring the solution
                 back to 64-bit accuracy. The innovation of HPL-AI lies
                 in dropping the requirement of 64-bit computation
                 throughout the entire solution process and instead
                 opting for low-precision (likely 16-bit) accuracy for $
                 L U $, and a sophisticated iteration to recover the
                 accuracy lost in factorization. The iterative method
                 guaranteed to be numerically stable is the generalized
                 minimal residual method (GMRES), which uses application
                 of the $L$ and $U$ factors to serve as a
                 preconditioner. The combination of these algorithms is
                 demonstrably sufficient for high accuracy and may be
                 implemented in a way that takes advantage of the
                 current and upcoming devices for accelerating AI
                 workloads.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mark Gates and Azzam Haidar and
                 Jakub Kurzak and Piotr Luszczek and Panruo Wu and
                 Ichitaro Yamazaki and Asim Yarkhan and Maksims
                 Abalenkovs and Negin Bagherpour and Sven Hammarling and
                 Jakub S{\'\i}stek and David Stevens and Mawussi Zounon
                 and Samuel D. Relton",
  title =        "{PLASMA}: Parallel Linear Algebra Software for
                 Multicore Using {OpenMP}",
  journal =      j-TOMS,
  volume =       "45",
  number =       "2",
  pages =        "16:1--16:35",
  month =        apr,
  year =         "2019",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65Fxx (65Y05)",
  MRnumber =     "3963988",
  bibdate =      "Mon May 6 18:23:42 MDT 2019",
  bibsource =    ";
  URL =          "",
  abstract =     "The recent version of the Parallel Linear Algebra
                 Software for Multicore Architectures (PLASMA) library
                 is based on tasks with dependencies from the OpenMP
                 standard. The main functionality of the library is
                 presented. Extensive benchmarks are targeted on three
                 recent multicore and manycore architectures, namely, an
                 Intel Xeon, Intel Xeon Phi, and IBM POWER 8
                 processors.",
  acknowledgement = ack-nhfb,
  articleno =    "16",
  fjournal =     "ACM Transactions on Mathematical Software (TOMS)",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "J. Dongarra and S. Gottlieb and W. T. C. Kramer",
  title =        "Race to Exascale",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "21",
  number =       "1",
  pages =        "4--5",
  month =        jan # "\slash " # feb,
  year =         "2019",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Tue Mar 12 10:39:49 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  keywords =     "Analytical models; Big Data; Data analysis; Data
                 models; Exascale computing; High performance computing;
                 Investments; Machine learning; Special issues and
                 sections",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Valentin {Le F{\`e}vre} and Thomas Herault and Yves
                 Robert and Aurelien Bouteiller and Atsushi Hori and
                 George Bosilca and Jack Dongarra",
  title =        "Comparing the performance of rigid, moldable and
                 grid-shaped applications on failure-prone {HPC}
                 platforms",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "85",
  number =       "??",
  pages =        "1--12",
  month =        jul,
  year =         "2019",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Mon Oct 14 16:20:01 MDT 2019",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Heike Jagode and Phil Vaccaro and
                 Asim YarKhan and Stanimire Tomov and Jack Dongarra",
  title =        "Investigating power capping toward energy-efficient
                 scientific applications",
  journal =      j-CCPE,
  volume =       "31",
  number =       "6",
  pages =        "e4485:1--e4485:??",
  day =          "25",
  month =        mar,
  year =         "2019",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Thu Mar 28 08:07:56 MDT 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "22 March 2018",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Heike Jagode and Anthony Danalis and Hartwig Anzt and
                 Jack Dongarra",
  title =        "{PAPI} software-defined events for in-depth
                 performance analysis",
  journal =      j-IJHPCA,
  volume =       "33",
  number =       "6",
  pages =        "1113--1127",
  day =          "1",
  month =        nov,
  year =         "2019",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Wed Oct 9 14:35:54 MDT 2019",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sergey V. Kovalchuk and Valeria V. Krzhizhanovskaya
                 and Yong Shi and Haohuan Fua and Michael H. Lees and
                 Jack Dongarra and Peter M. A. Sloot",
  title =        "Science at the intersection of data, modelling, and
  journal =      j-J-COMPUT-SCI,
  volume =       "34",
  pages =        "117--119",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:55:17 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "I. Masliah and A. Abdelfattah and A. Haidar and S.
                 Tomov and M. Baboulin and J. Falcou and J. Dongarra",
  title =        "Algorithms and optimization techniques for
                 high-performance matrix--matrix multiplications of very
                 small matrices",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "81",
  pages =        "1--21",
  month =        jan,
  year =         "2019",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65F99 (65Y05)",
  MRnumber =     "3874624",
  bibdate =      "Mon Jan 7 15:25:21 MST 2019",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Akihiro Ida and Rio Yokota and
                 Jack Dongarra",
  title =        "Distributed-memory lattice {$H$}-matrix
  journal =      j-IJHPCA,
  volume =       "33",
  number =       "5",
  pages =        "1046--1063",
  day =          "1",
  month =        sep,
  year =         "2019",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Wed Oct 9 14:35:54 MDT 2019",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ichitaro Yamazaki and Edmond Chow and Aurelien
                 Bouteiller and Jack Dongarra",
  title =        "Performance of asynchronous optimized {Schwarz} with
                 one-sided communication",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "86",
  pages =        "66--81",
  year =         "2019",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  MRclass =      "65N55 (65Y05)",
  MRnumber =     "3956061",
  bibdate =      "Thu Jun 20 13:48:30 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Parallel Computing. Systems \& Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "D. Zaitsev and S. Tomov and J. Dongarra",
  title =        "Solving Linear {Diophantine} Systems on Parallel
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "30",
  number =       "5",
  pages =        "1158--1169",
  month =        may,
  year =         "2019",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Fri Aug 30 06:09:58 2019",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
  journal-URL =  "",
  keywords =     "application program interfaces; clan; discrete system
                 modeling; discrete-event systems; distributed memory
                 systems; distributed-memory computing nodes;
                 distributing systems; dynamic task-dispatching
                 subsystem; formal languages; linear Diophantine system;
                 linear Diophantine systems-of-equations; logic
                 programming; Mathematical model; mathematics computing;
                 Matrix decomposition; message passing; model checking;
                 MPI; multiple cores; nonnegative integer numbers;
                 OpenMP; parallel architectures; Parallel architectures;
                 parallel architectures; parallel-sequential
                 composition; Petri net; Petri nets; polynomials; single
                 indecomposable system; Software algorithms; Sparse
                 matrices; sparse matrices; sparse matrix; speed-up;
                 system clans; Task analysis; two-level parallelization
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Stan Tomov and Jack Dongarra",
  title =        "Investigating the Benefit of {FP16}-Enabled
                 Mixed-Precision Solvers for Symmetric Positive Definite
                 Matrices Using {GPUs}",
  crossref =     "Krzhizhanovskaya:2020:CSI",
  pages =        "237--250",
  year =         "2020",
  DOI =          "",
  MRclass =      "65F05 (65Y10)",
  MRnumber =     "4150067",
  bibdate =      "Thu Jun 25 08:49:09 2020",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Stanimire Tomov and Jack
  title =        "Matrix multiplication on batches of small matrices in
                 half and half-complex precisions",
  journal =      j-J-PAR-DIST-COMP,
  volume =       "145",
  number =       "??",
  pages =        "188--201",
  month =        nov,
  year =         "2020",
  CODEN =        "JPDCER",
  DOI =          "",
  ISSN =         "0743-7315 (print), 1096-0848 (electronic)",
  ISSN-L =       "0743-7315",
  bibdate =      "Wed May 26 16:11:03 MDT 2021",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "Journal of Parallel and Distributed Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Anonymous",
  title =        "{Jack Dongarra} Selected to Receive the {2020 IEEE
                 Computer Society's Computer Pioneer Award}",
  howpublished = "University of Tennessee Knoxville Web site.",
  day =          "4",
  month =        feb,
  year =         "2020",
  bibdate =      "Fri Aug 21 15:31:58 2020",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Hartwig Anzt and Terry Cojean and Chen Yen-Chen and
                 Jack Dongarra and Goran Flegar and Pratik Nayak and
                 Stanimire Tomov and Yuhsiang M. Tsai and Weichung
  title =        "Load-balancing Sparse Matrix Vector Product Kernels on
  journal =      j-TOPC,
  volume =       "7",
  number =       "1",
  pages =        "2:1--2:26",
  month =        apr,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-4949 (print), 2329-4957 (electronic)",
  ISSN-L =       "2329-4949",
  bibdate =      "Mon Apr 6 08:56:55 MDT 2020",
  bibsource =    ";
  URL =          "",
  abstract =     "Efficient processing of Irregular Matrices on Single
                 Instruction, Multiple Data (SIMD)-type architectures is
                 a persistent challenge. Resolving it requires
                 innovations in the development of data formats,
                 computational techniques, and implementations that
                 strike a balance between thread divergence, which is
                 inherent for Irregular Matrices, and padding, which
                 alleviates the performance-detrimental thread
                 divergence but introduces artificial overheads. To this
                 end, in this article, we address the challenge of
                 designing high performance sparse matrix-vector product
                 (SpMV) kernels designed for Nvidia Graphics Processing
                 Units (GPUs). We present a compressed sparse row (CSR)
                 format suitable for unbalanced matrices. We also
                 provide a load-balancing kernel for the coordinate
                 (COO) matrix format and extend it to a hybrid algorithm
                 that stores part of the matrix in SIMD-friendly Ellpack
                 format (ELL) format. The ratio between the ELL- and the
                 COO-part is determined using a theoretical analysis of
                 the nonzeros-per-row distribution. For the over 2,800
                 test matrices available in the Suite Sparse matrix
                 collection, we compare the performance against SpMV
                 kernels provided by NVIDIA's cuSPARSE library and a
                 heavily-tuned sliced ELL (SELL-P) kernel that prevents
                 unnecessary padding by considering the irregular
                 matrices as a combination of matrix blocks stored in
                 ELL format.",
  acknowledgement = ack-nhfb,
  articleno =    "2",
  fjournal =     "ACM Transactions on Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Alan Ayala and Stanimire Tomov and Azzam Haidar and
                 Jack Dongarra",
  booktitle =    "Computational science---{ICCS} 2020. {Part} {I}",
  title =        "{\it he{FFT}e}: highly efficient {FFT} for exascale",
  volume =       "12137",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "262--275",
  year =         "2020",
  DOI =          "",
  ISBN =         "3-030-50371-2; 3-030-50370-4",
  ISBN-13 =      "978-3-030-50371-0; 978-3-030-50370-3",
  MRclass =      "65T50 (65Y10)",
  MRnumber =     "4149894",
  bibdate =      "Tue Sep 19 12:50:04 2023",
  bibsource =    "",
  series =       "Lecture Notes in Comput. Sci.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Pedro J. S. Cardoso and Jo{\~a}o M. F. Rodrigues and
                 J{\^a}nio Monteiro and Roberto Lam and Valeria V.
                 Krzhizhanovskaya and Michael H. Lees and Jack Dongarra
                 and Peter M. A. Sloot",
  title =        "Computational Science in the Interconnected World:
                 Selected papers from {2019 International Conference on
                 Computational Science}",
  journal =      j-J-COMPUT-SCI,
  volume =       "47",
  pages =        "??--??",
  month =        nov,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  MRclass =      "65-06",
  MRnumber =     "4156958",
  bibdate =      "Tue Sep 19 13:55:40 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "101222",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Laura Grigori and Nicholas J.
  title =        "Numerical algorithms for high-performance
                 computational science",
  journal =      j-PHILOS-TRANS-R-SOC-LOND-SER-A,
  volume =       "378",
  number =       "2166",
  pages =        "20190066:1--20190066:18",
  year =         "2020",
  CODEN =        "PTRMAD, PTMSFB",
  DOI =          "",
  ISSN =         "1364-503X (print), 1471-2962 (electronic)",
  ISSN-L =       "1364-503X",
  MRclass =      "65Y10",
  MRnumber =     "4072450",
  bibdate =      "Fri Jul 9 15:12:06 2021",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ajournal =     "Philos. Trans. Roy. Soc. A",
  fjournal =     "Philosophical Transactions of the Royal Society A.
                 Mathematical, Physical and Engineering Sciences",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Mohammed {Al Farhan} and Ahmad Abdelfattah and
                 Stanimire Tomov and Mark Gates and Dalal Sukkari and
                 Azzam Haidar and Robert Rosenberg and Jack Dongarra",
  title =        "{MAGMA} templates for scalable linear algebra on
                 emerging architectures",
  journal =      j-IJHPCA,
  volume =       "34",
  number =       "6",
  pages =        "645--658",
  day =          "1",
  month =        nov,
  year =         "2020",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Tue May 18 15:46:08 MDT 2021",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Azzam Haidar and Harun Bayraktar and Stanimire Tomov
                 and Jack Dongarra and Nicholas J. Higham",
  title =        "Mixed-precision iterative refinement using tensor
                 cores on {GPUs} to accelerate solution of linear
  journal =      j-PROC-R-SOC-LOND-SER-A,
  volume =       "476",
  number =       "2243",
  pages =        "20200110:1--20200110:30",
  year =         "2020",
  CODEN =        "PRLAAZ",
  DOI =          "",
  ISSN =         "1364-5021 (print), 1471-2946 (electronic)",
  ISSN-L =       "1364-5021",
  MRclass =      "65F10 (65Y10)",
  MRnumber =     "4187936",
  bibdate =      "Fri Jul 9 15:12:06 2021",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Proceedings of the Royal Society of London. Series A",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Yuechao Lu and Ichitaro Yamazaki and Fumihiko Ino and
                 Yasuyuki Matsushita and Stanimire Tomov and Jack
  title =        "Reducing the amount of out-of-core data access for
                 {GPU}-accelerated randomized {SVD}",
  journal =      j-CCPE,
  volume =       "32",
  number =       "19",
  pages =        "e5754:1--e5754:??",
  day =          "10",
  month =        oct,
  year =         "2020",
  CODEN =        "CCPEBO",
  DOI =          "",
  ISSN =         "1532-0626 (print), 1532-0634 (electronic)",
  ISSN-L =       "1532-0626",
  bibdate =      "Wed Mar 31 07:52:20 MDT 2021",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ajournal =     "Concurr. Comput.",
  fjournal =     "Concurrency and Computation: Practice and Experience",
  journal-URL =  "",
  onlinedate =   "13 April 2020",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Timothy Costa and Jack Dongarra
                 and Mark Gates and Azzam Haidar and Sven Hammarling and
                 Nicholas J. Higham and Jakub Kurzak and Piotr Luszczek
                 and Stanimire Tomov and Mawussi Zounon",
  title =        "A Set of Batched Basic Linear Algebra Subprograms and
                 {LAPACK} Routines",
  journal =      j-TOMS,
  volume =       "47",
  number =       "3",
  pages =        "21:1--21:23",
  month =        jun,
  year =         "2021",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  MRclass =      "65Fxx (65Y15)",
  MRnumber =     "4282536",
  bibdate =      "Sun Jun 27 07:42:02 MDT 2021",
  bibsource =    ";
  URL =          "",
  abstract =     "This article describes a standard API for a set of
                 Batched Basic Linear Algebra Subprograms (Batched BLAS
                 or BBLAS). The focus is on many independent BLAS
                 operations on small matrices that are grouped together
                 and processed by a single routine, called a Batched
                 BLAS routine. The matrices are grouped together in
                 uniformly sized groups, with just one group if all the
                 matrices are of equal size. The aim is to provide more
                 efficient, but portable, implementations of algorithms
                 on high-performance many-core platforms. These include
                 multicore and many-core CPU processors, GPUs and
                 coprocessors, and other hardware accelerators with
                 floating-point compute facility. As well as the
                 standard types of single and double precision, we also
                 include half and quadruple precision in the standard.
                 In particular, half precision is used in many very
                 large scale applications, such as those associated with
                 machine learning.",
  acknowledgement = ack-nhfb,
  articleno =    "21",
  fjournal =     "ACM Transactions on Mathematical Software (TOMS)",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Hartwig Anzt and Erik G. Boman
                 and Erin Carson and Terry Cojean and Jack Dongarra and
                 Alyson Fox and Mark Gates and Nicholas J. Higham and
                 Xiaoye S. Li and Jennifer Loe and Piotr Luszczek and
                 Srikara Pranesh and Siva Rajamanickam and Tobias
                 Ribizel and Barry F. Smith and Kasia Swirydowicz and
                 Stephen Thomas and Stanimire Tomov and Yaohung M. Tsai
                 and Ulrike Meier Yang",
  title =        "A survey of numerical linear algebra methods utilizing
                 mixed-precision arithmetic",
  journal =      j-IJHPCA,
  volume =       "35",
  number =       "4",
  pages =        "344--369",
  day =          "1",
  month =        jul,
  year =         "2021",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Wed Apr 6 08:31:21 MDT 2022",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Mark Gates and Piotr Luszczek and
                 Stanimire Tomov",
  title =        "Translational process: Mathematical software
  journal =      j-J-COMPUT-SCI,
  volume =       "52",
  pages =        "??--??",
  month =        may,
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:55:49 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "101216",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Tzanio Kolev and Paul Fischer and Misun Min and Jack
                 Dongarra and Jed Brown and Veselin Dobrev and Tim
                 Warburton and Stanimire Tomov and Mark S. Shephard and
                 Ahmad Abdelfattah and Valeria Barra and Natalie Beams
                 and Jean-Sylvain Camier and Noel Chalmers and Yohann
                 Dudouit and Ali Karakus and Ian Karlin and Stefan
                 Kerkemeier and Yu-Hsiang Lan and David Medina and Elia
                 Merzari and Aleksandr Obabko and Will Pazner and
                 Thilina Rathnayake and Cameron W. Smith and Lukas Spies
                 and Kasia Swirydowicz and Jeremy Thompson and Ananias
                 Tomboulides and Vladimir Tomov",
  title =        "Efficient exascale discretizations: High-order finite
                 element methods",
  journal =      j-IJHPCA,
  volume =       "35",
  number =       "6",
  pages =        "527--552",
  day =          "1",
  month =        nov,
  year =         "2021",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Wed Apr 6 08:31:22 MDT 2022",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sergey V. Kovalchuk and Valeria V. Krzhizhanovskaya
                 and Maciej Paszy{\'n}ski and G{\'a}bor Z{\'a}vodszky
                 and Michael H. Lees and Jack Dongarra and Peter M. A.
  title =        "20 years of computational science: Selected papers
                 from {2020 International Conference on Computational
  journal =      j-J-COMPUT-SCI,
  volume =       "53",
  pages =        "??--??",
  month =        jul,
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:55:52 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "101395",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sameh Abdulah and Qinglei Cao and Yu Pei and George
                 Bosilca and Jack Dongarra and Marc G. Genton and David
                 E. Keyes and Hatem Ltaief and Ying Sun",
  title =        "Accelerating Geostatistical Modeling and Prediction
                 With Mixed-Precision Computations: a High-Productivity
                 Approach With {PaRSEC}",
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "33",
  number =       "4",
  pages =        "964--976",
  month =        apr,
  year =         "2022",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu Nov 11 08:39:34 2021",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James Demmel and Jack Dongarra and Mark Gates and Greg
                 Henry and Julien Langou and Xiaoye Li and Piotr
                 Luszczek and Weslley Pereira and Jason Riedy and Cindy
  title =        "Proposed Consistent Exception Handling for the {BLAS}
                 and {LAPACK}",
  journal =      "",
  volume =       "??",
  number =       "??",
  pages =        "92",
  day =          "19",
  month =        jul,
  year =         "2022",
  bibdate =      "Mon Sep 11 06:47:01 2023",
  bibsource =    ";
  URL =          "",
  abstract =     "Numerical exceptions, which may be caused by overflow,
                 operations like division by 0 or sqrt(-1), or
                 convergence failures, are unavoidable in many cases, in
                 particular when software is used on unforeseen and
                 difficult inputs. As more aspects of society become
                 automated, e.g., self-driving cars, health monitors,
                 and cyber-physical systems more generally, it is
                 becoming increasingly important to design software that
                 is resilient to exceptions, and that responds to them
                 in a consistent way. Consistency is needed to allow
                 users to build higher-level software that is also
                 resilient and consistent (and so on recursively). In
                 this paper we explore the design space of consistent
                 exception handling for the widely used BLAS and LAPACK
                 linear algebra libraries, pointing out a variety of
                 instances of inconsistent exception handling in the
                 current versions, and propose a new design that
                 balances consistency, complexity, ease of use, and
                 performance. Some compromises are needed, because there
                 are preexisting inconsistencies that are outside our
                 control, including in or between existing vendor BLAS
                 implementations, different programming languages, and
                 even compilers for the same programming language. And
                 user requests from our surveys are quite diverse. We
                 also propose our design as a possible model for other
                 numerical software, and welcome comments on our design
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "James Demmel and Jack Dongarra and Mark Gates and Greg
                 Henry and Julien Langou and Xiaoye Li and Piotr
                 Luszczek and Weslley Pereira and Jason Riedy and Cindy
  editor =       "{IEEE}",
  booktitle =    "{Correctness 2022: Sixth International Workshop on
                 Software Correctness for HPC Applications: Held in
                 conjunction with SC22: The International Conference for
                 High Performance Computing, Networking, Storage and
                 Analysis. Dallas, Texas, USA, November 13-18, 2022}",
  title =        "Proposed Consistent Exception Handling for the {BLAS}
                 and {LAPACK}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "??--??",
  year =         "2022",
  DOI =          "",
  ISBN =         "1-66546-335-X",
  ISBN-13 =      "978-1-66546-335-5",
  LCCN =         "????",
  bibdate =      "Wed Aug 07 14:39:23 2024",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack J. Dongarra",
  title =        "{Turing} lecture: The evolution of mathematical
  journal =      j-CACM,
  volume =       "65",
  number =       "12",
  pages =        "66--72",
  month =        dec,
  year =         "2022",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Thu Dec 8 15:33:46 MST 2022",
  bibsource =    ";
  URL =          "",
  abstract =     "Tracing how software and algorithms follow the
  acknowledgement = ack-nhfb,
  fjournal =     "Communications of the ACM",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sergey V. Kovalchuk and Valeria V. Krzhizhanovskaya
                 and Maciej Paszy{\'n}ski and Dieter Kranzlm{\"u}ller
                 and Jack Dongarra and Peter M. A. Sloot",
  title =        "Computational science for a better future",
  journal =      j-J-COMPUT-SCI,
  volume =       "62",
  pages =        "??--??",
  month =        jul,
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:56:13 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "101745",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Neil Lindquist and Piotr Luszczek and Jack Dongarra",
  title =        "Accelerating Restarted {GMRES} With Mixed Precision
  journal =      j-IEEE-TRANS-PAR-DIST-SYS,
  volume =       "33",
  number =       "4",
  pages =        "1027--1037",
  month =        apr,
  year =         "2022",
  CODEN =        "ITDSEO",
  DOI =          "",
  ISSN =         "1045-9219 (print), 1558-2183 (electronic)",
  ISSN-L =       "1045-9219",
  bibdate =      "Thu Nov 11 08:39:34 2021",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE Transactions on Parallel and Distributed
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Dong Zhong and Qinglei Cao and George Bosilca and Jack
  title =        "Using long vector extensions for {MPI} reductions",
  journal =      j-PARALLEL-COMPUTING,
  volume =       "109",
  number =       "??",
  pages =        "??--??",
  month =        mar,
  year =         "2022",
  CODEN =        "PACOEJ",
  DOI =          "",
  ISSN =         "0167-8191 (print), 1872-7336 (electronic)",
  ISSN-L =       "0167-8191",
  bibdate =      "Fri Feb 18 10:07:18 MST 2022",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  articleno =    "102871",
  fjournal =     "Parallel Computing",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Jack Dongarra and Bernard Tourancheau",
  title =        "Guest editors note: Special issue on clusters, clouds,
                 and data for scientific computing",
  journal =      j-IJHPCA,
  volume =       "37",
  number =       "3-4",
  pages =        "211--212",
  day =          "1",
  month =        jul,
  year =         "2023",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Thu May 30 07:31:48 MDT 2024",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "????",
  fjournal =     "International Journal of High Performance Computing
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Sergey V. Kovalchuk and Cl{\'e}lia de Mulatier and
                 Derek Groen and Maciej Paszy{\'n}ski and Valeria V.
                 Krzhizhanovskaya and Jack Dongarra and Peter M. A.
  title =        "The computational planet",
  journal =      j-J-COMPUT-SCI,
  volume =       "72",
  pages =        "??--??",
  month =        sep,
  year =         "2023",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Tue Sep 19 13:56:54 MDT 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "102102",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Piotr Luszczek and Wissam M. Sid-Lakhdar and Jack
                 Dongarra",
  title =        "Combining multitask and transfer learning with deep
                 {Gaussian} processes for autotuning-based performance
  journal =      j-IJHPCA,
  volume =       "37",
  number =       "3-4",
  pages =        "229--244",
  day =          "1",
  month =        jul,
  year =         "2023",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Thu May 30 07:31:48 MDT 2024",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "????",
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782; Luszczek,

  author =       "Daniel Reed and Dennis Gannon and Jack Dongarra",
  title =        "Contributed Articles: {HPC} Forecast: Cloudy and
  journal =      j-CACM,
  volume =       "66",
  number =       "2",
  pages =        "82--90",
  month =        feb,
  year =         "2023",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Mon Feb 6 12:23:39 MST 2023",
  bibsource =    ";
  URL =          "",
  abstract =     "An examination of how the technology landscape has
                 changed and possible future directions for HPC
                 operations and innovation.",
  acknowledgement = ack-nhfb,
  fjournal =     "Communications of the ACM",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Ahmad Abdelfattah and Natalie Beams and Robert Carson
                 and Pieter Ghysels and Tzanio Kolev and Thomas Stitt
                 and Arturo Vargas and Stanimire Tomov and Jack
                 Dongarra",
  title =        "{MAGMA}: Enabling exascale performance with
                 accelerated {BLAS} and {LAPACK} for diverse {GPU}
  journal =      j-IJHPCA,
  volume =       "38",
  number =       "5",
  pages =        "468--490",
  day =          "1",
  month =        sep,
  year =         "2024",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Feb 7 16:00:18 MST 2025",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "????",
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  ORCID-numbers = "Abdelfattah, Ahmad/0000-0001-5054-4784; Beams,
                 Natalie/0000-0001-6060-4082; Dongarra,

  author =       "Anonymous",
  title =        "Retraction Notice: {Azzam Haidar and Tingxing Dong and
                 Piotr Luszczek and Stanimire Tomov and Jack Dongarra,
                 \booktitle{Batched matrix computations on hardware
                 accelerators based on GPUs}, Int. J. High Perform.
                 Comput. Appl. {\bf 29}(2) 193--208 (2015)}",
  journal =      j-IJHPCA,
  volume =       "38",
  number =       "4",
  pages =        "377",
  day =          "1",
  month =        jul,
  year =         "2024",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Sat Aug 10 06:42:57 MDT 2024",
  bibsource =    ";
  note =         "See \cite{Haidar:2015:BMC}.",
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "Int. J. High Perform. Comput. Appl.",
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Neil Lindquist and Piotr Luszczek and Jack Dongarra",
  title =        "Generalizing Random Butterfly Transforms to Arbitrary
                 Matrix Sizes",
  journal =      j-TOMS,
  volume =       "50",
  number =       "4",
  pages =        "26:1--26:??",
  month =        dec,
  year =         "2024",
  CODEN =        "ACMSCU",
  DOI =          "",
  ISSN =         "0098-3500 (print), 1557-7295 (electronic)",
  ISSN-L =       "0098-3500",
  bibdate =      "Sat Dec 14 17:48:45 MST 2024",
  bibsource =    ";
  URL =          "",
  abstract =     "Parker and L{\^e} introduced random butterfly
                 transforms (RBTs) as a preprocessing technique to
                 replace pivoting in dense LU factorization.
                 Unfortunately, their FFT-like recursive structure
                 restricts the dimensions of the matrix. Furthermore, on
                 multinode systems, efficient management of the
                 communication overheads restricts the matrix's
                 distribution even more. To remove these limitations, we
                 have generalized the RBT to arbitrary matrix sizes by
                 truncating the dimensions of each layer in the
                 transform. We expanded Parker's theoretical analysis to
                 generalized RBT, specifically that in exact arithmetic,
                 Gaussian elimination with no pivoting will succeed with
                 probability 1 after transforming a matrix with
                 full-depth RBTs. Furthermore, we experimentally show
                 that these generalized transforms improve performance
                 over Parker's formulation by up to 62\% while retaining
                 the ability to replace pivoting. This generalized RBT
                 is available in the SLATE numerical software library.",
  acknowledgement = ack-nhfb,
  ajournal =     "ACM Trans. Math. Softw.",
  articleno =    "26",
  fjournal =     "ACM Transactions on Mathematical Software (TOMS)",
  journal-URL =  "",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  author =       "Piotr Luszczek and Anthony Castaldo and Yaohung M.
                 Tsai and Daniel Mishler and Jack Dongarra",
  title =        "Numerical eigen-spectrum slicing, accurate orthogonal
                 eigen-basis, and mixed-precision eigenvalue refinement
                 using {OpenMP} data-dependent tasks and accelerator
  journal =      j-IJHPCA,
  volume =       "38",
  number =       "6",
  pages =        "671--691",
  day =          "1",
  month =        nov,
  year =         "2024",
  CODEN =        "IHPCFL",
  DOI =          "",
  ISSN =         "1094-3420 (print), 1741-2846 (electronic)",
  ISSN-L =       "1094-3420",
  bibdate =      "Fri Feb 7 16:00:18 MST 2025",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "????",
  fjournal =     "International Journal of High Performance Computing
                 Applications",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782; Luszczek,

%%% ====================================================================
%%% Part 2: Publications about Jack J. Dongarra and his works.
  author =       "Garrett Birkhoff",
  title =        "Book Review: {{\booktitle{Computational analysis with
                 the HP 25 pocket calculator}}, by Peter Henrici, John
                 Wiley, New York, 1977, 280 pp.; \booktitle{Compact
                 numerical methods for computers: linear algebra and
                 function minimization}, by J. C. Nash, John Wiley \&
                 Sons, New York, 1979, x + 227 pp.; \booktitle{LINPACK:
                 User's guide}, by J. J. Dongarra, J. R. Bunch, C. B.
                 Moler, and G. W. Stewart, Society for Industrial and
                 Applied Mathematics, Philadelphia, 1979 368 pp.}",
  journal =      j-BULL-AMS,
  volume =       "2",
  number =       "3",
  pages =        "503--505",
  month =        may,
  year =         "1980",
  CODEN =        "BAMOAD",
  DOI =          "",
  ISSN =         "0002-9904 (print), 1936-881X (electronic)",
  ISSN-L =       "0002-9904",
  bibdate =      "Wed Nov 01 08:26:39 2023",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  author-dates = "Garrett Birkhoff (19 January 1911--22 November 1996)",
  fjournal =     "Bulletin of the American Mathematical Society",
  gb-number =    "191b",
  journal-URL =  "",
  subject-dates = "Peter Karl Henrici (13 September 1923--13 March

  author =       "Michael Feldman",
  title =        "Tweaked Math Libraries Exploit {AI} Hardware For
                 Traditional {HPC}",
  howpublished = "Web site.",
  day =          "3",
  month =        dec,
  year =         "2019",
  bibdate =      "Thu Dec 05 10:00:01 2019",
  bibsource =    "",
  note =         "Jack Dongarra describes work to benchmark, and
                 utilize, 16-bit floating-point formats. The new
                 benchmark is called HPL-AI.",
  URL =          ";
  acknowledgement = ack-nhfb,
  remark =       "The article includes a link to a 12m video of an
                 interview with Jack Dongarra.",

  author =       "Sven Hammarling and Nicholas J. Higham",
  title =        "The Influence and Contribution of {Jack Dongarra} to
                 Numerical Linear Algebra",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "24",
  number =       "4",
  pages =        "6--11",
  month =        jul # "\slash " # aug,
  year =         "2022",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Fri Mar 3 06:06:17 2023",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",

  author =       "Torsten Hoefler and Marcin Copik and Pete Beckman and
                 Andrew Jones and Ian Foster and Manish Parashar and
                 Daniel Reed and Matthias Troyer and Thomas Schulthess
                 and Daniel Ernst and Jack Dongarra",
  title =        "{XaaS}: Acceleration as a Service to Enable Productive
                 High-Performance Cloud Computing",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "26",
  number =       "3",
  pages =        "40--51",
  month =        jul # "\slash " # sep,
  year =         "2024",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Wed Dec 4 16:56:42 2024",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",
  keywords =     "Artificial intelligence; Climate change; Cloud
                 computing; Computational modeling; Computer
                 architecture; Containers; Ecosystems; High performance
                 computing; Machine learning; Meteorology; Resource
                 management; Serverless computing; Simulation",

  author =       "Sergey V. Kovalchuk and Cl{\'e}lia de Mulatier and
                 Valeria V. Krzhizhanovskaya and Ji{\v{r}}{\'\i}
                 Miky{\v{s}}ka and Maciej Paszy{\'n}ski and Jack
                 Dongarra and Peter M. A. Sloot",
  title =        "Computation at the Cutting Edge of Science",
  journal =      j-J-COMPUT-SCI,
  volume =       "81",
  number =       "??",
  pages =        "??--??",
  month =        sep,
  year =         "2024",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "1877-7503 (print), 1877-7511 (electronic)",
  ISSN-L =       "1877-7503",
  bibdate =      "Wed Aug 28 10:41:44 MDT 2024",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,
  ajournal =     "J. Comput. Sci.",
  articleno =    "102379",
  fjournal =     "Journal of Computational Science",
  journal-URL =  "",

  author =       "Manish Parashar",
  title =        "{Jack Dongarra}: Catalyzing the Transformation of
                 High-Performance Computing",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "24",
  number =       "4",
  pages =        "4--5",
  month =        jul # "\slash " # aug,
  year =         "2022",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Fri Mar 3 06:06:17 2023",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",

  author =       "Richard W. Vuduc",
  title =        "{Jack}, The Autotuner",
  journal =      j-COMPUT-SCI-ENG,
  volume =       "24",
  number =       "4",
  pages =        "24--27",
  month =        jul # "\slash " # aug,
  year =         "2022",
  CODEN =        "CSENFA",
  DOI =          "",
  ISSN =         "1521-9615 (print), 1558-366X (electronic)",
  ISSN-L =       "1521-9615",
  bibdate =      "Fri Mar 3 06:06:17 2023",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Computing in Science and Engineering",
  journal-URL =  "",

%%% ====================================================================
%%% These entries must occur last because they are cross-referenced by
%%% entries above.
  editor =       "G. Rodrigue",
  title =        "Parallel processing for scientific computing",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "428",
  year =         "1989",
  ISBN =         "0-89871-228-9",
  ISBN-13 =      "978-0-89871-228-5",
  LCCN =         "QA76.5 .S515 1987",
  bibdate =      "Mon Jan 2 13:12:21 MST 2006",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  meetingname =  "SIAM Conference on Parallel Processing for Scientific
                 Computing (3rd: 1987: Los Angeles, Calif.)",
  remark =       "Proceedings of the Third SIAM Conference on Parallel
                 Processing for Scientific Computing, Los Angeles,
                 California, December 1--4, 1987. This conference was
                 sponsored by the SIAM Activity Group on
  subject =      "Parallel processing (Electronic computers);

  author =       "Jason Sanders and Edward Kandrot",
  title =        "{CUDA} by Example: an Introduction to General-purpose
                 {GPU} Programming",
  publisher =    pub-AW,
  address =      pub-AW:adr,
  pages =        "xix + 290",
  year =         "2010",
  ISBN =         "0-13-138768-5",
  ISBN-13 =      "978-0-13-138768-3",
  LCCN =         "QA76.76.A65",
  bibdate =      "Wed Jul 28 23:24:12 MDT 2010",
  bibsource =    ";
  abstract =     "CUDA is a computing architecture designed to
                 facilitate the development of parallel programs. This
                 book shows programmers how to employ this new
                 technology. Each area of CUDA development is introduced
                 through working examples. After a concise introduction
                 to the CUDA platform and architecture, as well as a
                 quick-start guide to CUDA C, the book details the
                 techniques and trade-offs associated with each key CUDA
  acknowledgement = ack-nhfb,
  keywords =     "CUDA; GPU",
  subject =      "application software; development; computer
                 architecture; parallel programming (computer science)",
  tableofcontents = "Why CUDA? why now? \\
                 Getting started \\
                 Introduction to CUDA C \\
                 Parallel programming in CUDA C \\
                 Thread cooperation \\
                 Constant memory and events \\
                 Texture memory \\
                 Graphics interoperability \\
                 Atomics \\
                 Streams \\
                 CUDA C on multiple GPUs \\
                 The final countdown \\
                 Appendix A: Advanced atomics",

  author =       "Georg Hager and Gerhard Wellein",
  title =        "Introduction to high performance computing for
                 scientists and engineers",
  volume =       "7",
  publisher =    pub-CRC,
  address =      pub-CRC:adr,
  pages =        "xxv + 330 + 4",
  year =         "2011",
  ISBN =         "1-4398-1192-X",
  ISBN-13 =      "978-1-4398-1192-4",
  LCCN =         "QA76.88 .H34 2011",
  bibdate =      "Wed Sep 15 13:26:35 MDT 2010",
  bibsource =    ";
  series =       "Chapman and Hall/CRC computational science series",
  acknowledgement = ack-nhfb,
  subject =      "high performance computing",
  tableofcontents = "Modern Processors \\
                 Stored-program computer architecture \\
                 General-purpose cache-based microprocessor architecture
                 \\
                 Memory hierarchies \\
                 Multicore processors \\
                 Multithreaded processors \\
                 Vector processors \\
                 Basic Optimization Techniques for Serial Code \\
                 Scalar profiling \\
                 Common sense optimizations \\
                 Simple measures, large impact \\
                 The role of compilers \\
                 C++ optimizations \\
                 Data Access Optimization \\
                 Balance analysis and lightspeed estimates \\
                 Storage order \\
                 Case study: The Jacobi algorithm \\
                 Case study: Dense matrix transpose \\
                 Algorithm classification and access optimizations \\
                 Case study: Sparse matrix-vector multiply \\
                 Parallel Computers \\
                 Taxonomy of parallel computing paradigms \\
                 Shared-memory computers \\
                 Distributed-memory computers \\
                 Hierarchical (hybrid) systems \\
                 Networks \\
                 Basics of Parallelization \\
                 Why parallelize? \\
                 Parallelism \\
                 Parallel scalability \\
                 Shared-Memory Parallel Programming with OpenMP \\
                 Short introduction to OpenMP \\
                 Case study: OpenMP-parallel Jacobi algorithm \\
                 Advanced OpenMP: Wavefront parallelization \\
                 Efficient OpenMP Programming \\
                 Profiling OpenMP programs \\
                 Performance pitfalls \\
                 Case study: Parallel sparse matrix-vector multiply \\
                 Locality Optimizations on ccNUMA Architectures \\
                 Locality of access on ccNUMA \\
                 Case study: ccNUMA optimization of sparse MVM \\
                 Placement pitfalls \\
                 ccNUMA issues with C++ \\
                 Distributed-Memory Parallel Programming with MPI \\
                 Message passing \\
                 A short introduction to MPI \\
                 Example: MPI parallelization of a Jacobi solver \\
                 Efficient MPI Programming \\
                 MPI performance tools \\
                 Communication parameters \\
                 Synchronization, serialization, contention \\
                 Reducing communication overhead \\
                 Understanding intranode point-to-point communication
                 \\
                 Hybrid Parallelization with MPI and OpenMP \\
                 Basic MPI/OpenMP programming models \\
                 MPI taxonomy of thread interoperability \\
                 Hybrid decomposition and mapping \\
                 Potential benefits and drawbacks of hybrid programming
                 \\
                 Appendix A: Topology and Affinity in Multicore
                 Environments \\
                 Appendix B: Solutions to the Problems \\
                 Bibliography \\

  editor =       "B. L. Buzbee and J. F. Morrison",
  booktitle =    "Proceedings of the 1978 {LASL} Workshop on Vector and
                 Parallel Processors held at Los Alamos Scientific
                 Laboratory, Los Alamos, New Mexico, September 20--22,
                 1978",
  title =        "Proceedings of the 1978 {LASL} Workshop on Vector and
                 Parallel Processors held at Los Alamos Scientific
                 Laboratory, Los Alamos, New Mexico, September 20--22,
                 1978",
  publisher =    "Los Alamos Scientific Laboratory",
  address =      "Los Alamos, NM, USA",
  pages =        "x + 251",
  year =         "1978",
  bibdate =      "Mon Jan 15 11:05:11 1996",
  bibsource =    "",
  note =         "U.S. Scientific Laboratory, Los Alamos, NM Conference
                 proceedings LA-7491-C.",
  acknowledgement = ack-nhfb,

  editor =       "Wayne R. Cowell",
  booktitle =    "Sources and Development of Mathematical Software",
  title =        "Sources and Development of Mathematical Software",
  publisher =    pub-PH,
  address =      pub-PH:adr,
  pages =        "xii + 404",
  year =         "1984",
  ISBN =         "0-13-823501-5",
  ISBN-13 =      "978-0-13-823501-7",
  LCCN =         "QA76.95 .S68 1984",
  bibdate =      "Tue Dec 14 22:44:45 1993",
  bibsource =    ";
  series =       "Prentice-Hall Series in Computational Mathematics,
                 Cleve Moler, Advisor",
  acknowledgement = ack-nhfb,
  tableofcontents = "Observations on the mathematical software effort /
                 W. J. Cody \\
                 LINPACK: A package for solving linear systems / J. J.
                 Dongarra and G. W. Stewart \\
                 FUNPACK: A package of special function routines / W. J.
                 Cody \\
                 EISPACK: A package for solving matrix eigenvalue
                 problems / J. J. Dongarra and C. B. Moler \\
                 The MINPACK project / J. Mor{\'e}, D. Sorensen, B. Garbow,
                 and K. Hillstrom \\
                 Software for ordinary differential equations / L. F.
                 Shampine and H. A. Watts \\
                 Sources of information on quadrature software / D.
                 Kahaner \\
                 A survey of sparse matrix software / Iain S. Duff \\
                 Mathematical software for elliptic boundary value
                 problems / Ronald F. Boisvert and Roland A. Sweet \\
                 The IMSL Library / Thomas J. Aird \\
                 The SLATEC common mathematical library / Bill L. Buzbee
                 \\
                 The Boeing mathematical software library / A. H.
                 Erisman, K. W. Neves, and I. R. Philips \\
                 The PORT mathematical subroutine Library / Phyllis Fox
                 \\
                 The evolving NAG library service / Brian Ford and James
                 C. T. Pool",

  editor =       "Jack Dongarra and Gene Golub and Jorge Mor{\'e} and
                 Danny Sorensen",
  booktitle =    "{Informal proceedings of the Symposium on
                 Computational Mathematics --- State of the Art: held at
                 Argonne National Laboratory, September 20--21, 1984, in
                 honor of James H. Wilkinson}",
  title =        "{Informal proceedings of the Symposium on
                 Computational Mathematics --- State of the Art: held at
                 Argonne National Laboratory, September 20--21, 1984, in
                 honor of James H. Wilkinson}",
  publisher =    inst-ANL,
  address =      inst-ANL:adr,
  pages =        "v + 264",
  month =        dec,
  year =         "1984",
  LCCN =         "QA297.S879 1984",
  bibdate =      "Sat Sep 24 01:25:08 1994",
  bibsource =    ";
  note =         "Technical Report MCS-TM-42. It consists of copies of
                 lecture slides from the ten symposium talks.",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxISBN =       "none",

  editor =       "R. Glowinski and J.-L. Lions",
  booktitle =    "Computing Methods in Applied Sciences and Engineering,
                 {VI}: Proceedings of the Sixth International Symposium
                 on Computing Methods in Applied Sciences and
                 Engineering, Versailles, France, December 12--16,
                 1983",
  title =        "Computing Methods in Applied Sciences and Engineering,
                 {VI}: Proceedings of the Sixth International Symposium
                 on Computing Methods in Applied Sciences and
                 Engineering, Versailles, France, December 12--16,
                 1983",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xiii + 728",
  year =         "1984",
  ISBN =         "0-444-87597-2",
  ISBN-13 =      "978-0-444-87597-6",
  LCCN =         "QA297 .I57 1983",
  bibdate =      "Mon Jan 15 11:05:19 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Kai Hwang",
  booktitle =    "Proceedings: 7th Symposium on Computer Arithmetic,
                 June 4--6, 1985, University of Illinois, Urbana,
  title =        "Proceedings: 7th Symposium on Computer Arithmetic,
                 June 4--6, 1985, University of Illinois, Urbana,
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xi + 343",
  year =         "1985",
  ISBN =         "0-8186-0632-0 (paperback), 0-8186-8632-4 (hard),
                 0-8186-4632-2 (microfiche)",
  ISBN-13 =      "978-0-8186-0632-8 (paperback), 978-0-8186-8632-0
                 (hard), 978-0-8186-4632-4 (microfiche)",
  LCCN =         "QA76.9.C62 S95 1985",
  bibdate =      "Thu Sep 08 00:11:41 1994",
  bibsource =    "",
  acknowledgement = ack-nj,

  editor =       "Alan G. Bell",
  booktitle =    "Digest of papers / Compcon 86, March 3--6, Spring;
                 Thirty-first {IEEE} Computer Society International
                 Conference, Cathedral Hill Hotel, San Francisco,
  title =        "Digest of papers / Compcon 86, March 3--6, Spring;
                 Thirty-first {IEEE} Computer Society International
                 Conference, Cathedral Hill Hotel, San Francisco,
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xv + 518",
  year =         "1986",
  CODEN =        "PCICDQ",
  ISBN =         "0-8186-0692-4 (paperback), 0-8186-4692-6
  ISBN-13 =      "978-0-8186-0692-2 (paperback), 978-0-8186-4692-8
  LCCN =         "QA75.5.C58 1986",
  bibdate =      "Fri Aug 23 13:30:42 1996",
  bibsource =    "",
  note =         "IEEE Computer Society order number 692; IEEE catalog
                 number 86CH2285-5",
  acknowledgement = ack-nhfb,

  editor =       "Jane Cullum and Ralph A. Willoughby",
  booktitle =    "Large scale eigenvalue problems: proceedings of the
                 {IBM} Europe Institute Workshop on Large Scale
                 Eigenvalue Problems held in Oberlech, Austria, July
                 8--12, 1985",
  title =        "Large Scale Eigenvalue Problems. Proceedings of the
                 {IBM} European Institute Workshop",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "viii + 330",
  year =         "1986",
  ISBN =         "0-444-70074-9",
  ISBN-13 =      "978-0-444-70074-2",
  LCCN =         "QA193 .I261 1985",
  bibdate =      "Sat Mar 22 18:32:44 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "M. Feilmeier and G. Joubert and U. Schendel",
  booktitle =    "Parallel Computing 85: Proceedings of the Second
                 International Conference on Parallel Computing, held at
                 the Freie Universit{\"a}t Berlin, 23--25, September
                 1985",
  title =        "Parallel Computing 85: Proceedings of the Second
                 International Conference on Parallel Computing, held at
                 the Freie Universit{\"a}t Berlin, 23--25, September
                 1985",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xiv + 534",
  year =         "1986",
  ISBN =         "0-444-70009-9",
  ISBN-13 =      "978-0-444-70009-4",
  LCCN =         "QA76.6 .I5471 1985",
  bibdate =      "Mon Jan 15 11:05:23 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Arthur Wouk",
  booktitle =    "New computing environments: parallel, vector and
                 systolic (Stanford University, Stanford, {CA}, November
                 7--9, 1984)",
  title =        "New computing environments: parallel, vector and
                 systolic (Stanford University, Stanford, {CA}, November
                 7--9, 1984)",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "270",
  year =         "1986",
  ISBN =         "0-89871-201-7",
  ISBN-13 =      "978-0-89871-201-8",
  LCCN =         "QA76.9.A73 N49 1986",
  bibdate =      "Mon Jan 15 11:06:47 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Anonymous",
  booktitle =    "International Seminar on Scientific Supercomputers",
  title =        "International Seminar on Scientific Supercomputers",
  publisher =    "Inst. Nat. Rech. and Inf. Autom",
  address =      "Le Chesnay, France",
  pages =        "504",
  year =         "1987",
  bibdate =      "Mon Sep 9 14:56:14 MDT 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  confdate =     "2--6 Feb. 1987",
  conflocation = "Paris, France",
  pubcountry =   "France",

  editor =       "Leah H. Jamieson and Dennis B. Gannon and Robert J.
  booktitle =    "The Characteristics of Parallel Algorithms",
  title =        "The Characteristics of Parallel Algorithms",
  volume =       "30",
  publisher =    pub-MIT,
  address =      pub-MIT:adr,
  pages =        "440",
  year =         "1987",
  ISBN =         "0-262-10036-3",
  ISBN-13 =      "978-0-262-10036-6",
  LCCN =         "QA76.6 .C42981 1987",
  bibdate =      "Mon Jan 15 11:05:44 1996",
  bibsource =    "",
  series =       "MIT Press series in scientific computation",
  acknowledgement = ack-nhfb,

  editor =       "E. N. Houstis and T. S. Papatheodorou and C. D.
  booktitle =    "{Supercomputing: 1st International Conference, Athens,
                 Greece, June 8--12, 1987: proceedings}",
  title =        "{Supercomputing: 1st International Conference, Athens,
                 Greece, June 8--12, 1987: proceedings}",
  volume =       "297",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "x + 1093",
  year =         "1988",
  CODEN =        "LNCSD9",
  ISBN =         "0-387-18991-2, 3-540-18991-2",
  ISBN-13 =      "978-0-387-18991-8, 978-3-540-18991-6",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA267.A1 L43 no.297",
  bibdate =      "Mon Sep 9 14:56:14 MDT 1996",
  bibsource =    ";
                 University of California MELVYL catalog.",
  note =         "The conference was organized and sponsored by the
                 Computer Technology Institute (C.T.I.) of Greece.",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  confdate =     "8--12 June 1987",
  conflocation = "Athens, Greece",
  confsponsor =  "Comput. Technol. Inst. Greece",
  keywords =     "supercomputers --- congresses",
  pubcountry =   "West Germany",

  editor =       "{IEEE}",
  booktitle =    "Proceedings, Supercomputing '88: November 14--18,
                 1988, Orlando, Florida",
  title =        "Proceedings, Supercomputing '88: November 14--18,
                 1988, Orlando, Florida",
  volume =       "1",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xii + 458",
  year =         "1988",
  ISBN =         "0-8186-0882-X (v. 1; paper), 0-8186-8882-3 (v. 1;
                 case), 0-8186-4882-1 (v. 1: microfiche), 0-8186-8923-4
                 (v. 2), 0-8186-5923-X (v. 2: microfiche), 0-8186-8923-4
                 (v. 2: case)",
  ISBN-13 =      "978-0-8186-0882-7 (v. 1; paper), 978-0-8186-8882-9 (v.
                 1; case), 978-0-8186-4882-3 (v. 1: microfiche),
                 978-0-8186-8923-9 (v. 2), 978-0-8186-5923-2 (v. 2:
                 microfiche), 978-0-8186-8923-9 (v. 2: case)",
  LCCN =         "QA76.5 .S894 1988",
  bibdate =      "Fri Aug 23 13:34:23 1996",
  bibsource =    "",
  note =         "Two volumes. Available from IEEE Service Center
                 (Catalog number 88CH2617-9), Piscataway, NJ, USA.",
  acknowledgement = ack-nhfb,
  classification = "C5220 (Computer architecture); C5440 (Multiprocessor
                 systems and techniques); C5470 (Performance evaluation
                 and testing); C5540 (Terminals and graphic displays);
                 C6150C (Compilers, interpreters and other processors);
                 C6150J (Operating systems)",
  keywords =     "algorithms; architecture; benchmarking; compiler
                 evaluation; compiler technology; computer graphic
                 equipment; data-flow systems; Horizon superconducting
                 system; mass storage systems; operating systems;
                 operating systems (computers); parallel algorithms;
                 parallel architectures; parallel machines; performance
                 evaluation; program compilers; program development;
                 supercomputer performance; supercomputing center
                 management; visualization",

  editor =       "George Paul and George S. Almasi",
  booktitle =    "{Parallel systems and computation: proceedings of the
                 1986 IBM Europe Institute---Seminar on Parallel
                 Computing, Oberlech, Austria, August 11--15, 1986}",
  title =        "{Parallel systems and computation: proceedings of the
                 1986 IBM Europe Institute---Seminar on Parallel
                 Computing, Oberlech, Austria, August 11--15, 1986}",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "x + 294",
  year =         "1988",
  ISBN =         "0-444-70371-3",
  ISBN-13 =      "978-0-444-70371-2",
  LCCN =         "QA76.5 .I147 1986",
  bibdate =      "Mon Jan 2 15:34:19 MST 2006",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  meetingname =  "IBM Europe Institute--Seminar on Parallel Computing
                 (1986: Oberlech, Austria)",
  subject =      "Parallel processing (Electronic computers);

  editor =       "Martin Schultz",
  booktitle =    "Numerical algorithms for modern parallel computer
                 architectures (Minneapolis, {MN}, 1986--87)",
  title =        "Numerical algorithms for modern parallel computer
                 architectures (Minneapolis, {MN}, 1986--87)",
  volume =       "13",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "vi + 232",
  year =         "1988",
  ISBN =         "0-387-96733-8",
  ISBN-13 =      "978-0-387-96733-2",
  LCCN =         "QA76.5.N79 1988",
  bibdate =      "Mon Jan 15 11:22:00 1996",
  bibsource =    "",
  series =       "The IMA volumes in mathematics and its applications",
  acknowledgement = ack-nhfb,

  editor =       "Graham F. Carey",
  booktitle =    "Parallel supercomputing: methods, algorithms and
  title =        "Parallel supercomputing: methods, algorithms and
  publisher =    pub-WILEY,
  address =      pub-WILEY:adr,
  pages =        "x + 287",
  year =         "1989",
  ISBN =         "0-471-92436-9",
  ISBN-13 =      "978-0-471-92436-4",
  LCCN =         "M89.E02452; QA76.6",
  bibdate =      "Mon Jan 2 15:42:42 MST 2006",
  bibsource =    ";
  series =       "Wiley series in parallel computing",
  acknowledgement = ack-nhfb,
  subject =      "Parallel programming (Computer science)",

  editor =       "Michel Cosnard and Y. Robert and P. Quinton and M.
  booktitle =    "Parallel \& distributed algorithms: proceedings of the
                 International Workshop on Parallel \& Distributed
                 Algorithms, Chateau de Bonas, Gers, France, 3--6
                 October, 1988",
  title =        "Parallel \& distributed algorithms: proceedings of the
                 International Workshop on Parallel \& Distributed
                 Algorithms, Chateau de Bonas, Gers, France, 3--6
                 October, 1988",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xiv + 343",
  year =         "1989",
  ISBN =         "0-444-87367-8",
  ISBN-13 =      "978-0-444-87367-5",
  LCCN =         "QA76.5 .I6191 1988",
  bibdate =      "Sat Mar 22 18:36:25 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Jack Dongarra and Iain S. Duff and Patrick W. Gaffney
                 and Sean {StJ}. McKee",
  booktitle =    "Vector and Parallel Computing: Issues in Applied
                 Research and Development (Papers from {LOEN II}, a
                 conference held June 6--10, 1988, in Troms{\o},
  title =        "Vector and Parallel Computing: Issues in Applied
                 Research and Development (Papers from {LOEN II}, a
                 conference held June 6--10, 1988, in Troms{\o},
  publisher =    pub-EH,
  address =      pub-EH:adr,
  pages =        "viii + 410",
  year =         "1989",
  ISBN =         "0-7458-0756-9 (Ellis Horwood), 0-470-21571-2 (Halsted
  ISBN-13 =      "978-0-7458-0756-0 (Ellis Horwood), 978-0-470-21571-5
                 (Halsted Press)",
  LCCN =         "QA76.5 .V398 1989",
  MRclass =      "65-06 (00B25)",
  MRnumber =     "91k:65014",
  bibdate =      "Thu Dec 19 14:23:48 1996",
  bibsource =    ";
  price =        "UK\pounds 29.95",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "D. J. Evans and C. Sutti",
  booktitle =    "Parallel Computing. Methods, Algorithms and
                 Applications Proceedings of the International Meeting
                 on Parallel Computing",
  title =        "Parallel Computing. Methods, Algorithms and
                 Applications Proceedings of the International Meeting
                 on Parallel Computing",
  publisher =    "Adam Hilger",
  address =      "Bristol, UK",
  pages =        "x + 287",
  year =         "1989",
  ISBN =         "0-85274-224-x",
  ISBN-13 =      "978-0-85274-224-2",
  LCCN =         "QA76.5.I5775 1988",
  bibdate =      "Mon Sep 9 14:56:14 MDT 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  confdate =     "28--30 Sept. 1988",
  conflocation = "Verona, Italy",
  confsponsor =  "Univ. Verona; Univ. Calabria; et al",
  pubcountry =   "UK",

  editor =       "M. Wright",
  booktitle =    "Aspects of Computation on Asynchronous Parallel
                 Processors. {Proceedings of the IFIP WG 2.5 Working
                 Conference, Stanford, CA, USA, 22--26 August, 1988}",
  title =        "Aspects of Computation on Asynchronous Parallel
                 Processors. {Proceedings of the IFIP WG 2.5 Working
                 Conference, Stanford, CA, USA, 22--26 August, 1988}",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xi + 271",
  year =         "1989",
  ISBN =         "0-444-87310-4",
  ISBN-13 =      "978-0-444-87310-1",
  LCCN =         "QA76.5 .I2775 1988",
  bibdate =      "Sat Mar 22 17:55:21 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "M. G. Cox and S. Hammarling",
  booktitle =    "Reliable numerical computation",
  title =        "Reliable numerical computation",
  publisher =    pub-OXFORD,
  address =      pub-OXFORD:adr,
  pages =        "xvi + 339",
  year =         "1990",
  ISBN =         "0-19-853564-3",
  ISBN-13 =      "978-0-19-853564-5",
  LCCN =         "QA297 .R435 1990",
  MRclass =      "65-06",
  MRnumber =     "91k:65011",
  bibdate =      "Fri Dec 20 18:34:52 1996",
  bibsource =    ";
  note =         "Based on papers from a conference in honour of the
                 late James Hardy Wilkinson (died Sunday 5th October
                 1986) held at National Physical Laboratory, Teddington,
                 Middlesex, UK, 8th--10th July 1987.",
  price =        "US\$75.00",
  abstract =     "Published to honor the late Jim Wilkinson, the
                 respected pioneer in numerical analysis, this book
                 includes contributions from his colleagues and
                 collaborators, leading experts in their own right. The
                 breadth of Wilkinson's research is reflected in the
                 topics covered, which include linear algebra, error
                 analysis and computer arithmetic algorithms, and
                 mathematical software. An invaluable reference, the
                 book is completely up-to-date with the latest
                 developments on the Lanczos algorithm,
                 QR-factorizations, error propagation models, parameter
                 estimation problems, sparse systems, and
                 shape-preserving splines. Reflecting the current growth
                 and vitality of this field, the volume is an essential
                 reference for all numerical analysts.",
  acknowledgement = ack-nhfb,
  tableofcontents = "List of contributors / / xv \\
                 Prologue. Reflections on Jim Wilkinson / Gene Golub / 1 \\
                 1. Misconvergence in the Lanczos algorithm / Beresford
                 Parlett / 7 \\
                 2. The Lanczos algorithm for a pure imaginary Hermitian
                 matrix / Charles L. Lawson and Kajal K. Gupta / 25 \\
                 3. Nearest defective matrices and the geometry of
                 ill-conditioning / James Demmel / 35 \\
                 4. Computational aspects of the Jordan canonical form /
                 Theo Beelen and Paul Van Dooren / 57 \\
                 5. Some aspects of generalized QR factorizations / C.
                 C. Paige / 73 \\
                 6. The multifrontal method in a parallel environment /
                 I. S. Duff, N. I. M. Gould, M. Lescrenier, and J. K.
                 Reid / 93 \\
                 7. A Schur-complement method for sparse quadratic
                 programming / Philip E. Gill, Walter Murray, Michael A.
                 Saunders, and Margaret H. Wright / 113 \\
                 8. A probabilistic round-off error propagation model.
                 Application to the eigenvalue problem / Fran{\c{c}}oise
                 Chatelin and Marie Christine Brunet / 139 \\
                 9. Analysis of the Cholesky decomposition of a
                 semi-definite matrix / Nicholas J. Higham / 161 \\
                 10. On the conditioning of parameter estimation
                 problems / James M. Varah / 187 \\
                 11. Rounding errors in algebraic processes --- in
                 level-index arithmetic / F. W. J. Olver / 197 \\
                 12. Experiments in tearing large sparse systems / Mario
                 Arioli and Iain S. Duff / 207 \\
                 13. The least-squares solution of linear equations with
                 block-angular observation matrix / M. G. Cox / 227 \\
                 14. An iterative method for solving linear inequalities
                 / G. W. Stewart / 241 \\
                 15. Iterative refinement and reliable computing /
                 {\AA}ke Bj{\"o}rck / 249 \\
                 16. Software for shape-preserving spline interpolation
                 / Christian H. Reinsch / 267 \\
                 17. Experiences with some software engineering
                 practices in numerical software / D. A. H. Jacobs and
                 G. Markham / 277 \\
                 18. Evolution of numerical software for dense linear
                 algebra / Jack Dongarra and Sven Hammarling / 297 \\
                 Epilogue. Jim Wilkinson: some after-dinner sentiments /
                 L. Fox / 329",

  editor =       "Jack Dongarra and Paul Messina and Danny C. Sorensen
                 and Robert G. Voigt",
  key =          "DongarraMessinaSorensenVoigt90",
  booktitle =    "{Parallel Processing for Scientific Computing:
                 Proceedings of the Fourth SIAM Conference on Parallel
                 Processing for Scientific Computing, Chicago, Illinois,
                 December 11--13, 1989}",
  title =        "{Parallel Processing for Scientific Computing:
                 Proceedings of the Fourth SIAM Conference on Parallel
                 Processing for Scientific Computing, Chicago, Illinois,
                 December 11--13, 1989}",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "454",
  year =         "1990",
  ISBN =         "0-89871-262-9",
  ISBN-13 =      "978-0-89871-262-9",
  LCCN =         "QA76.58.S55 1989",
  MRclass =      "00B25 (65-06 68-06 68Q10)",
  MRnumber =     "91k:00041",
  bibdate =      "Thu Dec 19 14:26:07 1996",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "{IEEE}",
  booktitle =    "Proceedings, Supercomputing '90: November 12--16,
                 1990, New York Hilton at Rockefeller Center, New York,
                 New York",
  title =        "Proceedings, Supercomputing '90: November 12--16,
                 1990, New York Hilton at Rockefeller Center, New York,
                 New York",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxv + 982",
  year =         "1990",
  ISBN =         "0-8186-2056-0 (paperback) (IEEE Computer Society),
                 0-89791-412-0 (paperback) (ACM)",
  ISBN-13 =      "978-0-8186-2056-0 (paperback) (IEEE Computer Society),
                 978-0-89791-412-3 (paperback) (ACM)",
  LCCN =         "QA 76.88 S87 1990",
  bibdate =      "Wed Aug 28 06:48:31 MDT 1996",
  bibsource =    ";
                 University of California MELVYL catalog",
  note =         "ACM order number 415903. IEEE Computer Society Press
                 order number 2056. IEEE catalog number 90CH2916-5.",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques); C5470
                 (Performance evaluation and testing); C6110 (Systems
                 analysis and programming); C7000 (Computer
  keywords =     "biological applications; computer applications;
                 computer chess; innovative architectures; linear
                 algebra algorithms; memory; networking computing;
                 parallel languages; parallel processing; particle
                 transport; partitioning; performance evaluation;
                 performance visualizations; pipeline processing;
                 program analysis; program restructuring; scheduling;
                 supercomputers --- congresses; vector algorithms",

  editor =       "Aad J. {Van der Steen}",
  booktitle =    "Evaluating supercomputers. Strategies for exploiting,
                 evaluating and benchmarking computers with advanced
  title =        "Evaluating supercomputers. Strategies for exploiting,
                 evaluating and benchmarking computers with advanced
  volume =       "8",
  publisher =    pub-CHAPMAN-HALL,
  address =      pub-CHAPMAN-HALL:adr,
  pages =        "289",
  year =         "1990",
  ISBN =         "0-412-37860-4, 0-442-31198-2 (U.S.)",
  ISBN-13 =      "978-0-412-37860-7, 978-0-442-31198-8 (U.S.)",
  LCCN =         "QA76.9.E94 E93 1990; QA76.88.E93 1990",
  bibdate =      "Mon Sep 09 14:49:03 1996",
  bibsource =    "",
  series =       "Unicom applied information technology reports",
  acknowledgement = ack-nhfb,

  editor =       "Henk A. van der Vorst and Paul {Van Dooren}",
  booktitle =    "Parallel algorithms for numerical linear algebra",
  title =        "Parallel algorithms for numerical linear algebra",
  volume =       "1",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "x + 330",
  year =         "1990",
  ISBN =         "0-444-88621-4",
  ISBN-13 =      "978-0-444-88621-7",
  LCCN =         "QA76.5 .P31458 1990",
  MRclass =      "65-06 (65Fxx 65Y05)",
  MRnumber =     "MR1068142 (91f:65005)",
  bibdate =      "Sat Dec 31 06:28:14 2005",
  bibsource =    ";
                 MathSciNet database;",
  series =       "Advances in Parallel Computing",
  acknowledgement = ack-nhfb,
  remark =       "Reprinted from the Journal of computational and
                 applied mathematics, vol. 27, numbers 1 and 2
                 (September 1989).",
  subject =      "Parallel algorithms; Parallel processing (Electronic
                 computers); Algebras, Linear; Numerical calculations",
  tableofcontents = "Preface / H. van der Vorst and P. van Dooren\par

                 A quadratically convergent parallel Jacobi process for
                 diagonally dominant matrices with distinct eigenvalues
                 / M. H. C. Paardekooper\par

                 A Jacobi-like algorithm for computing the generalized
                 Schur form of a regular pencil / J.-P. Charlier and P.
                 van Dooren\par

                 Canonical correlations and generalized SVD :
                 applications and new algorithms / L. M. Ewerbring and
                 F. T. Luk\par

                 From Bareiss' algorithm to the stable computation of
                 partial correlations / J.-M. Delosme and I. C. F.

                 A recursive doubling algorithm for solution of
                 tridiagonal systems on hypercube multiprocessors / {\"O}.
                 E{\u{g}}ecio{\u{g}}lu, {\c{C}}. K. Ko{\c{c}} and A. J. Laub - Least squares
                 modifications with inverse factorizations : parallel
                 implications / C.-T. Pan and R. J. Plemmons. Solution
                 of sparse positive definite systems on a hypercube / A.
                 George ... [et al.]\par

                 Some aspects of parallel implementation of the
                 finite-element method on message passing architectures
                 / I. Babuska and H. C. Elman\par

                 An overview of parallel algorithms for the singular
                 value and symmetric eigenvalue problems / M. Berry and
                 A. Sameh\par

                 Block reduction of matrices to condensed forms for
                 eigenvalue computations / J. J. Dongarra, S. J.
                 Hammarling and D. C. Sorensen\par

                 Multiprocessing a sparse matrix code on the Alliant
                 FX-8 / I. S. Duff\par

                 Vector and parallel methods for the direct solution of
                 Poisson's equation / P. N. Swarztrauber and R. A.

                 Factoring with the quadratic sieve on large vector
                 computers / H. te Riele, W. Lioen and D. Winter.
                 Efficient vectorizable PDE solvers / W. Sch{\"o}nauer and
                 R. Weiss\par

                 Vectorizable preconditioners for elliptic difference
                 equations in three space dimensions / O. Axelsson and
                 V. Eijkhout\par

                 Solving 3D block bidiagonal linear systems on vector
                 computers / J. J. F. M. Schlichting and H. A. van der

  editor =       "Anonymous",
  booktitle =    "International Symposium on Supercomputing '91",
  title =        "International Symposium on Supercomputing '91",
  publisher =    "Amsterdam Universities Computing Centre (SARA)",
  address =      "Amsterdam, The Netherlands",
  pages =        "33--38",
  month =        nov,
  year =         "1991",
  CODEN =        "SPCOEL",
  ISSN =         "0168-7875",
  bibdate =      "Mon Sep 9 07:55:25 MDT 1996",
  bibsource =    "",
  note =         "Supercomputer, vol. 8, no. 6, Nov. (1991).",
  acknowledgement = ack-nhfb,
  confdate =     "6--8 Nov. 1991",
  conflocation = "Fukuoka, Japan",
  pubcountry =   "Netherlands",

  editor =       "Anonymous",
  booktitle =    "Proceedings of the International Symposium on
                 Supercomputing: Fukuoka, Japan, November 6--8, 1991",
  title =        "Proceedings of the International Symposium on
                 Supercomputing: Fukuoka, Japan, November 6--8, 1991",
  publisher =    "Kyushu University Press",
  address =      "Fukuoka, Japan",
  pages =        "iv + 261",
  year =         "1991",
  ISBN =         "4-87378-284-8",
  ISBN-13 =      "978-4-87378-284-3",
  LCCN =         "QA76.88 .I587 1991",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "D. F. Griffiths and G. A. Watson",
  booktitle =    "Numerical analysis, 1991: proceedings of the 14th
                 Dundee Conference, June 1991",
  title =        "Numerical analysis, 1991: proceedings of the 14th
                 Dundee Conference, June 1991",
  volume =       "260",
  publisher =    pub-LONGMAN,
  address =      pub-LONGMAN:adr,
  pages =        "292",
  year =         "1991",
  ISBN =         "0-582-08908-5",
  ISBN-13 =      "978-0-582-08908-2",
  LCCN =         "QA297 .D85 1991",
  bibdate =      "Mon Jan 15 11:05:56 1996",
  bibsource =    "",
  series =       "Pitman Res. Notes Math. Ser.",
  acknowledgement = ack-nhfb,

  editor =       "IEE",
  booktitle =    "Second International Specialist Seminar on the Design
                 and Application of Parallel Digital Processors (Conf.
                 Publ. No. 334)",
  title =        "Second International Specialist Seminar on the Design
                 and Application of Parallel Digital Processors (Conf.
                 Publ. No. 334)",
  publisher =    pub-IEE,
  address =      pub-IEE:adr,
  pages =        "vii + 152",
  year =         "1991",
  ISBN =         "0-85296-519-2",
  ISBN-13 =      "978-0-85296-519-1",
  ISSN =         "0537-9989",
  LCCN =         "QA76.58.I567 1991",
  bibdate =      "Mon Sep 9 07:55:25 MDT 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  confdate =     "15--19 April 1991",
  conflocation = "Lisbon, Portugal",
  confsponsor =  "Office of Naval Res. Eur. Office",
  pubcountry =   "UK",

  editor =       "{IEEE}",
  booktitle =    "Proceedings, Supercomputing '91: Albuquerque, New
                 Mexico, November 18--22, 1991",
  title =        "Proceedings, Supercomputing '91: Albuquerque, New
                 Mexico, November 18--22, 1991",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxiii + 917",
  year =         "1991",
  ISBN =         "0-8186-9158-1 (IEEE case), 0-8186-2158-3 (IEEE paper),
                 0-8186-6158-5 (IEEE microfiche), 0-89791-459-7 (ACM)",
  ISBN-13 =      "978-0-8186-9158-4 (IEEE case), 978-0-8186-2158-1 (IEEE
                 paper), 978-0-8186-6158-7 (IEEE microfiche),
                 978-0-89791-459-8 (ACM)",
  LCCN =         "QA76.5 .S894 1991",
  bibdate =      "Fri Aug 30 08:01:51 MDT 1996",
  bibsource =    ";
                 University of California MELVYL catalog",
  note =         "ACM order number 415913. IEEE Computer Society Press
                 order number 2158. IEEE catalog number 91CH3058-5.",
  acknowledgement = ack-nhfb,
  classification = "C5440 (Multiprocessor systems and techniques); C5470
                 (Performance evaluation and testing); C6110P (Parallel
  keywords =     "combinatorial algorithms; data dependence; distributed
                 memory code generation; high school environment;
                 latency tolerance; memory access; numerical algorithms;
                 parallel processing; parallel programming; performance
                 evaluation; performance tools; processor design;
                 program analysis; storage hierarchy optimization;
                 supercomputer benchmarks; supercomputer congresses;
                 supercomputing; system issues",

  editor =       "Quentin Stout and Michael Wolfe",
  booktitle =    "The Sixth Distributed Memory Computing Conference
                 Proceedings: April 28--May 1, 1991, Portland, Oregon",
  title =        "The Sixth Distributed Memory Computing Conference
                 Proceedings: April 28--May 1, 1991, Portland, Oregon",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xx + 736",
  year =         "1991",
  ISBN =         "0-8186-2290-3 (paperback), 0-8186-2291-1 (fiche)",
  ISBN-13 =      "978-0-8186-2290-8 (paperback), 978-0-8186-2291-5
  LCCN =         "QA76.5 .D58 1991",
  bibdate =      "Mon Jan 15 11:06:03 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Hojjat Adeli",
  booktitle =    "Supercomputing in engineering analysis",
  title =        "Supercomputing in engineering analysis",
  volume =       "1",
  publisher =    pub-DEKKER,
  address =      pub-DEKKER:adr,
  pages =        "xi + 362",
  year =         "1992",
  ISBN =         "0-8247-8559-2",
  ISBN-13 =      "978-0-8247-8559-8",
  LCCN =         "TA345.S87; TA345 .S87 1991; TA345 .S87 1992",
  bibdate =      "Mon Jan 2 16:25:45 MST 2006",
  bibsource =    ";
  series =       "New generation computing",
  acknowledgement = ack-nhfb,
  subject =      "Engineering; Data processing; Supercomputers; Vector
                 processing (Computer science); Parallel processing
                 (Electronic computers)",

  editor =       "Jack Dongarra and Ken Kennedy and Paul Messina and
                 Danny C. Sorensen and Robert G. Voigt",
  booktitle =    "{Proceedings of the Fifth SIAM Conference on Parallel
                 Processing for Scientific Computing (Houston, TX, March
                 25--27, 1991)}",
  title =        "{Proceedings of the Fifth SIAM Conference on Parallel
                 Processing for Scientific Computing (Houston, TX, March
                 25--27, 1991)}",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xvii + 648",
  year =         "1992",
  ISBN =         "0-89871-303-X",
  ISBN-13 =      "978-0-89871-303-9",
  LCCN =         "QA76.58 .P76 1992",
  MRclass =      "65Y05 (65Fxx 90-04 90C30)",
  MRnumber =     "93g:65178",
  bibdate =      "Thu Dec 19 14:26:03 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "D. F. Griffiths and G. A. Watson",
  booktitle =    "Numerical analysis, 1991: proceedings of the 14th
                 Dundee Conference, June 1991",
  title =        "Numerical analysis, 1991: proceedings of the 14th
                 Dundee Conference, June 1991",
  volume =       "260",
  publisher =    pub-LONGMAN,
  address =      pub-LONGMAN:adr,
  pages =        "292",
  year =         "1992",
  ISBN =         "0-582-08908-5",
  ISBN-13 =      "978-0-582-08908-2",
  LCCN =         "QA297.D85 1991",
  bibdate =      "Mon Jan 15 11:24:40 1996",
  bibsource =    "",
  series =       "Pitman Res. Notes Math. Ser.",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  key =          "SHPCC-92",
  booktitle =    "Scalable High Performance Computing Conference,
                 {SHPCC}-92, April 26--29, 1992, Williamsburg,
  title =        "Scalable High Performance Computing Conference,
                 {SHPCC}-92, April 26--29, 1992, Williamsburg,
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiii + 448",
  year =         "1992",
  ISBN =         "0-8186-2775-1",
  ISBN-13 =      "978-0-8186-2775-0",
  LCCN =         "QA76.76.A65 S33 1992",
  bibdate =      "Fri Dec 30 11:18:38 1994",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "R. H. Perrott",
  booktitle =    "Software for parallel computers",
  title =        "Software for parallel computers",
  publisher =    pub-CHAPMAN-HALL,
  address =      pub-CHAPMAN-HALL:adr,
  pages =        "350",
  year =         "1992",
  ISBN =         "0-412-39960-1",
  ISBN-13 =      "978-0-412-39960-2",
  LCCN =         "QA76.58.S63 1992",
  bibdate =      "Mon Sep 09 08:27:07 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "H. J. Siegel",
  booktitle =    "The Fourth Symposium on the Frontiers of Massively
                 Parallel Computation: Frontiers '92 / October 19--21,
                 1992, {McLean}, Virginia",
  title =        "The Fourth Symposium on the Frontiers of Massively
                 Parallel Computation: Frontiers '92 / October 19--21,
                 1992, {McLean}, Virginia",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xviii + 592",
  year =         "1992",
  ISBN =         "0-8186-2772-7 (hardback), 0-8186-2771-9 (microfiche)",
  ISBN-13 =      "978-0-8186-2772-9 (hardback), 978-0-8186-2771-2
  LCCN =         "QA76.58 .S95 1992",
  bibdate =      "Mon Jan 15 11:06:11 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Jack J. Dongarra and Wolfgang Gentzsch",
  booktitle =    "Computer Benchmarks",
  title =        "Computer Benchmarks",
  volume =       "8",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xiv + 349",
  year =         "1993",
  ISBN =         "0-444-81518-X",
  ISBN-13 =      "978-0-444-81518-7",
  LCCN =         "QA76.9.E94 C63 1993",
  bibdate =      "Mon Jan 15 11:06:15 1996",
  bibsource =    ";
  series =       "Advances in Parallel Computing",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "J. J. Dongarra and B. Tourancheau",
  booktitle =    "Environments and Tools for Parallel Scientific
                 Computing (Saint Hilaire du Touvet, France, September
                 7--8, 1992)",
  title =        "Environments and Tools for Parallel Scientific
                 Computing (Saint Hilaire du Touvet, France, September
                 7--8, 1992)",
  publisher =    pub-NH,
  address =      pub-NH:adr,
  pages =        "xvii + 362",
  year =         "1993",
  ISBN =         "0-444-89963-4",
  ISBN-13 =      "978-0-444-89963-7",
  LCCN =         "QA76.642 .E58 1993",
  bibdate =      "Mon Jan 15 11:06:18 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "A. E. Fincham and B. Ford",
  booktitle =    "Parallel Computation Conference --- September 1991,
                 St. Catherine's College, Oxford, {UK}",
  title =        "Parallel Computation Conference --- September 1991,
                 St. Catherine's College, Oxford, {UK}",
  volume =       "46",
  publisher =    pub-CLARENDON,
  address =      pub-CLARENDON:adr,
  pages =        "x + 366",
  year =         "1993",
  ISBN =         "0-19-853680-1",
  ISBN-13 =      "978-0-19-853680-2",
  ISSN =         "0960-2526",
  LCCN =         "QA76.58.P3755 1993",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  series =       "Institute of Mathematics and its Applications
                 Conference Series",
  acknowledgement = ack-nhfb,
  sponsor =      "Institute of Mathematics and its Applications.",

  editor =       "Geerd-R. Hoffmann and Tuomo Kauranne",
  booktitle =    "Parallel supercomputing in atmospheric science:
                 proceedings of the fifth {ECMWF} Workshop on the Use of
                 Parallel Processors in Meteorology, Reading {UK},
                 November 23--27, 1992",
  title =        "Parallel supercomputing in atmospheric science:
                 proceedings of the fifth {ECMWF} Workshop on the Use of
                 Parallel Processors in Meteorology, Reading {UK},
                 November 23--27, 1992",
  publisher =    pub-WORLD-SCI,
  address =      pub-WORLD-SCI:adr,
  pages =        "ix + 532",
  year =         "1993",
  ISBN =         "981-02-1429-4",
  ISBN-13 =      "978-981-02-1429-6",
  LCCN =         "QA76.58 E354 1992",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "European Centre for Medium-Range Weather Forecasts.",

  editor =       "{IEEE}",
  key =          "Supercomputing'93",
  booktitle =    "Proceedings, Supercomputing '93: Portland, Oregon,
                 November 15--19, 1993",
  title =        "Proceedings, Supercomputing '93: Portland, Oregon,
                 November 15--19, 1993",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxii + 935",
  year =         "1993",
  ISBN =         "0-8186-4340-4 (paperback), 0-8186-4341-2 (microfiche),
                 0-8186-4342-0 (hardback), 0-8186-4346-3 (CD-ROM)",
  ISBN-13 =      "978-0-8186-4340-8 (paperback), 978-0-8186-4341-5
                 (microfiche), 978-0-8186-4342-2 (hardback),
                 978-0-8186-4346-0 (CD-ROM)",
  ISSN =         "1063-9535",
  LCCN =         "QA76.5 .S96 1993",
  bibdate =      "Mon Jan 15 11:06:21 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classification = "631.1; 722.1; 722.3; 722.4; 723.2; 921.6",
  keywords =     "Algorithms; Cache coherence; Clustered workstations;
                 Computer graphics; Computer networks; Computer
                 programming languages; Data parallel compilers; Data
                 partitioning; Distributed computer systems; Eigenvalues
                 and eigenfunctions; Finite element method; Flow
                 visualization; Fluid mechanics; Linear algebra; Mass
                 storage; Massively parallel processors; Natural
                 sciences computing; Parallel languages; Parallel
                 processing systems; Parallel rendering; Program
                 compilers; Quantum theory; Scheduling; Sparse matrices;
  sponsor =      "Institute of Electrical and Electronics Engineers;
                 Computer Society. Association for Computing Machinery;

  editor =       "J. S. Kowalik and L. Grandinetti",
  booktitle =    "Software for Parallel Computation: Proceedings of the
                 {NATO} Advanced Workshop on Software for Parallel
                 Computation, held at Cetraro, Cosenza, Italy, June
                 22--26, 1992",
  title =        "Software for Parallel Computation: Proceedings of the
                 {NATO} Advanced Workshop on Software for Parallel
                 Computation, held at Cetraro, Cosenza, Italy, June
                 22--26, 1992",
  volume =       "106",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "ix + 363",
  year =         "1993",
  ISBN =         "3-540-56451-9 (Berlin), 0-387-56451-9 (New York)",
  ISBN-13 =      "978-3-540-56451-5 (Berlin), 978-0-387-56451-7 (New
                 York)",
  LCCN =         "QA76.58 .S629 1993",
  bibdate =      "Mon Jan 15 11:06:25 1996",
  bibsource =    "",
  series =       "NATO ASI Series F",
  acknowledgement = ack-nhfb,

  editor =       "R. F. Sincovec",
  booktitle =    "{SIAM} Conference on Parallel Processing for
                 Scientific Computing (6th: 1993: Norfolk, {VA},
  title =        "{SIAM} Conference on Parallel Processing for
                 Scientific Computing (6th: 1993: Norfolk, {VA},
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "xix + 1041 + iv",
  year =         "1993",
  ISBN =         "0-89871-315-3",
  ISBN-13 =      "978-0-89871-315-2",
  LCCN =         "QA 76.58 S55 1993",
  bibdate =      "Thu Feb 29 17:59:11 MST 1996",
  bibsource =    "",
  note =         "Two volumes.",
  acknowledgement = ack-nhfb,
  sponsor =      "Society for Industrial and Applied Mathematics.",

  editor =       "Anonymous",
  booktitle =    "High Performance Computing and Communications 1st
                 Symposium -- March 1994, Alexandria, {VA}, {USA}",
  title =        "High Performance Computing and Communications 1st
                 Symposium -- March 1994, Alexandria, {VA}, {USA}",
  publisher =    "ARPA-CSTO",
  address =      "Arlington, VA, USA",
  pages =        "????",
  year =         "1994",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Anonymous",
  booktitle =    "Object oriented numerics: Annual conference: 2nd ---
                 April 1994, Sunriver, {OR}",
  title =        "Object oriented numerics: Annual conference: 2nd ---
                 April 1994, Sunriver, {OR}",
  publisher =    "RWS",
  address =      "Corvallis, OR",
  pages =        "????",
  year =         "1994",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "J. J. Dongarra and Jerzy Wa{\'s}niewski",
  booktitle =    "{Parallel scientific computing: First International
                 Workshop, PARA '94, Lyngby, Denmark, June 20--23, 1994:
  title =        "{Parallel scientific computing: First International
                 Workshop, PARA '94, Lyngby, Denmark, June 20--23, 1994:
  volume =       "879",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xi + 566",
  year =         "1994",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-58712-8 (Berlin), 0-387-58712-8 (New York)",
  ISBN-13 =      "978-3-540-58712-5 (Berlin), 978-0-387-58712-7 (New
                 York)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .P35 1994",
  bibdate =      "Fri Apr 12 07:40:14 1996",
  bibsource =    "",
  price =        "DM104.00",
  series =       ser-LNCS,
  URL =          ";
  acknowledgement = ack-nhfb,
  keywords =     "parallel processing (electronic computers) ---
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  sponsor =      "Danish Computing Centre for Research and Education.
                 Technical University of Denmark; Institute for
                 Mathematical Modelling.",

  editor =       "J. J. Dongarra and B. Tourancheau",
  booktitle =    "Proceedings of the Second Workshop on Environments and
                 Tools for Parallel Scientific Computing, Townsend,
                 {TN}, {USA}, May 25--27, 1994",
  title =        "Proceedings of the Second Workshop on Environments and
                 Tools for Parallel Scientific Computing, Townsend,
                 {TN}, {USA}, May 25--27, 1994",
  publisher =    pub-SIAM,
  address =      pub-SIAM:adr,
  pages =        "x + 292",
  year =         "1994",
  ISBN =         "0-89871-343-9",
  ISBN-13 =      "978-0-89871-343-5",
  LCCN =         "QA76.58.I568 1994",
  bibdate =      "Sat May 11 12:16:44 MDT 1996",
  bibsource =    "",
  series =       "Proceedings of the Workshop on Environments and Tools
                 for Parallel Scientific Computing",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "John E. Gilbert and Donald Kershaw",
  booktitle =    "{Large-scale matrix problems and the numerical
                 solution of partial differential equations: 5th Summer
                 school in numerical analysis --- July 1992, Lancaster,
  title =        "{Large-scale matrix problems and the numerical
                 solution of partial differential equations: 5th Summer
                 school in numerical analysis --- July 1992, Lancaster,
  volume =       "3",
  publisher =    pub-CLARENDON,
  address =      pub-CLARENDON:adr,
  pages =        "viii + 212",
  year =         "1994",
  ISBN =         "0-19-853463-9",
  ISBN-13 =      "978-0-19-853463-1",
  LCCN =         "QA374.L335 1994",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  series =       "Advances in Numerical Analysis",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings of the Scalable High-Performance Computing
                 Conference, May 23--25, 1994, Knoxville, Tennessee",
  title =        "Proceedings of the Scalable High-Performance Computing
                 Conference, May 23--25, 1994, Knoxville, Tennessee",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xviii + 852",
  year =         "1994",
  ISBN =         "0-8186-5680-8, 0-8186-5681-6",
  ISBN-13 =      "978-0-8186-5680-4, 978-0-8186-5681-1",
  LCCN =         "QA76.58.S32 1994",
  bibdate =      "Thu Feb 29 17:59:11 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE Computer Society; Technical Committee on
                 Supercomputing Applications.",

  editor =       "{IEEE}",
  booktitle =    "Proceedings of the Scalable Parallel Libraries
                 Conference, October 6--8, 1993, Mississippi State,
  title =        "Proceedings of the Scalable Parallel Libraries
                 Conference, October 6--8, 1993, Mississippi State,
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "vii + 261",
  year =         "1994",
  ISBN =         "0-8186-4980-1 (paper), 0-8186-4981-X (microfiche)",
  ISBN-13 =      "978-0-8186-4980-6 (paper), 978-0-8186-4981-3
                 (microfiche)",
  LCCN =         "QA76.58 .S34 1993",
  bibdate =      "Sat Mar 22 18:40:38 1997",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings of the Third {IEEE} International
                 Symposium on High Performance Distributed Computing,
                 August 2--5, 1994, San Francisco, {CA}, {USA}",
  title =        "Proceedings of the Third {IEEE} International
                 Symposium on High Performance Distributed Computing,
                 August 2--5, 1994, San Francisco, {CA}, {USA}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiii + 304",
  year =         "1994",
  ISBN =         "0-8186-6395-2, 0-8186-6396-0",
  ISBN-13 =      "978-0-8186-6395-6, 978-0-8186-6396-3",
  LCCN =         "QA76.9.D5I328 1994",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  note =         "IEEE catalog number 94TH0667-6.",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE; Computer Society; Technical Committee on
                 Distributed Processing.",

  editor =       "Howard Jay Siegel",
  booktitle =    "Proceedings: Eighth International Parallel Processing
                 Symposium, April 26--29, 1994, Cancun, Mexico",
  title =        "Proceedings: Eighth International Parallel Processing
                 Symposium, April 26--29, 1994, Cancun, Mexico",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxx + 966",
  year =         "1994",
  ISBN =         "0-8186-5602-6, 0-8186-5601-8",
  ISBN-13 =      "978-0-8186-5602-6, 978-0-8186-5601-9",
  ISSN =         "1063-7133",
  LCCN =         "QA 76.58 I56 1994",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE.",

  editor =       "J. J. Dongarra and others",
  booktitle =    "High performance computing: technology, methods, and
                 applications (Advanced workshop, June 1994, Cetraro,
  title =        "High performance computing: technology, methods, and
                 applications (Advanced workshop, June 1994, Cetraro,
  volume =       "10",
  publisher =    pub-ELSEVIER,
  address =      pub-ELSEVIER:adr,
  pages =        "viii + 427",
  year =         "1995",
  ISBN =         "0-444-82163-5",
  ISBN-13 =      "978-0-444-82163-8",
  ISSN =         "0927-5452",
  LCCN =         "QA76.88.H55 1995",
  bibdate =      "Thu Feb 29 17:59:11 MST 1996",
  bibsource =    "",
  series =       "Advances in Parallel Computing",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "{IEEE}",
  booktitle =    "Digest of papers / the Twenty-fifth International
                 Symposium on Fault-Tolerant Computing, June 27--30,
                 1995, Pasadena, California",
  title =        "Digest of papers / the Twenty-fifth International
                 Symposium on Fault-Tolerant Computing, June 27--30,
                 1995, Pasadena, California",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxiii + 547",
  year =         "1995",
  CODEN =        "DPFTDL",
  ISBN =         "0-8186-7079-7, 0-8186-7145-9",
  ISBN-13 =      "978-0-8186-7079-4, 978-0-8186-7145-6",
  ISSN =         "0731-3071",
  LCCN =         "QA 76.9 F38 I57 1995",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  note =         "IEEE catalog number 95CH35823.",
  series =       "FTCS 25th",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE. Computer Society. Technical Committee on Fault-
                 Tolerant Computing.",

  editor =       "{IEEE}",
  booktitle =    "Fourth heterogeneous computing workshop: April 25,
                 1995, Santa Barbara, {CA}",
  title =        "Fourth heterogeneous computing workshop: April 25,
                 1995, Santa Barbara, {CA}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "viii + 121",
  year =         "1995",
  ISBN =         "0-8186-7121-1",
  ISBN-13 =      "978-0-8186-7121-0",
  LCCN =         "QA76.9.D5 H48 1995",
  bibdate =      "Tue Feb 26 06:09:52 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings of the Fifth {IEEE} Computer Society
                 Workshop on Future Trends of Distributed Computing
                 Systems, August 28--30, 1995, Cheju Island, Korea",
  title =        "Proceedings of the Fifth {IEEE} Computer Society
                 Workshop on Future Trends of Distributed Computing
                 Systems, August 28--30, 1995, Cheju Island, Korea",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xi + 531",
  year =         "1995",
  ISBN =         "0-8186-7125-4",
  ISBN-13 =      "978-0-8186-7125-8",
  LCCN =         "QA76.9.D5 I24 1995",
  bibdate =      "Fri Mar 1 10:04:10 MST 1996",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE. Computer Society. Technical Committee on
                 Distributed Processing.",

  editor =       "Sidney Karin",
  booktitle =    "Proceedings of the 1995 {ACM\slash IEEE}
                 Supercomputing Conference, December 3--8, 1995, San
                 Diego Convention Center, San Diego, {CA}, {USA}",
  title =        "Proceedings of the 1995 {ACM\slash IEEE}
                 Supercomputing Conference, December 3--8, 1995, San
                 Diego Convention Center, San Diego, {CA}, {USA}",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  year =         "1995",
  ISBN =         "0-7803-3604-6, 0-89791-862-2, 0-7803-3605-4",
  ISBN-13 =      "978-0-7803-3604-9, 978-0-89791-862-6,
  ISSN =         "1063-9535",
  LCCN =         "QA76.88 .S856 1995",
  bibdate =      "Thu Nov 7 06:34:19 1996",
  bibsource =    "",
  note =         "ACM order number 415932. IEEE Order Plan catalog
                 number 95CB35990. These proceedings are not available
                 in printed form. However, they are available on the
                 World Wide Web, and on CD-ROM, available from ACM (ACM
                 Press order number 415952) and IEEE (IEEE Computer
                 Society Press order number FW07435).",
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "{ACM}",
  booktitle =    "Supercomputing '96 Conference Proceedings: November
                 17--22, Pittsburgh, {PA}",
  title =        "Supercomputing '96 Conference Proceedings: November
                 17--22, Pittsburgh, {PA}",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  pages =        "????",
  year =         "1996",
  ISBN =         "0-89791-854-1",
  ISBN-13 =      "978-0-89791-854-1",
  LCCN =         "QA76.88 .S8573 1996",
  bibdate =      "Mon Mar 23 12:30:13 1998",
  bibsource =    "",
  note =         "ACM Order Number: 415962, IEEE Computer Society Press
                 Order Number: RS00126.",
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Arndt Bode and J. Dongarra and T. Ludwig and V.
  booktitle =    "Parallel virtual machine, {EuroPVM} '96: third
                 European {PVM} conference, Munich, Germany, October
                 7--9, 1996: proceedings",
  title =        "Parallel virtual machine, {EuroPVM} '96: third
                 European {PVM} conference, Munich, Germany, October
                 7--9, 1996: proceedings",
  volume =       "1156",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xiv + 362",
  year =         "1996",
  ISBN =         "3-540-61779-5",
  ISBN-13 =      "978-3-540-61779-2",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .E975 1996 Bar",
  bibdate =      "Sat Dec 21 16:06:37 MST 1996",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "Parallel computers -- Congresses; Virtual computer
                 systems -- Congresses.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "L. (Luc) Bouge",
  booktitle =    "{Euro-Par'96}: parallel processing: second
                 International {Euro-Par} Conference, Lyon, France,
                 August 26--29, 1996: proceedings",
  title =        "{Euro-Par'96}: parallel processing: second
                 International {Euro-Par} Conference, Lyon, France,
                 August 26--29, 1996: proceedings",
  volume =       "1123, 1124",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "various",
  year =         "1996",
  ISBN =         "3-540-61626-8 (vol. 1), 3-540-61627-6 (vol. 2)",
  ISBN-13 =      "978-3-540-61626-9 (vol. 1), 978-3-540-61627-6 (vol.
                 2)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58.I554 1996",
  bibdate =      "Sat Sep 7 08:18:27 MDT 1996",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "Parallel processing (Electronic computers) ---

  editor =       "J. J. Dongarra and Kaj Madsen and Jerzy
                 Wa{\'s}niewski",
  booktitle =    "Applied parallel computing: computations in physics,
                 chemistry, and engineering science: second
                 international workshop, {PARA} '95, Lyngby, Denmark,
                 August 21--24, 1995: proceedings",
  title =        "Applied parallel computing: computations in physics,
                 chemistry, and engineering science: second
                 international workshop, {PARA} '95, Lyngby, Denmark,
                 August 21--24, 1995: proceedings",
  volume =       "1041",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "562",
  year =         "1996",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-60902-4",
  ISBN-13 =      "978-3-540-60902-5",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .P35 1995",
  MRclass =      "65-06",
  MRnumber =     "1 320 056",
  bibdate =      "Thu Dec 19 14:25:58 1996",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "Chemistry -- Data processing -- Congresses;
                 Engineering -- Data processing -- Congresses.; Parallel
                 processing (Electronic computers) -- Congresses;
                 Physics -- Data processing -- Congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "{IEEE}",
  booktitle =    "Frontiers '96: The Sixth Symposium of Massively
                 Parallel Computing: October 27--31, 1996, Annapolis,
  title =        "Frontiers '96: The Sixth Symposium of Massively
                 Parallel Computing: October 27--31, 1996, Annapolis,
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiv + 372",
  year =         "1996",
  ISBN =         "0-8186-7551-9 (paper), 0-8186-7553-5 (microfiche)",
  ISBN-13 =      "978-0-8186-7551-5 (paper), 978-0-8186-7553-9
                 (microfiche)",
  ISSN =         "1088-4955",
  LCCN =         "QA76.58 .S95 1996",
  bibdate =      "Tue Dec 10 09:22:15 1996",
  bibsource =    "",
  note =         "IEEE Computer Society Press Order Number PR07551. IEEE
                 order plan catalog number 96TB100062.",
  series =       "Symposium on the Frontiers of Massively Parallel
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Heterogeneous computing workshop: 5th --- April 1996,
                 Honolulu, {HI}",
  title =        "Heterogeneous computing workshop: 5th --- April 1996,
                 Honolulu, {HI}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "????",
  year =         "1996",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Heather Mary Liddell and A. Colbrook and B.
                 Hertzberger and P. Sloot",
  booktitle =    "High-performance computing and networking:
                 international conference and exhibition, {HPCN}
                 {EUROPE} 1996, Brussels, Belgium, April 15--19, 1996:
  title =        "High-performance computing and networking:
                 international conference and exhibition, {HPCN}
                 {EUROPE} 1996, Brussels, Belgium, April 15--19, 1996:
  volume =       "1067",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxv + 1040",
  year =         "1996",
  ISBN =         "3-540-61142-8 (paperback)",
  ISBN-13 =      "978-3-540-61142-4 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.88 .H52 1996",
  bibdate =      "Sat Dec 21 16:06:37 MST 1996",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "computer networks --- congresses; supercomputers ---

  editor =       "Jerzy Wa{\'s}niewski and J. Dongarra and K. Madsen and
                 D. Olesen",
  booktitle =    "Applied parallel computing: industrial-strength
                 computation and optimization: Third International
                 Workshop, {PARA} 96, Lyngby, Denmark, August 18--21,
                 1996: proceedings",
  title =        "Applied parallel computing: industrial-strength
                 computation and optimization: Third International
                 Workshop, {PARA} 96, Lyngby, Denmark, August 18--21,
                 1996: proceedings",
  volume =       "1184",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xiii + 722",
  year =         "1996",
  ISBN =         "3-540-62095-8 (softcover)",
  ISBN-13 =      "978-3-540-62095-2 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .P35 1996",
  bibdate =      "Sat Dec 21 16:06:37 MST 1996",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "Parallel processing (Electronic computers) --
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "{ACM}",
  booktitle =    "{SC'97: High Performance Networking and Computing:
                 Proceedings of the 1997 ACM\slash IEEE SC97 Conference:
                 November 15--21, 1997, San Jose, California, USA}",
  title =        "{SC'97: High Performance Networking and Computing:
                 Proceedings of the 1997 ACM\slash IEEE SC97 Conference:
                 November 15--21, 1997, San Jose, California, USA}",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  pages =        "vii + 159",
  year =         "1997",
  ISBN =         "0-89791-985-8",
  ISBN-13 =      "978-0-89791-985-2",
  LCCN =         "QA76.9.A25 A265 1997",
  bibdate =      "Sat Mar 21 09:10:00 1998",
  bibsource =    ";
  note =         "ACM SIGARCH order number 415972. IEEE Computer Society
                 Press order number RS00160.",
  URL =          ";
  acknowledgement = ack-nhfb,
  xxnote =       "Check ISBN: UC/Melvyl has this one for ``Proceedings /
                 Second ACM Workshop on Role-Based Access Control,
                 Fairfax, Virginia, USA, November 6--7, 1997''.",

  editor =       "Anonymous",
  booktitle =    "Vector and parallel computing: Workshop: 21st ---
                 March 1997",
  title =        "Vector and parallel computing: Workshop: 21st ---
                 March 1997",
  volume =       "11(1)",
  publisher =    "SPEEDUP Society",
  address =      "Manno, Switzerland",
  pages =        "????",
  year =         "1997",
  ISSN =         "1421-6337",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "Speedup.",

  editor =       "R. F. Boisvert",
  booktitle =    "Quality of numerical software: assessment and
                 enhancement / proceedings of the {IFIP} {TC2/WG2.5}
                 Working Conference on the Quality of Numerical
                 Software, Assessment and Enhancement, Oxford, United
                 Kingdom, 8--12 July 1996",
  title =        "Quality of numerical software: assessment and
                 enhancement / proceedings of the {IFIP} {TC2}/{WG2}.5
                 Working Conference on the Quality of Numerical
                 Software, Assessment and Enhancement, Oxford, United
                 Kingdom, 8--12 July 1996",
  publisher =    pub-CHAPMAN-HALL,
  address =      pub-CHAPMAN-HALL:adr,
  pages =        "vii + 384",
  year =         "1997",
  ISBN =         "0-412-80530-8",
  ISBN-13 =      "978-0-412-80530-1",
  LCCN =         "QA297 .I35 1996",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "IFIP; Technical Committee 2/Working Group 2.5.",

  editor =       "Marian Bubak and J. J. Dongarra and Jerzy
                 Wa{\'s}niewski",
  booktitle =    "Recent advances in parallel virtual machine and
                 message passing interface: 4th European {PVM}\slash
                 {MPI} user's group meeting Cracow, Poland, November
                 3--5, 1997: proceedings",
  title =        "Recent advances in parallel virtual machine and
                 message passing interface: 4th European {PVM}\slash
                 {MPI} user's group meeting Cracow, Poland, November
                 3--5, 1997: proceedings",
  volume =       "1332",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xv + 518",
  year =         "1997",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-63697-8 (paperback)",
  ISBN-13 =      "978-3-540-63697-7 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58.E973 1997",
  bibdate =      "Mon Nov 24 09:49:54 MST 1997",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "Computer networks -- Congresses.; Parallel computers
                 -- Congresses.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "J. J. Dongarra and Bernard Tourancheau",
  booktitle =    "Proceedings of the Third Workshop on Environments and
                 Tools for Parallel Scientific Computing",
  title =        "Proceedings of the Third Workshop on Environments and
                 Tools for Parallel Scientific Computing",
  volume =       "11(2)",
  publisher =    "Sage Science Press",
  address =      "Thousand Oaks, CA, USA",
  pages =        "83--176",
  year =         "1997",
  LCCN =         "QA 76.5 I55 v.11 no.2 1997",
  bibdate =      "Wed Mar 18 12:33:29 MST 1998",
  bibsource =    "",
  series =       "International Journal of Supercomputer Applications
                 and High Performance Computing",
  acknowledgement = ack-nhfb,
  alttitle =     "Environments and Tools for Parallel Scientific
  keywords =     "Parallel processing (Electronic computers) ---
                 Congresses.; Parallel programming (Computer science)
                 --- Congresses.",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",
  xxISBN =       "none",

  editor =       "J. J. Dongarra and Jose M. L. M. Palma",
  booktitle =    "{Vector and parallel processing---VECPAR '96: Second
                 International Conference on Vector and Parallel
                 Processing-Systems and Applications, Porto, Portugal,
                 September 25--27, 1996: Selected Papers}",
  title =        "{Vector and parallel processing---VECPAR '96: Second
                 International Conference on Vector and Parallel
                 Processing-Systems and Applications, Porto, Portugal,
                 September 25--27, 1996: Selected Papers}",
  volume =       "1215",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xi + 469",
  year =         "1997",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-62828-2",
  ISBN-13 =      "978-3-540-62828-6",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .I552 1996",
  bibdate =      "Mon Aug 25 09:50:07 MDT 1997",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          ";
  acknowledgement = ack-nhfb,
  keywords =     "parallel processing (electronic computers) ---
                 congresses; vector processing (computer science) ---
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Andrzej Goscinski and Michael Hobbs and Wanlei Zhou",
  booktitle =    "1997 3rd International Conference on Algorithms and
                 Architectures for Parallel Processing: {ICA3PP/97}:
                 Melbourne, Australia, December 10--12, 1997",
  title =        "1997 3rd International Conference on Algorithms and
                 Architectures for Parallel Processing: {ICA3PP}/97:
                 Melbourne, Australia, December 10--12, 1997",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiii + 765",
  year =         "1997",
  ISBN =         "0-7803-4229-1 (softbound), 0-7803-4230-5
  ISBN-13 =      "978-0-7803-4229-3 (softbound), 978-0-7803-4230-9
  LCCN =         "QA76.58 .I528 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "Deakin University; Faculty of Science and Technology.
                 Institute of Electrical and Electronics Engineers;
                 Victorian Section.",

  editor =       "Lucio Grandinetti and Janusz Kowalik and Marian
  booktitle =    "High performance computing: technology and
                 applications: {NATO} Advanced Research Workshop ---
                 24--26 June 1996, Cetraro, Italy",
  title =        "High performance computing: technology and
                 applications: {NATO} Advanced Research Workshop ---
                 24--26 June 1996, Cetraro, Italy",
  volume =       "30",
  publisher =    pub-KLUWER,
  address =      pub-KLUWER:adr,
  pages =        "xi + 355",
  year =         "1997",
  ISBN =         "0-7923-4550-9",
  ISBN-13 =      "978-0-7923-4550-3",
  LCCN =         "QA76.88 .A38 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  series =       "NATO ASI Series 3 High Technology",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "High performance computing on the information
                 superhighway, {HPC} Asia '97: proceedings, Seoul,
                 Korea, April 28--May 2, 1997",
  title =        "High performance computing on the information
                 superhighway, {HPC} Asia '97: proceedings, Seoul,
                 Korea, April 28--May 2, 1997",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxii + 760",
  year =         "1997",
  ISBN =         "0-8186-7901-8, 0-8186-7902-6 (casebound),
                 0-8186-7903-4 (microfiche)",
  ISBN-13 =      "978-0-8186-7901-8, 978-0-8186-7902-5 (casebound),
                 978-0-8186-7903-2 (microfiche)",
  LCCN =         "QA76.88 .H653 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  note =         "IEEE Order Plan number 97TB100110.",
  series =       "HPC ASIA 1997",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings: 1997 International Conference on Parallel
                 Architectures and Compilation Techniques: San
                 Francisco, California, November 10--14, 1997",
  title =        "Proceedings: 1997 International Conference on Parallel
                 Architectures and Compilation Techniques: San
                 Francisco, California, November 10--14, 1997",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "ix + 319",
  year =         "1997",
  ISBN =         "0-8186-8090-3",
  ISBN-13 =      "978-0-8186-8090-8",
  LCCN =         "QA76.58 .I5445 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE.",

  editor =       "Achim Sydow",
  booktitle =    "15th {IMACS} World Congress on Scientific Computation,
                 Modelling and Applied Mathematics: Berlin, August 1997:
                 proceedings",
  title =        "15th {IMACS} World Congress on Scientific Computation,
                 Modelling and Applied Mathematics: Berlin, August 1997:
                 proceedings",
  publisher =    "Wissenschaft \& Technik Verlag",
  address =      "Berlin, Germany",
  pages =        "various",
  year =         "1997",
  ISBN =         "3-89685-550-6 (set), 3-89685-551-4 (vol. 1),
                 3-89685-552-2 (vol. 2), 3-89685-553-0 (vol.
                 3), 3-89685-554-9 (vol. 4), 3-89685-555-7 (vol. 5),
                 3-89685-556-5 (vol. 6)",
  ISBN-13 =      "978-3-89685-550-3 (set), 978-3-89685-551-0 (vol. 1),
                 978-3-89685-552-7 (vol. 2), 978-3-89685-553-4 (vol. 3),
                 978-3-89685-554-1 (vol. 4), 978-3-89685-555-8 (vol. 5),
                 978-3-89685-556-5 (vol. 6)",
  LCCN =         "Q183.9 .I46 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  note =         "In cooperation with R.-P. Schafer, W. Rufeger, and H.
  series =       "IMACS World Congress",
  acknowledgement = ack-nhfb,
  sponsor =      "IMACS.",

  editor =       "L. Thiele",
  booktitle =    "{IEEE} International Conference on
                 Application-Specific Systems, Architectures and
                 Processors: proceedings, July 14--16, 1997: Zurich,
                 Switzerland",
  title =        "{IEEE} International Conference on
                 Application-Specific Systems, Architectures and
                 Processors: proceedings, July 14--16, 1997: Zurich,
                 Switzerland",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xii + 540",
  year =         "1997",
  ISBN =         "0-8186-7959-X (casebound), 0-8186-7958-1,
                 0-8186-7960-3 (microfiche)",
  ISBN-13 =      "978-0-8186-7959-9 (casebound), 978-0-8186-7958-2,
                 978-0-8186-7960-5 (microfiche)",
  ISSN =         "1063-6862",
  LCCN =         "TK7874.6 .I58 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE; Computer Society; Technical Committee on VLSI.",

  editor =       "{ACM}",
  booktitle =    "{ACM 1998} Workshop on Java for High-Performance
                 Network Computing, February 28 and March 1, 1998",
  title =        "{ACM} 1998 Workshop on Java for High-Performance
                 Network Computing, February 28 and March 1, 1998",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "????",
  year =         "1998",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Tue Feb 26 08:15:29 2002",
  bibsource =    "",
  note =         "Possibly unpublished, except electronically.",
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "{ACM}",
  booktitle =    "{SC'98}: High Performance Networking and Computing:
                 Proceedings of the 1998 {ACM\slash} {IEEE} {SC98}
                 Conference: Orange County Convention Center, Orlando,
                 Florida, {USA}, November 7--13, 1998",
  title =        "{SC}'98: High Performance Networking and Computing:
                 Proceedings of the 1998 {ACM}\slash {IEEE} {SC98}
                 Conference: Orange County Convention Center, Orlando,
                 Florida, {USA}, November 7--13, 1998",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  pages =        "????",
  year =         "1998",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "????",
  bibdate =      "Wed Oct 07 08:51:34 1998",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Vassil Alexandrov and J. J. Dongarra",
  booktitle =    "{Recent advances in parallel virtual machine and
                 message passing interface: 5th European {PVM\slash MPI}
                 User's Group Meeting, Liverpool, UK, September 7--9,
                 1998: Proceedings}",
  title =        "{Recent advances in parallel virtual machine and
                 message passing interface: 5th European {PVM\slash MPI}
                 User's Group Meeting, Liverpool, UK, September 7--9,
                 1998: Proceedings}",
  volume =       "1497",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xii + 412",
  year =         "1998",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-65041-5 (softcover)",
  ISBN-13 =      "978-3-540-65041-6 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA267.A1 L43 no.1497",
  bibdate =      "Mon May 3 11:00:13 MDT 1999",
  bibsource =    "",
  note =         "Jointly sponsored by the Computer Science Dept.,
                 University of Liverpool and Oak Ridge National
                 Laboratory.",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "data transmission systems --- congresses; parallel
                 computers --- congresses; virtual computer systems ---
                 congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "John K. Antonio",
  booktitle =    "Proceedings: Seventh Heterogeneous Computing Workshop
                 {(HCW'98)}: March 30, 1998, Orlando, Florida, {USA}",
  title =        "Proceedings: Seventh Heterogeneous Computing Workshop
                 ({HCW}'98): March 30, 1998, Orlando, Florida, {USA}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "ix + 201",
  year =         "1998",
  ISBN =         "0-8186-8365-1, 0-8186-8367-8 (microfiche)",
  ISBN-13 =      "978-0-8186-8365-7, 978-0-8186-8367-1 (microfiche)",
  LCCN =         "QA76.88 .H48 1998",
  bibdate =      "Fri May 27 12:23:42 MDT 2005",
  bibsource =    "",
  note =         "IEEE catalog number 98EX126.",
  acknowledgement = ack-nhfb,
  subject =      "Heterogeneous computing Congresses; heterogeneous
                 computing; HCW; IEEE; parallel processing; naval

  editor =       "E. D'Hollander and others",
  booktitle =    "Parallel computing: fundamentals, applications, and
                 new directions: Papers from {ParCo97}, held in Bonn,
                 Germany, Sept. 19--22, 1997",
  title =        "Parallel computing: fundamentals, applications, and
                 new directions: Papers from {ParCo97}, held in Bonn,
                 Germany, Sept. 19--22, 1997",
  volume =       "12",
  publisher =    pub-ELSEVIER,
  address =      pub-ELSEVIER:adr,
  pages =        "xx + 748",
  year =         "1998",
  ISBN =         "0-444-82882-6",
  ISBN-13 =      "978-0-444-82882-8",
  LCCN =         "QA76.58.P3795 1997",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  series =       "Advances in Parallel Computing",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings: the Seventh {IEEE} International
                 Symposium on High Performance Distributed Computing,
                 July 28--31, 1998, Chicago, Illinois",
  title =        "Proceedings: the Seventh {IEEE} International
                 Symposium on High Performance Distributed Computing,
                 July 28--31, 1998, Chicago, Illinois",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xii + 371",
  year =         "1998",
  ISBN =         "0-8186-8579-4, 0-8186-8581-6",
  ISBN-13 =      "978-0-8186-8579-8, 978-0-8186-8581-1",
  ISSN =         "1082-8907",
  LCCN =         "QA76.9.D5 I157 1998",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  note =         "IEEE Order Plan Catalog Number 98TB100244. IEEE
                 Computer Society Press order number PR08579.",
  acknowledgement = ack-nhfb,
  sponsor =      "IEEE; Computing Society; Technical Committee on
                 Distributed Processing.",

  editor =       "Kyriacos D. Papailiou",
  booktitle =    "Proceedings of the Fourth European Computational Fluid
                 Dynamics Conference, 7--11 September 1998, Athens,
                 Greece",
  title =        "Proceedings of the Fourth European Computational Fluid
                 Dynamics Conference, 7--11 September 1998, Athens,
                 Greece",
  volume =       "2",
  publisher =    pub-WILEY,
  address =      pub-WILEY:adr,
  pages =        "xviii + 1348 + xiv + 870",
  year =         "1998",
  ISBN =         "0-471-98579-1 (vol. 1), 0-471-98580-5 (vol. 2)",
  ISBN-13 =      "978-0-471-98579-2 (vol. 1), 978-0-471-98580-8 (vol.
                 2)",
  LCCN =         "QA911 .E95 1998",
  bibdate =      "Thu Sep 16 09:48:36 MDT 1999",
  bibsource =    "",
  note =         "Three volumes in two books.",
  acknowledgement = ack-nhfb,
  sponsor =      "European Community on Computational Methods in Applied
                 Sciences.",

  editor =       "J. J. Dongarra and E. Luque and Tomas Margalef",
  booktitle =    "{Recent advances in parallel virtual machine and
                 message passing interface: 6th European PVM\slash {MPI}
                 Users' Group Meeting, Barcelona, Spain, September
                 26--29, 1999: Proceedings}",
  title =        "{Recent advances in parallel virtual machine and
                 message passing interface: 6th European PVM\slash {MPI}
                 Users' Group Meeting, Barcelona, Spain, September
                 26--29, 1999: Proceedings}",
  volume =       "1697",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvii + 551",
  year =         "1999",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-66549-8 (softcover)",
  ISBN-13 =      "978-3-540-66549-6 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 E973 1999",
  bibdate =      "Wed Dec 8 06:34:56 MST 1999",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  alttitle =     "PVM\slash MPI '99",
  keywords =     "Data transmission systems; Parallel computers; Virtual
                 computer systems",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Michael T. Heath and Abhiram Ranade and Robert S.
                 Schreiber",
  booktitle =    "{Algorithms for parallel processing: Proceedings of
                 the Workshop on Algorithms for Parallel Processing,
                 held September 16--20, 1996, at the IMA, University of
                 Minnesota}",
  title =        "{Algorithms for parallel processing: Proceedings of
                 the Workshop on Algorithms for Parallel Processing,
                 held September 16--20, 1996, at the IMA, University of
                 Minnesota}",
  volume =       "105",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "x + 366",
  year =         "1999",
  ISBN =         "0-387-98680-4",
  ISBN-13 =      "978-0-387-98680-7",
  LCCN =         "QA76.58 .A543 1999",
  bibdate =      "Tue Feb 7 10:45:24 MST 2012",
  bibsource =    "",
  series =       "The IMA volumes in mathematics and its applications",
  URL =          "",
  acknowledgement = ack-nhfb,
  sponsor =      "University of Minnesota; Institute of Mathematics and
                 Its Applications.",
  subject =      "Parallel processing (Electronic computers);
                 Congresses; Computer algorithms",
  tableofcontents = "Models and Mechanisms in Parallel Computation \\
                 A General Purpose Shared-Memory Model For Parallel
                 Computation \\
                 Supporting A Coherent Shared Address Space Across SMP
                 Nodes: An Application-Driven Investigation \\
                 Single-Message Vs. Batch Communication \\
                 Some Simple and Practical Strategies For Parallelism;
                 Discrete and Combinatorial Algorithms \\
                 Locality In Computing Connected Components \\
                 Routing In Optical and Wireless Networks \\
                 Transparent Parallel Transactions On Replicated
                 Autonomous Databases; Mathematics of Parallelizing
                 Compilers \\
                 Mathematical Tools For Loop Transformations: From
                 Systems of Uniform Recurrence Equations To The Polytope
                 Model; Numerical Algorithms \\
                 The Scalability of Mesh Improvement Algorithms \\
                 Data Parallel Performance Optimizations Using Array
                 Aliasing \\
                 Coarsening, Sampling and Smoothing: Elements of The
                 Multilevel Method \\
                 Some Methods Of Parallel Pseudorandom Number Generation
                 / Michael Mascagni 277--288 \\
                 Performance of Parallel Sparse Triangular Solution \\
                 Determining An out-of-core FFT Decomposition Strategy
                 for Parallel Disks by Dynamic Programming; Parallel
                 Computer Systems and Software \\
                 Enabling Department-Scale Supercomputing \\
                 Providing Uniform Dynamic Access To Numerical Software
                 / H. Casanova and J. Dongarra 345--366",

  editor =       "Vicente Hernandez and Jose M. L. M. Palma and J. J.
                 Dongarra",
  booktitle =    "Vector and parallel processing --- {VECPAR} '98: Third
                 International Conference, Porto, Portugal, June 21--23,
                 1998: selected papers and invited talks",
  title =        "Vector and parallel processing --- {VECPAR} '98: Third
                 International Conference, Porto, Portugal, June 21--23,
                 1998: selected papers and invited talks",
  volume =       "1573",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvi + 706",
  year =         "1999",
  ISBN =         "3-540-66228-6 (softcover)",
  ISBN-13 =      "978-3-540-66228-0 (softcover)",
  LCCN =         "QA76.58 .I552 1998 Bar",
  bibdate =      "Mon Sep 13 11:29:25 MDT 1999",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "parallel processing (electronic computers) --
                 congresses; vector processing (computer science) --
                 congresses",

  editor =       "Jos{\'e} M. L. M. Palma and J. J. Dongarra and Vicente
                 Hern{\'a}ndez",
  booktitle =    "{Vector and parallel processing --- VECPAR '98: Third
                 International Conference, Porto, Portugal, June 21--23,
                 1998: selected papers and invited talks}",
  title =        "{Vector and parallel processing --- VECPAR '98: Third
                 International Conference, Porto, Portugal, June 21--23,
                 1998: selected papers and invited talks}",
  volume =       "1573",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvi + 706",
  year =         "1999",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-66228-6 (softcover)",
  ISBN-13 =      "978-3-540-66228-0 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA267.A1 L43 no.1573",
  bibdate =      "Mon Oct 16 18:31:56 MDT 2000",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "parallel processing (electronic computers) --
                 congresses; vector processing (computer science) --
                 congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "John G. Webster",
  booktitle =    "{Wiley} encyclopedia of electrical and electronics
                 engineering",
  title =        "{Wiley} encyclopedia of electrical and electronics
                 engineering",
  publisher =    pub-WILEY,
  address =      pub-WILEY:adr,
  pages =        "vi + 758",
  year =         "1999",
  ISBN =         "0-471-13946-7",
  ISBN-13 =      "978-0-471-13946-1",
  LCCN =         "TK9 .W55 1999",
  bibdate =      "Wed Jan 14 06:05:25 2004",
  bibsource =    "",
  note =         "24 volumes",
  acknowledgement = ack-nhfb,

  editor =       "{ACM}",
  booktitle =    "{SC2000: High Performance Networking and Computing.
                 Dallas Convention Center, Dallas, TX, USA, November
                 4--10, 2000}",
  title =        "{SC2000: High Performance Networking and Computing.
                 Dallas Convention Center, Dallas, TX, USA, November
                 4--10, 2000}",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  pages =        "????",
  year =         "2000",
  ISBN =         "????",
  ISBN-13 =      "????",
  LCCN =         "QA76.88",
  bibdate =      "Thu Feb 24 09:35:00 2000",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "J. J. Dongarra and P{\'e}ter Kacsuk and Norbert
                 Podhorszki",
  booktitle =    "Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 7th European {PVM\slash}
                 {MPI} Users' Group Meeting, Balatonf{\"u}red, Hungary,
                 September 10--13, 2000. Proceedings",
  title =        "Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 7th European {PVM\slash MPI}
                 Users' Group Meeting, Balatonf{\"u}red, Hungary,
                 September 10--13, 2000. Proceedings",
  volume =       "1908",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xv + 364",
  year =         "2000",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-41010-4 (softcover)",
  ISBN-13 =      "978-3-540-41010-2 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .E973 2000",
  bibdate =      "Mon Nov 15 18:39:53 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "data transmission systems -- congresses; parallel
                 computers -- congresses; virtual computer systems --
                 congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "P. Sadayappan",
  booktitle =    "2000 International Workshops on Parallel Processing:
                 proceedings: 21--24 August, 2000, Toronto, Canada",
  title =        "2000 International Workshops on Parallel Processing:
                 proceedings: 21--24 August, 2000, Toronto, Canada",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  year =         "2000",
  ISBN =         "0-7695-0771-9, 0-7695-0773-5 (microfiche)",
  ISBN-13 =      "978-0-7695-0771-2, 978-0-7695-0773-6 (microfiche)",
  LCCN =         "QA76.58 .I575 2000",
  bibdate =      "Fri May 27 08:50:31 2005",
  bibsource =    "",
  note =         "IEEE Computer Society Order Number PR00771.",
  acknowledgement = ack-nhfb,

  editor =       "Adrian M. Tentner",
  booktitle =    "Proceedings of the High Performance Computing
                 Symposium: {HPC 2000: 2000 Advanced Simulation
                 Technologies Conference: Washington D.C., April 16--20,
                 2000, Wyndham City Center Hotel}",
  title =        "Proceedings of the High Performance Computing
                 Symposium: {HPC 2000: 2000 Advanced Simulation
                 Technologies Conference: Washington D.C., April 16--20,
                 2000, Wyndham City Center Hotel}",
  publisher =    "Society for Computer Simulation",
  address =      "San Diego, CA, USA",
  pages =        "ix + 402",
  year =         "2000",
  ISBN =         "1-56555-197-4",
  ISBN-13 =      "978-1-56555-197-8",
  LCCN =         "QA76.88 .H53 2000",
  bibdate =      "Fri May 27 08:56:15 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{ACM}",
  booktitle =    "Proceedings of the {ACM 2001 Java Grande\slash ISCOPE
                 Conference: Palo Alto, Calif., June 2--4, 2001}",
  title =        "Proceedings of the {ACM 2001 Java Grande\slash ISCOPE
                 Conference: Palo Alto, Calif., June 2--4, 2001}",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "vi + 186",
  year =         "2001",
  ISBN =         "1-58113-359-6",
  ISBN-13 =      "978-1-58113-359-2",
  LCCN =         "QA76.9.O35 A26 2001",
  bibdate =      "Mon May 6 06:26:30 MDT 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  keywords =     "Java (computer program language) -- congresses;
                 object-oriented methods (computer science) --
                 congresses",

  editor =       "{ACM}",
  booktitle =    "{SC2001}: High Performance Networking and Computing.
                 Denver, {CO}, November 10--16, 2001",
  title =        "{SC2001}: High Performance Networking and Computing.
                 Denver, {CO}, November 10--16, 2001",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  pages =        "????",
  year =         "2001",
  ISBN =         "1-58113-293-X",
  ISBN-13 =      "978-1-58113-293-9",
  LCCN =         "QA76.88 .S85 2001",
  bibdate =      "Thu Feb 21 18:29:36 2002",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Vassil Alexandrov and Jack J. Dongarra and Benjoe A.
                 Juliano and Ren{\'e} S. Renner and C. J. Kenneth Tan",
  booktitle =    "{Computational science --- ICCS 2001: International
                 Conference, San Francisco, CA, USA, May 28--30, 2001:
                 proceedings, Part I}",
  title =        "{Computational science --- ICCS 2001: International
                 Conference, San Francisco, CA, USA, May 28--30, 2001:
                 proceedings, Part I}",
  volume =       "2073",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxviii + 1306",
  year =         "2001",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-42232-3",
  ISBN-13 =      "978-3-540-42232-7",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2001 v.1-2 (2001); QA267.A1 L43
                 no.2073-2074 Library has v.1-2",
  bibdate =      "Thu Jan 17 11:49:19 MST 2002",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational complexity -- congresses; computer
                 science -- congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Vassil Alexandrov and Jack J. Dongarra and Benjoe A.
                 Juliano and Ren{\'e} S. Renner and C. J. Kenneth Tan",
  booktitle =    "{Computational science --- ICCS 2001: International
                 Conference, San Francisco, CA, USA, May 28--30, 2001:
                 proceedings, Part II}",
  title =        "{Computational science --- ICCS 2001: International
                 Conference, San Francisco, CA, USA, May 28--30, 2001:
                 proceedings, Part II}",
  volume =       "2074",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxviii + 1078",
  year =         "2001",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-42233-1",
  ISBN-13 =      "978-3-540-42233-4",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2001 v.1-2 (2001); QA267.A1 L43
                 no.2073-2074 Library has v.1-2",
  bibdate =      "Thu Jan 17 11:49:19 MST 2002",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational complexity -- congresses; computer
                 science -- congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Ronald F. Boisvert and Ping Tak Peter Tang",
  booktitle =    "The architecture of scientific software: {IFIP
                 TC2/WG2.5 Working Conference on the Architecture of
                 Scientific Software, October 2--4, 2000, Ottawa,
                 Canada}",
  title =        "The architecture of scientific software: {IFIP
                 TC2/WG2.5 Working Conference on the Architecture of
                 Scientific Software, October 2--4, 2000, Ottawa,
                 Canada}",
  volume =       "60",
  publisher =    pub-KLUWER,
  address =      pub-KLUWER:adr,
  pages =        "xx + 358",
  year =         "2001",
  ISBN =         "0-7923-7339-1",
  ISBN-13 =      "978-0-7923-7339-1",
  LCCN =         "QA76.758 .I345 2000",
  bibdate =      "Fri May 27 08:46:38 2005",
  bibsource =    "",
  series =       "IFIP",
  acknowledgement = ack-nhfb,
  tableofcontents = "Preface (p. ix)\\
                 Contributing Authors (p. xv)\\
                 Part I: Large-Scale Systems Integration\\
                 Network-Based Scientific Computing: Elias N. Houstis,
                 Ann Christine Catlin, Ganesh Balakrishnan, Nitesh
                 Dhanjani, GaHyun Park, John R. Rice, Spyros Lalis,
                 Manolis Stamatogiannakis, Catherine E. Houstis (pp.
                 3--28) \\
                 Future Generations of Problem-Solving Environments:
                 Jos{\'e} C. Cunha (pp. 29--38) \\
                 Developing an Architecture to Support the
                 Implementation and Development of Scientific computing
                 Applications: Dorian C. Arnold, Jack Dongarra (pp.
                 39--56) \\
                 PETSc and Overture: Lessons Learned Developing an
                 Interface between Components: Kristopher R. Buschelman,
                 William Gropp, Lois C. McInnes, Barry F. Smith (pp.
                 57--68) \\
                 Component Technology for High-Performance Scientific
                 Simulation Software: Tom Epperly, Scott R. Kohn, Gary
                 Kumfert (pp. 69--86) \\
                 A New Approach to Software Integration Frameworks for
                 Multi-physics Simulation Codes: Eric de Sturler, Jay
                 Hoeflinger, Laxmikant V. Kal{\'e}, Milind Bhandarkar
                 (pp. 87--104) \\
                 Code Coupling using Parallel CORBA Objects: Christophe
                 Ren{\'e}, Thierry Priol, Guillaume All{\'e}on (pp.
                 105--118) \\
                 A Collaborative Code Development Environment for
                 Computational Electro-magnetics: Matthew S. Shields,
                 Omer F. Rana, David W. Walker, David Colby (pp.
                 119--144) \\
                 Part II: The Architecture of Components\\
                 On the Role of Mathematical Abstractions for Scientific
                 Computing: Krister {\AA}hlander, Magne Haveraaen, Hans
                 Z. Munthe-Kaas (pp. 145--158) \\
                 Object-oriented Modeling of Parallel PDE Solvers:
                 Michael Thun{\'e}, Krister {\AA}hlander, Malin
                 Ljungberg, Markus Nord{\'e}n, Kurt Otto, Jarmo
                 Rantakokko (pp. 159--174) \\
                 Broadway: A Software Architecture for Scientific
                 Computing: Samuel Z. Guyer, Calvin Lin (pp. 175--192)
                 \\
                 Formal Methods for High-Performance Linear Algebra
                 Libraries: John A. Gunnels, Robert A. van de Geijn (pp.
                 193--210) \\
                 New Generalized Matrix Data Structures Lead to a
                 Variety of High-Performance Algorithms: Fred G.
                 Gustavson (pp. 211--234) \\
                 A Comprehensive DFT API for Scientific Computing: Ping
                 Tak Peter Tang (pp. 235--256) \\
                 Using A Fortran Interface to POSIX Threads: Richard J.
                 Hanson, Clay P. Breshears, Henry A. Gabb (pp. 257--272)
                 \\
                 Data Management Systems for Scientific Applications:
                 Reagan Moore (pp. 273--284) \\
                 Software Components for Application Development: Arnaud
                 Desitter, Antoine Le Hyaric, Geoff Morgan, Gareth Shaw,
                 Anne E. Trefethen (pp. 285--300) \\
                 Hierarchical Representation and Computation of
                 Approximate Solutions in Scientific Simulations: Wayne
                 H. Enright (pp. 301--316) \\
                 Software Architecture for the Investigation of
                 Controllable Models with Complex Data Sets: Dmitry
                 Belyshev, Vladimir I. Gurman (pp. 317--332) \\
                 A Mixed-Language Programming Methodology for High
                 Performance Java Computing: Vladimir Getov (pp.
                 333--350) \\
                 Part III: Conference Information\\
                 The Architecture of Scientific Software: the Conference
                 (pp. 351--356)\\
                 Index (pp. 357--358)",

  editor =       "Yiannis Cotronis and J. J. Dongarra",
  booktitle =    "{Recent advances in parallel virtual machine and
                 message passing interface: 8th European {PVM\slash MPI}
                 Users' Group Meeting, Santorini\slash Thera, Greece,
                 September 23--26, 2001: Proceedings}",
  title =        "{Recent advances in parallel virtual machine and
                 message passing interface: 8th European {PVM\slash MPI}
                 Users' Group Meeting, Santorini\slash Thera, Greece,
                 September 23--26, 2001: Proceedings}",
  volume =       "2131",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xv + 438",
  year =         "2001",
  CODEN =        "LNCSD9",
  DOI =          "????",
  ISBN =         "3-540-42609-4 (paperback)",
  ISBN-13 =      "978-3-540-42609-7 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 E975 2001; QA267.A1 L43 no.2131",
  bibdate =      "Thu Jan 17 11:49:19 MST 2002",
  bibsource =    "",
  series =       ser-LNCS # " and " # ser-LNAI,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "data transmission systems --- congresses; parallel
                 computers --- congresses; virtual computer systems ---
                 congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "{IEEE}",
  booktitle =    "{IEEE} International Symposium on Network Computing
                 and Applications: {NCA 2001}: proceedings: 8--10
                 October, 2001, Cambridge, Massachusetts, {USA}",
  title =        "{IEEE} International Symposium on Network Computing
                 and Applications: {NCA} 2001: proceedings: 8--10
                 October, 2001, Cambridge, Massachusetts, {USA}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiii + 373",
  year =         "2001",
  ISBN =         "0-7695-1432-4; 0-7695-1433-2 (case); 0-7695-1434-0
                 (microfiche)",
  ISBN-13 =      "978-0-7695-1432-1; 978-0-7695-1433-8 (case);
                 978-0-7695-1434-5 (microfiche)",
  LCCN =         "TK5105.5 .I323 2001",
  bibdate =      "Fri May 27 12:30:51 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Daniel S. Katz",
  booktitle =    "2001 {IEEE} International Conference on Cluster
                 Computing: 8--11 October 2001, Newport Beach,
                 California, {USA}: proceedings",
  title =        "2001 {IEEE} International Conference on Cluster
                 Computing: 8--11 October 2001, Newport Beach,
                 California, {USA}: proceedings",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxii + 460",
  year =         "2001",
  ISBN =         "0-7695-1116-3; 0-7695-1117-1 (bookbroker);
                 0-7695-1118-X (microfiche)",
  ISBN-13 =      "978-0-7695-1116-0; 978-0-7695-1117-7 (bookbroker);
                 978-0-7695-1118-4 (microfiche)",
  ISSN =         "0272-5428",
  LCCN =         "QA76.58 .I38 2001",
  bibdate =      "Fri May 27 12:28:31 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "C. A. (Craig A.) Lee",
  booktitle =    "{Third annual International Workshop on Active
                 Middleware Services proceedings: 6 August 2001, San
                 Francisco, California}",
  title =        "{Third annual International Workshop on Active
                 Middleware Services proceedings: 6 August 2001, San
                 Francisco, California}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "viii + 123",
  year =         "2001",
  ISBN =         "0-7695-1528-2",
  ISBN-13 =      "978-0-7695-1528-1",
  LCCN =         "QA76.76.M54 I58 2001",
  bibdate =      "Fri May 27 08:59:39 2005",
  bibsource =    "",
  note =         "IEEE Computer Society Order Number PR01528.",
  acknowledgement = ack-nhfb,

  editor =       "Jos{\'e} M. L. M. Palma and Jack J. Dongarra and
                 Vicente Hern{\'a}ndez",
  booktitle =    "Vector and parallel processing --- {VECPAR 2000}: 4th
                 International Conference, Porto, Portugal, June 21--23,
                 2000: selected papers and invited talks",
  title =        "Vector and parallel processing --- {VECPAR 2000}: 4th
                 International Conference, Porto, Portugal, June 21--23,
                 2000: selected papers and invited talks",
  volume =       "1981",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvi + 580",
  year =         "2001",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-41999-3 (paperback)",
  ISBN-13 =      "978-3-540-41999-0 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .I552 2000",
  bibdate =      "Wed Sep 11 15:46:08 2002",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "parallel processing (electronic computers) --
                 congresses; vector processing (computer science) --
                 congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "E. Sha",
  booktitle =    "Parallel and distributed computing systems:
                 proceedings of the {ISCA 14th International Conference:
                 Richardson, Texas, USA, August 8--10, 2001}",
  title =        "Parallel and distributed computing systems:
                 proceedings of the {ISCA 14th International Conference:
                 Richardson, Texas, USA, August 8--10, 2001}",
  publisher =    "International Society for Computers and Their
                 Applications",
  address =      "Cary, NC, USA",
  pages =        "viii + 529",
  year =         "2001",
  ISBN =         "1-880843-39-0",
  ISBN-13 =      "978-1-880843-39-0",
  LCCN =         "QA76.58 .I5443 2001",
  bibdate =      "Fri May 27 09:05:08 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Adrian M. Tentner",
  booktitle =    "Proceedings of the High Performance Computing
                 Symposium --- {HPC 2001}: 2001 Advanced Simulation
                 Technologies Conference, Seattle, Washington, April
                 22--26, 2001, Renaissance Madison Hotel",
  title =        "Proceedings of the High Performance Computing
                 Symposium --- {HPC} 2001: 2001 Advanced Simulation
                 Technologies Conference, Seattle, Washington, April
                 22--26, 2001, Renaissance Madison Hotel",
  publisher =    "Simulation Councils, Inc.",
  address =      "San Diego, CA, USA",
  pages =        "viii + 316",
  year =         "2001",
  ISBN =         "1-56555-237-7",
  ISBN-13 =      "978-1-56555-237-1",
  LCCN =         "????",
  bibdate =      "Fri May 27 08:38:29 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  xxpublisher =  "Society for Computer Simulation",

  author =       "James Abello and Panos M. Pardalos and Mauricio G. C.
                 Resende",
  booktitle =    "Handbook of Massive Data Sets",
  title =        "Handbook of Massive Data Sets",
  publisher =    pub-KLUWER,
  address =      pub-KLUWER:adr,
  pages =        "xii + 1223",
  year =         "2002",
  ISBN =         "1-4020-0489-3",
  ISBN-13 =      "978-1-4020-0489-6",
  LCCN =         "QA76.9.D3 H3474 2002",
  bibdate =      "Wed Jan 14 06:38:54 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "William Gropp",
  booktitle =    "Proceedings: 2002 {IEEE} International Conference on
                 Cluster Computing, 23--26 September 2002, Chicago,
                 Illinois",
  title =        "Proceedings: 2002 {IEEE} International Conference on
                 Cluster Computing, 23--26 September 2002, Chicago,
                 Illinois",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xv + 501",
  year =         "2002",
  ISBN =         "0-7695-1745-5",
  ISBN-13 =      "978-0-7695-1745-2",
  LCCN =         "QA76.58 .I38 2002",
  bibdate =      "Fri May 27 12:33:24 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "{CCGrid2002: 2nd IEEE\slash ACM International
                 Symposium on Cluster Computing and the Grid:
                 proceedings: May 21--24, 2002, Berlin, Germany}",
  title =        "{CCGrid2002: 2nd IEEE\slash ACM International
                 Symposium on Cluster Computing and the Grid:
                 proceedings: May 21--24, 2002, Berlin, Germany}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xxii + 479",
  year =         "2002",
  ISBN =         "0-7695-1582-7, 0-7695-1583-5 (bookbroker),
                 0-7695-1584-3 (microfiche)",
  ISBN-13 =      "978-0-7695-1582-3, 978-0-7695-1583-0 (bookbroker),
                 978-0-7695-1584-7 (microfiche)",
  LCCN =         "QA76.9.C58 I33 2002a",
  bibdate =      "Fri May 27 12:36:02 2005",
  bibsource =    "",
  note =         "IEEE Computer Society order number PR01582.",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "{HPDC-11 2002: proceedings: 11th IEEE International
                 Symposium on High Performance Distributed Computing:
                 24--26 July, 2002, Edinburgh, Scotland}",
  title =        "{HPDC-11 2002: proceedings: 11th IEEE International
                 Symposium on High Performance Distributed Computing:
                 24--26 July, 2002, Edinburgh, Scotland}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiv + 426",
  year =         "2002",
  ISBN =         "0-7695-1686-6; 0-7695-1688-2 (microfiche)",
  ISBN-13 =      "978-0-7695-1686-8; 978-0-7695-1688-2 (microfiche)",
  LCCN =         "QA76.9.D5I593 2002c",
  bibdate =      "Fri May 27 12:38:00 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings / Fourth Annual International Workshop on
                 Active Middleware Services, {AMS 2002}: 23 July 2002,
                 Edinburgh, United Kingdom",
  title =        "Proceedings / Fourth Annual International Workshop on
                 Active Middleware Services, {AMS} 2002: 23 July 2002,
                 Edinburgh, United Kingdom",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "viii + 99",
  year =         "2002",
  ISBN =         "0-7695-1721-8, 0-7695-1723-4 (microfiche)",
  ISBN-13 =      "978-0-7695-1721-6, 978-0-7695-1723-0 (microfiche)",
  LCCN =         "QA76.76.M54 I58 2002",
  bibdate =      "Fri May 27 09:09:56 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings: 16th International Parallel \&
                 Distributed Processing Symposium: {IPDPS 2002}: 15--19
                 April, 2002, Ft. Lauderdale, Florida, {USA}",
  title =        "Proceedings: 16th International Parallel \&
                 Distributed Processing Symposium: {IPDPS} 2002: 15--19
                 April, 2002, Ft. Lauderdale, Florida, {USA}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xlvii + 270",
  year =         "2002",
  ISBN =         "0-7695-1573-8, 0-7695-1574-6, 0-7695-1575-4",
  ISBN-13 =      "978-0-7695-1573-1, 978-0-7695-1574-8,
                 978-0-7695-1575-5",
  LCCN =         "QA76.58.I583 2002",
  bibdate =      "Wed Jan 14 06:51:18 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  xxbooktitle =  "Proceedings of NSF Next Generation Systems Program
                 Workshop (International Parallel and Distributed
                 Processing Symposium 2002), Fort Lauderdale, FL, April
                 2002",

  editor =       "Dieter Kranzlm{\"u}ller and Peter Kacsuk and Jack
                 Dongarra and Jens Volkert",
  booktitle =    "Recent advances in parallel virtual machine and
                 message passing interface: 9th European {PVM\slash MPI}
                 Users' Group Meeting, Linz, Austria, September
                 29--October 2, 2002: Proceedings",
  title =        "Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 9th European {PVM\slash MPI}
                 Users' Group Meeting, Linz, Austria, September
                 29--October 2, 2002. Proceedings",
  volume =       "2474",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvi + 462",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-44296-0 (softcover)",
  ISBN-13 =      "978-3-540-44296-7 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .E975 2002",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  note =         "Also available via the World Wide Web",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "data transmission systems --- congresses; parallel
                 computers -- congresses; virtual computer systems --
                 congresses",

  editor =       "Burkhard Monien and Rainer Feldmann",
  booktitle =    "{Euro-Par} 2002, parallel processing: 8th
                 International {Euro-Par} Conference, Paderborn,
                 Germany, August 27--30, 2002: proceedings",
  title =        "{Euro-Par} 2002, parallel processing: 8th
                 International {Euro-Par} Conference, Paderborn,
                 Germany, August 27--30, 2002: proceedings",
  volume =       "2400",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxix + 993",
  year =         "2002",
  ISBN =         "3-540-44049-6 (softcover)",
  ISBN-13 =      "978-3-540-44049-9 (softcover)",
  LCCN =         "QA76.58 .I553 2002",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "parallel processing (electronic computers) ---
                 congresses",

  editor =       "Rod Oldehoeft",
  booktitle =    "Special issue on software for high-performance
                 systems: papers from the symposium of the Los Alamos
                 Computer Science Institute, held in Santa Fe, {NM},
                 {USA} on October 15--18, 2001",
  title =        "Special issue on software for high-performance
                 systems: papers from the symposium of the Los Alamos
                 Computer Science Institute, held in Santa Fe, {NM},
                 {USA} on October 15--18, 2001",
  volume =       "23(1)",
  publisher =    pub-KLUWER,
  address =      pub-KLUWER:adr,
  pages =        "128",
  year =         "2002",
  CODEN =        "JOSUED",
  ISSN =         "0920-8542 (print), 1573-0484 (electronic)",
  bibdate =      "Wed Jan 14 07:13:03 2004",
  bibsource =    "",
  series =       "The journal of supercomputing",
  acknowledgement = ack-nhfb,

  editor =       "Manish Parashar",
  booktitle =    "Grid computing --- {GRID} 2002: third international
                 workshop, Baltimore, {MD}, {USA}, November 18, 2002:
                 proceedings",
  title =        "Grid computing --- {GRID} 2002: third international
                 workshop, Baltimore, {MD}, {USA}, November 18, 2002:
                 proceedings",
  volume =       "2536",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xi + 318",
  year =         "2002",
  ISBN =         "3-540-00133-6 (softcover)",
  ISBN-13 =      "978-3-540-00133-1 (softcover)",
  LCCN =         "QA76.9.C58 G74 2002",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  note =         "Also available via the World Wide Web.",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational grids (computer systems) congresses",

  editor =       "Peter M. A. Sloot and C. J. Kenneth Tan and Jack J.
                 Dongarra and Alfons G. Hoekstra",
  booktitle =    "Computational {Science--ICCS 2002}: International
                 Conference, Amsterdam, The Netherlands, April 21--24,
                 2002. Proceedings, Part {I}",
  title =        "Computational Science--{ICCS 2002}: International
                 Conference, Amsterdam, The Netherlands, April 21--24,
                 2002. Proceedings, {Part I}",
  volume =       "2329",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xli + 1095",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-43591-3 (paperback)",
  ISBN-13 =      "978-3-540-43591-4 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2002 pt.1-3 (2002)",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computer science -- congresses",

  editor =       "P. M. A. Sloot and C. J. Kenneth Tan and J. J.
                 Dongarra and A. G. Hoekstra",
  booktitle =    "Computational {Science--ICCS 2002}: International
                 Conference, Amsterdam, The Netherlands, April 21--24,
                 2002. Proceedings, Part {II}",
  title =        "Computational Science--{ICCS 2002}: International
                 Conference, Amsterdam, The Netherlands, April 21--24,
                 2002. Proceedings, {Part II}",
  volume =       "2330",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xli + 1115",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-43593-X (paperback)",
  ISBN-13 =      "978-3-540-43593-8 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2002",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "P. M. A. Sloot and C. J. Kenneth Tan and J. J.
                 Dongarra and A. G. Hoekstra",
  booktitle =    "Computational {Science--ICCS 2002}: International
                 Conference, Amsterdam, The Netherlands, April 21--24,
                 2002. Proceedings, Part {III}",
  title =        "Computational Science--{ICCS 2002}: International
                 Conference, Amsterdam, The Netherlands, April 21--24,
                 2002. Proceedings, {Part III}",
  volume =       "2331",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xli + 1227",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-43594-8 (paperback)",
  ISBN-13 =      "978-3-540-43594-5 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2002",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Roman Wyrzykowski and Jack Dongarra and Marcin
                 Paprzycki and Jerzy Wa{\'s}niewski",
  booktitle =    "Parallel Processing and Applied Mathematics: 4th
                 International Conference, {PPAM 2001}
                 Nal{\k{e}}cz{\'o}w, Poland, September 9--12, 2001.
                 Revised Papers",
  title =        "Parallel Processing and Applied Mathematics: 4th
                 International Conference, {PPAM 2001}
                 Nal{\k{e}}cz{\'o}w, Poland, September 9--12, 2001.
                 Revised Papers",
  volume =       "2328",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xix + 915",
  year =         "2002",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-43792-4 (softcover)",
  ISBN-13 =      "978-3-540-43792-5 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .P69 2001",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "mathematics -- congresses; parallel processing
                 (electronic computers) -- congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "{ACM}",
  booktitle =    "Conference proceedings of the 2003 International
                 Conference on Supercomputing: June 23--26, 2003, San
                 Francisco, California, {USA}",
  title =        "Conference proceedings of the 2003 International
                 Conference on Supercomputing: June 23--26, 2003, San
                 Francisco, California, {USA}",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "x + 370",
  year =         "2003",
  ISBN =         "1-58113-733-8",
  ISBN-13 =      "978-1-58113-733-0",
  LCCN =         "QA76.5 .I547 2003",
  bibdate =      "Tue Jan 13 19:21:39 2004",
  bibsource =    "",
  note =         "ACM order number 415031.",
  acknowledgement = ack-nhfb,

  editor =       "Andrea Clematis",
  booktitle =    "{Eleventh Euromicro Conference on Parallel,
                 Distributed, and Network-Based Processing: proceedings:
                 Genova, Italy, February 5--7, 2003}",
  title =        "{Eleventh Euromicro Conference on Parallel,
                 Distributed, and Network-Based Processing: proceedings:
                 Genova, Italy, February 5--7, 2003}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xiv + 553",
  year =         "2003",
  ISBN =         "0-7695-1875-3",
  ISBN-13 =      "978-0-7695-1875-6",
  ISSN =         "1066-6192",
  LCCN =         "QA76.58",
  bibdate =      "Fri May 27 13:54:43 2005",
  bibsource =    "",
  note =         "IEEE Computer Society Order Number PR01875.",
  acknowledgement = ack-nhfb,

  editor =       "Jack Dongarra and Domenico Laforenza and Salvatore
                 Orlando",
  booktitle =    "Recent advances in parallel virtual machine and
                 message passing interface: 10th European {PVM}\slash
                 {MPI} User's group Meeting, Venice, Italy, September
                 29--October 2, 2003: Proceedings",
  title =        "Recent advances in parallel virtual machine and
                 message passing interface: 10th European {PVM}\slash
                 {MPI} User's group Meeting, Venice, Italy, September
                 29--October 2, 2003: Proceedings",
  volume =       "2840",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xviii + 693",
  year =         "2003",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-20149-1",
  ISBN-13 =      "978-3-540-20149-6",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .E973 2003",
  bibdate =      "Tue Jan 13 19:17:43 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Jack Dongarra and Ian Foster and Geoffrey Fox and
                 William Gropp and Ken Kennedy and Linda Torczon and
                 Andy White",
  booktitle =    "The Sourcebook of Parallel Computing",
  title =        "The Sourcebook of Parallel Computing",
  publisher =    pub-MORGAN-KAUFMANN,
  address =      pub-MORGAN-KAUFMANN:adr,
  pages =        "xvi + 842 + 8",
  year =         "2003",
  ISBN =         "1-55860-871-0",
  ISBN-13 =      "978-1-55860-871-9",
  LCCN =         "QA76.58 S638 2003",
  bibdate =      "Tue Jun 17 13:39:32 2003",
  bibsource =    "",
  price =        "US\$59.95",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Michael Gerndt",
  booktitle =    "Proceedings / Eighth International Workshop on
                 High-Level Parallel Programming Models and Supportive
                 Environments, 22 April 2003, Nice, France: held in
                 conjunction with 17th International Parallel and
                 Distributed Processing Symposium {(IPDPS)}",
  title =        "Proceedings / Eighth International Workshop on
                 High-Level Parallel Programming Models and Supportive
                 Environments, 22 April 2003, Nice, France: held in
                 conjunction with 17th International Parallel and
                 Distributed Processing Symposium ({IPDPS})",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "vii + 97",
  year =         "2003",
  ISBN =         "0-7695-1880-X",
  ISBN-13 =      "978-0-7695-1880-0",
  LCCN =         "QA76.642 .I586 2003",
  bibdate =      "Tue Jan 13 19:30:43 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "{CCGrid2003: 3rd IEEE\slash ACM International
                 Symposium on Cluster Computing and the Grid:
                 proceedings: Tokyo, Japan, 12--15 May, 2003}",
  title =        "{CCGrid2003: 3rd IEEE\slash ACM International
                 Symposium on Cluster Computing and the Grid:
                 proceedings: Tokyo, Japan, 12--15 May, 2003}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xviii + 745",
  year =         "2003",
  ISBN =         "0-7695-1919-9",
  ISBN-13 =      "978-0-7695-1919-7",
  LCCN =         "QA76.9.C58",
  bibdate =      "Fri May 27 13:59:31 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "IEEE",
  booktitle =    "{International Parallel and Distributed Processing
                 Symposium: proceedings: April 22--26, 2003, Nice,
                 France}",
  title =        "{International Parallel and Distributed Processing
                 Symposium: proceedings: April 22--26, 2003, Nice,
                 France}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "lxv + 304",
  year =         "2003",
  ISBN =         "0-7695-1926-1",
  ISBN-13 =      "978-0-7695-1926-5",
  ISSN =         "1530-2075",
  LCCN =         "QA76.58",
  bibdate =      "Fri May 27 13:56:59 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings / {CCGrid 2003, 3rd IEEE/ACM International
                 Symposium on Cluster Computing and the Grid, Tokyo,
                 Japan, 12--15 May 2003}",
  title =        "Proceedings / {CCGrid 2003, 3rd IEEE\slash ACM
                 International Symposium on Cluster Computing and the
                 Grid, Tokyo, Japan, 12--15 May 2003}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xviii + 745",
  year =         "2003",
  ISBN =         "0-7695-1919-9",
  ISBN-13 =      "978-0-7695-1919-7",
  LCCN =         "????",
  bibdate =      "Tue Jan 13 19:26:35 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "Proceedings: 17th International Parallel \&
                 Distributed Processing Symposium: {IPDPS 2003}: 22--26
                 April, 2003, Nice, France",
  title =        "Proceedings: 17th International Parallel \&
                 Distributed Processing Symposium: {IPDPS} 2003: 22--26
                 April, 2003, Nice, France",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "lxv + 304",
  year =         "2003",
  ISBN =         "0-7695-1926-1",
  ISBN-13 =      "978-0-7695-1926-5",
  LCCN =         "QA76.58 .M47 2003",
  bibdate =      "Wed Jan 14 07:03:10 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  keywords =     "International Parallel and Distributed Processing
                 Symposium (IPDPS)",

  editor =       "Harald Kosch and L{\'a}szl{\'o}
                 B{\"o}sz{\"o}rm{\'e}nyi and Hermann Hellwagner",
  booktitle =    "{Euro-Par 2003 parallel processing: 9th International
                 Euro-Par Conference, Klagenfurt, Austria, August
                 26--29, 2003: proceedings}",
  title =        "{Euro-Par 2003 parallel processing: 9th International
                 Euro-Par Conference, Klagenfurt, Austria, August
                 26--29, 2003: proceedings}",
  volume =       "2790",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxxv + 1320",
  year =         "2003",
  ISBN =         "3-540-40788-X",
  ISBN-13 =      "978-3-540-40788-1",
  LCCN =         "QA76.58 .I5443 2003",
  bibdate =      "Wed Jan 14 08:00:35 2004",
  bibsource =    "",
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,

  editor =       "Jarek Nabrzyski and Jennifer M. Schopf and Jan
                 W{\k{e}}glarz",
  booktitle =    "Grid resource management: state of the art and future
                 trends",
  title =        "Grid resource management: state of the art and future
                 trends",
  number =       "ISOR 64",
  publisher =    pub-KLUWER,
  address =      pub-KLUWER:adr,
  pages =        "xxi + 574",
  year =         "2003",
  ISBN =         "1-4020-7575-8",
  ISBN-13 =      "978-1-4020-7575-9",
  LCCN =         "QA76.9.C58 G78 2004",
  bibdate =      "Wed Jan 14 06:59:00 2004",
  bibsource =    "",
  series =       "International series in operations research \&
                 management science",
  acknowledgement = ack-nhfb,
  xxbooktitle =  "Resource Management in the {Grid}",

  editor =       "Jos{\'e} M. L. M. Palma and Jack Dongarra and Vicente
                 Hern{\'a}ndez and A. Augusto Sousa",
  booktitle =    "High performance computing for computational science,
                 {VECPAR 2002}: 5th International Conference, Porto,
                 Portugal, June 26--28, 2002: selected papers and
                 invited talks",
  title =        "High performance computing for computational science,
                 {VECPAR 2002}: 5th International Conference, Porto,
                 Portugal, June 26--28, 2002: selected papers and
                 invited talks",
  volume =       "2565",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvii + 732",
  year =         "2003",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-00852-7 (softcover)",
  ISBN-13 =      "978-3-540-00852-1 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .I552 2002",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "high performance computing --- congresses",
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Peter M. A. Sloot and David Abramson and Alexander V.
                 Bogdanov and Jack J. Dongarra and Albert Y. Zomaya and
                 Yuriy E. Gorbachev",
  booktitle =    "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, Part {I}",
  title =        "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, {Part I}",
  volume =       "2657",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "lv + 1095",
  year =         "2003",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-40194-6 (softcover)",
  ISBN-13 =      "978-3-540-40194-0 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2003 pt.1-4 2003",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational complexity --- congresses; computer
                 science --- congresses",

  editor =       "Peter M. A. Sloot and David Abramson and Alexander V.
                 Bogdanov and Jack J. Dongarra and Albert Y. Zomaya and
                 Yuriy E. Gorbachev",
  booktitle =    "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, Part {II}",
  title =        "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, {Part II}",
  volume =       "2658",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "lv + 1129",
  year =         "2003",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-40195-4 (softcover)",
  ISBN-13 =      "978-3-540-40195-7 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2003 pt.1-4 2003",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational complexity --- congresses; computer
                 science --- congresses",

  editor =       "Peter M. A. Sloot and David Abramson and Alexander V.
                 Bogdanov and Jack J. Dongarra and Albert Y. Zomaya and
                 Yuriy E. Gorbachev",
  booktitle =    "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, Part {III}",
  title =        "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, {Part III}",
  volume =       "2659",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "lv + 1165",
  year =         "2003",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-40196-2 (softcover)",
  ISBN-13 =      "978-3-540-40196-4 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2003 pt.1-4 2003",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational complexity --- congresses; computer
                 science --- congresses",

  editor =       "Peter M. A. Sloot and David Abramson and Alexander V.
                 Bogdanov and Jack J. Dongarra and Albert Y. Zomaya and
                 Yuriy E. Gorbachev",
  booktitle =    "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, Part {IV}",
  title =        "Computational science --- {ICCS 2003}: International
                 Conference, Melbourne, Australia and St. Petersburg,
                 Russia, June 2--4, 2003: Proceedings, {Part IV}",
  volume =       "2660",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "lvi + 1161",
  year =         "2003",
  CODEN =        "LNCSD9",
  ISBN =         "3-540-40197-0 (softcover)",
  ISBN-13 =      "978-3-540-40197-1 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2003 pt.1-4 2003",
  bibdate =      "Thu Aug 21 09:09:03 MDT 2003",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  keywords =     "computational complexity --- congresses; computer
                 science --- congresses",

  editor =       "Hamparsum Bozdogan",
  booktitle =    "Statistical Data Mining and Knowledge Discovery",
  title =        "Statistical Data Mining and Knowledge Discovery",
  publisher =    pub-CRC,
  address =      pub-CRC:adr,
  pages =        "588",
  year =         "2004",
  ISBN =         "1-58488-344-8",
  ISBN-13 =      "978-1-58488-344-9",
  LCCN =         "QA76.9.D343 S685 2004",
  bibdate =      "Tue Jan 13 19:24:46 2004",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Marian Bubak and Geert Dick van Albada and Peter M. A.
                 Sloot and Jack J. Dongarra",
  booktitle =    "Computational {Science--ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, Part {I}",
  title =        "Computational Science--{ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, {Part I}",
  volume =       "3036",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "698",
  year =         "2004",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-22114-X",
  ISBN-13 =      "978-3-540-22114-2",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2004",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Marian Bubak and Geert Dick van Albada and Peter M. A.
                 Sloot and Jack J. Dongarra",
  booktitle =    "Computational {Science--ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, Part {II}",
  title =        "Computational Science--{ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, {Part II}",
  volume =       "3037",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "729",
  year =         "2004",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-22115-8",
  ISBN-13 =      "978-3-540-22115-9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2004",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Marian Bubak and Geert Dick van Albada and Peter M. A.
                 Sloot and Jack J. Dongarra",
  booktitle =    "Computational {Science--ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, Part {III}",
  title =        "Computational Science--{ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, {Part III}",
  volume =       "3038",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "1296",
  year =         "2004",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-22116-6",
  ISBN-13 =      "978-3-540-22116-6",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2004",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Marian Bubak and Geert Dick van Albada and Peter M. A.
                 Sloot and Jack J. Dongarra",
  booktitle =    "Computational {Science--ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, Part {IV}",
  title =        "Computational Science--{ICCS 2004}: 4th International
                 Conference Krak{\'o}w, Poland, June 6--9, 2004
                 Proceedings, {Part IV}",
  volume =       "3039",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "1256",
  year =         "2004",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-22129-8",
  ISBN-13 =      "978-3-540-22129-6",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2004",
  bibdate =      "Tue Nov 16 07:55:23 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Rudolf Eigenmann",
  booktitle =    "{ICPP 2004: 2004 International Conference on Parallel
                 Processing: proceedings: 15--18 August, 2004, Montreal,
                 Quebec, Canada}",
  title =        "{ICPP 2004: 2004 International Conference on Parallel
                 Processing: proceedings: 15--18 August, 2004, Montreal,
                 Quebec, Canada}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xviii + 576",
  year =         "2004",
  ISBN =         "0-7695-2197-5",
  ISBN-13 =      "978-0-7695-2197-8",
  LCCN =         "QA76.6 .I548 2004",
  bibdate =      "Fri May 27 14:08:58 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "{IEEE}",
  booktitle =    "{CCGrid 2004: 2004 IEEE International Symposium on
                 Cluster Computing and the Grid: April 19--22, 2004,
                 Chicago, IL}",
  title =        "{CCGrid 2004: 2004 IEEE International Symposium on
                 Cluster Computing and the Grid: April 19--22, 2004,
                 Chicago, IL}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "vi + 806",
  year =         "2004",
  ISBN =         "0-7803-8430-X",
  ISBN-13 =      "978-0-7803-8430-9",
  LCCN =         "QA76.9.C58 I42 2004",
  bibdate =      "Fri May 27 09:23:44 2005",
  bibsource =    "",
  note =         "IEEE catalog number 04EX836.",
  acknowledgement = ack-nhfb,

  editor =       "IEEE",
  booktitle =    "{18th International Parallel and Distributed
                 Processing Symposium: Santa Fe, New Mexico, April
                 26--30, 2004: proceedings}",
  title =        "{18th International Parallel and Distributed
                 Processing Symposium: Santa Fe, New Mexico, April
                 26--30, 2004: proceedings}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "lvi + 289",
  year =         "2004",
  ISBN =         "0-7695-2132-0",
  ISBN-13 =      "978-0-7695-2132-9",
  LCCN =         "QA76.58",
  bibdate =      "Fri May 27 14:05:16 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "IEEE",
  booktitle =    "{Seventh International Conference on High Performance
                 Computing and Grid in Asia Pacific Region proceedings:
                 Omiya Sonic City, Tokyo, Japan, 20--22 July, 2004}",
  title =        "{Seventh International Conference on High Performance
                 Computing and Grid in Asia Pacific Region proceedings:
                 Omiya Sonic City, Tokyo, Japan, 20--22 July, 2004}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "xviii + 520",
  year =         "2004",
  ISBN =         "0-7695-2138-X",
  ISBN-13 =      "978-0-7695-2138-1",
  LCCN =         "QA76.88",
  bibdate =      "Fri May 27 14:01:15 2005",
  bibsource =    "",
  acknowledgement = ack-nhfb,

  editor =       "Dieter Kranzlm{\"u}ller and P{\'e}ter Kacsuk and Jack
                 J. Dongarra",
  booktitle =    "{Recent advances in parallel virtual machine and
                 message passing interface: 11th European PVM/MPI Users'
                 Group Meeting, Budapest, Hungary, September 19--22,
                 2004: proceedings}",
  title =        "{Recent advances in parallel virtual machine and
                 message passing interface: 11th European PVM/MPI Users'
                 Group Meeting, Budapest, Hungary, September 19--22,
                 2004: proceedings}",
  volume =       "3241",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xiii + 452",
  year =         "2004",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-23163-3",
  ISBN-13 =      "978-3-540-23163-9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .E973 2004",
  bibdate =      "Sat Jun 4 05:55:05 MDT 2005",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  meetingname =  "European PVM/MPI Users' Group Meeting (11th : 2004 :
                 Budapest, Hungary)",
  subject =      "Parallel computers; Congresses; Virtual computer
                 systems; Congresses; Data transmission systems;
                 Congresses",

  editor =       "Ralph H. Sprague",
  booktitle =    "Proceedings of the {37th Annual Hawaii International
                 Conference on System Sciences abstracts and CD-ROM of
                 full papers: 5--8 January, 2004, Big Island, Hawaii}",
  title =        "Proceedings of the {37th Annual Hawaii International
                 Conference on System Sciences abstracts and CD-ROM of
                 full papers: 5--8 January, 2004, Big Island, Hawaii}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "lxxi + 320",
  year =         "2004",
  ISBN =         "0-7695-2056-1",
  ISBN-13 =      "978-0-7695-2056-8",
  LCCN =         "Q350",
  bibdate =      "Fri May 27 09:25:56 2005",
  bibsource =    "",
  note =         "HICSS-37, Hilton Waikoloa Village, Big Island,
                 Hawaii.",
  acknowledgement = ack-nhfb,

  editor =       "Roman Wyrzykowski and Jack Dongarra and Marcin
                 Paprzycki and Jerzy Wa{\'s}niewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 5th
                 International Conference, PPAM 2003, Cz{\k{e}}stochowa,
                 Poland, September 7--10, 2003: Revised Papers}",
  title =        "{Parallel Processing and Applied Mathematics: 5th
                 International Conference, PPAM 2003, Cz{\k{e}}stochowa,
                 Poland, September 7--10, 2003: Revised Papers}",
  volume =       "3019",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xix + 1174",
  year =         "2004",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-21946-3",
  ISBN-13 =      "978-3-540-21946-0",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .P69 2003",
  bibdate =      "Thu Nov 11 19:26:30 MST 2004",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Michel Dayd{\'e} and Jack J. Dongarra and Vicente
                 Hern{\'a}ndez and Jos{\'e} M. L. M. Palma",
  booktitle =    "{High Performance Computing for Computational Science:
                 VECPAR 2004: 6th International Conference Valencia,
                 Spain, June 28--30, 2004 Revised Selected and Invited
                 Papers}",
  title =        "{High Performance Computing for Computational Science:
                 VECPAR 2004: 6th International Conference Valencia,
                 Spain, June 28--30, 2004 Revised Selected and Invited
                 Papers}",
  volume =       "3402",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xi + 732",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-25424-2",
  ISBN-13 =      "978-3-540-25424-9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.88 .V43 2004",
  bibdate =      "Thu Jun 02 07:52:30 2005",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Beniamino {Di Martino} and Dieter Kranzlm{\"u}ller and
                 J. J. Dongarra",
  booktitle =    "{Recent advances in parallel virtual machine and
                 message passing interface: 12th European PVM/MPI User's
                 Group Meeting, Sorrento, Italy, September 18--21, 2005:
                 proceedings}",
  title =        "{Recent advances in parallel virtual machine and
                 message passing interface: 12th European PVM/MPI User's
                 Group Meeting, Sorrento, Italy, September 18--21, 2005:
                 proceedings}",
  volume =       "3666",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xvii + 546",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-29009-5 (paperback)",
  ISBN-13 =      "978-3-540-29009-4 (paperback)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .E973 2005",
  bibdate =      "Wed Apr 5 19:31:25 MDT 2006",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  meetingname =  "European PVM/MPI Users' Group Meeting (12th : 2005 :
                 Sorrento, Italy)",
  subject =      "Parallel computers; Congresses; Virtual computer
                 systems; Data transmission systems",

  editor =       "{IEEE}",
  booktitle =    "{19th International Parallel and Distributed
                 Processing Symposium: proceedings: April 4--8, 2005,
                 Denver, Colorado}",
  title =        "{19th International Parallel and Distributed
                 Processing Symposium: proceedings: April 4--8, 2005,
                 Denver, Colorado}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  pages =        "lv + 311",
  year =         "2005",
  ISBN =         "0-7695-2312-9",
  ISBN-13 =      "978-0-7695-2312-5",
  LCCN =         "QA76.58 .I583 2005",
  bibdate =      "Fri May 27 14:11:22 2005",
  bibsource =    "",
  note =         "IEEE Computer Society Order Number P2312.",
  acknowledgement = ack-nhfb,

  editor =       "Yi Pan and Daoxu Chen and Minyi Guo and Jiannong Cao
                 and Jack J. Dongarra",
  booktitle =    "{Parallel and distributed processing and applications:
                 third international symposium, ISPA 2005, Nanjing,
                 China, November 2--5, 2005: proceedings}",
  title =        "{Parallel and distributed processing and applications:
                 third international symposium, ISPA 2005, Nanjing,
                 China, November 2--5, 2005: proceedings}",
  volume =       "3758",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxiii + 1162",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-29769-3",
  ISBN-13 =      "978-3-540-29769-7",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .I88 2005",
  bibdate =      "Wed Apr 5 09:40:57 MDT 2006",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  meetingname =  "ISPA 2005 (2005: Nanjing Shi, China)",
  subject =      "Parallel processing (Electronic computers);
                 Congresses; Electronic data processing; Distributed
                 processing; Congresses",

  editor =       "Vaidy S. Sunderam and Geert Dick van Albada and Peter
                 M. A. Sloot and Jack J. Dongarra",
  booktitle =    "{Computational science: ICCS 2005: 5th international
                 conference, Atlanta, GA, USA, May 22--25, 2005,
                 proceedings, Part I}",
  title =        "{Computational science: ICCS 2005: 5th international
                 conference, Atlanta, GA, USA, May 22--25, 2005,
                 proceedings, Part I}",
  volume =       "3514",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "lxiii + 1089",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-26032-3 (softcover)",
  ISBN-13 =      "978-3-540-26032-5 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA75.5 .I13 2005",
  bibdate =      "Thu Jun 2 09:16:09 MDT 2005",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Vaidy S. Sunderam and Geert Dick van Albada and Peter
                 M. A. Sloot and Jack J. Dongarra",
  booktitle =    "{Computational science: ICCS 2005: 5th international
                 conference, Atlanta, GA, USA, May 22--25, 2005,
                 proceedings, Part II}",
  title =        "{Computational science: ICCS 2005: 5th international
                 conference, Atlanta, GA, USA, May 22--25, 2005,
                 proceedings, Part II}",
  volume =       "3515",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "????",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-26043-9",
  ISBN-13 =      "978-3-540-26043-1",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "????",
  bibdate =      "Thu Jun 02 07:52:30 2005",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Vaidy S. Sunderam and Geert Dick van Albada and Peter
                 M. A. Sloot and Jack J. Dongarra",
  booktitle =    "{Computational science: ICCS 2005: 5th international
                 conference, Atlanta, GA, USA, May 22--25, 2005,
                 proceedings, Part III}",
  title =        "{Computational science: ICCS 2005: 5th international
                 conference, Atlanta, GA, USA, May 22--25, 2005,
                 proceedings, Part III}",
  volume =       "3516",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "lxiii + 1143",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-26044-7",
  ISBN-13 =      "978-3-540-26044-8",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "????",
  bibdate =      "Thu Jun 02 07:52:30 2005",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Laurence Tianruo Yang and Omer F. Rana and Beniamino
                 {Di Martino} and Jack Dongarra",
  booktitle =    "{High performance computing and communications: first
                 international conference, HPCC 2005, Sorrento, Italy,
                 September 21--23, 2005: proceedings}",
  title =        "{High performance computing and communications: first
                 international conference, HPCC 2005, Sorrento, Italy,
                 September 21--23, 2005: proceedings}",
  volume =       "3726",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxvi + 1116",
  year =         "2005",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-29031-1 (softcover)",
  ISBN-13 =      "978-3-540-29031-5 (softcover)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.88 .H655 2005",
  bibdate =      "Wed Apr 5 19:38:30 MDT 2006",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  meetingname =  "HPCC 2005 (2005 : Sorrento, Italy)",
  subject =      "High performance computing; Congresses",

  editor =       "{ACM}",
  booktitle =    "{SC'06: Conference on High Performance Networking and
                 Computing: proceedings of the 2006 ACM/IEEE conference
                 on Supercomputing, November 11--17, 2006, Tampa
                 Convention Center, Tampa, Florida, USA}",
  title =        "{SC'06: Conference on High Performance Networking and
                 Computing: proceedings of the 2006 ACM/IEEE conference
                 on Supercomputing, November 11--17, 2006, Tampa
                 Convention Center, Tampa, Florida, USA}",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  pages =        "????",
  year =         "2006",
  ISBN =         "0-7695-2700-0",
  ISBN-13 =      "978-0-7695-2700-0",
  LCCN =         "QA76.5 .P742 2006",
  bibdate =      "Thu Nov 8 20:03:51 MST 2007",
  bibsource =    "",
  note =         "Contains one CD-ROM.",
  acknowledgement = ack-nhfb,
  meetingname =  "Conference on High Performance Networking and
                 Computing 2006. Tampa, Florida",

  editor =       "Vassil N. Alexandrov and Geert Dick van Albada and
                 Peter M. A. Sloot and Jack Dongarra",
  booktitle =    "{Computational Science -- ICCS 2006: 6th International
                 Conference, Reading, UK, May 28--31, 2006. Proceedings,
                 Part II}",
  title =        "{Computational Science -- ICCS 2006: 6th International
                 Conference, Reading, UK, May 28--31, 2006. Proceedings,
                 Part II}",
  volume =       "3992",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "154 (est.)",
  year =         "2006",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-34381-4 (print), 3-540-34382-2 (e-book)",
  ISBN-13 =      "978-3-540-34381-3 (print), 978-3-540-34382-0
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:17:29 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Vassil N. Alexandrov and Geert Dick van Albada and
                 Peter M. A. Sloot and Jack Dongarra",
  booktitle =    "{Computational Science -- ICCS 2006: 6th International
                 Conference, Reading, UK, May 28--31, 2006. Proceedings,
                 Part III}",
  title =        "{Computational Science -- ICCS 2006: 6th International
                 Conference, Reading, UK, May 28--31, 2006. Proceedings,
                 Part III}",
  volume =       "3993",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "142 (est.)",
  year =         "2006",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-34383-0 (print), 3-540-34384-9 (e-book)",
  ISBN-13 =      "978-3-540-34383-7 (print), 978-3-540-34384-4
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:17:31 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Vassil N. Alexandrov and Geert Dick van Albada and
                 Peter M. A. Sloot and Jack Dongarra",
  booktitle =    "{Computational Science -- ICCS 2006: 6th International
                 Conference, Reading, UK, May 28--31, 2006, Proceedings,
                 Part IV}",
  title =        "{Computational Science -- ICCS 2006: 6th International
                 Conference, Reading, UK, May 28--31, 2006, Proceedings,
                 Part IV}",
  volume =       "3994",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "155 (est.)",
  year =         "2006",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-34385-7 (print), 3-540-34386-5 (e-book)",
  ISBN-13 =      "978-3-540-34385-1 (print), 978-3-540-34386-8
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:17:32 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Jack Dongarra and Kaj Madsen and Jerzy Wasniewski",
  booktitle =    "{Applied Parallel Computing: State of the Art in
                 Scientific Computing. 7th International Workshop, PARA
                 2004, Lyngby, Denmark, June 20--23, 2004. Revised
                 Selected Papers}",
  title =        "{Applied Parallel Computing: State of the Art in
                 Scientific Computing. 7th International Workshop, PARA
                 2004, Lyngby, Denmark, June 20--23, 2004. Revised
                 Selected Papers}",
  volume =       "3732",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  bookpages =    "xxii + 1174",
  pages =        "????",
  year =         "2006",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-29067-2 (softcover), 3-540-33498-X",
  ISBN-13 =      "978-3-540-29067-4 (softcover), 978-3-540-33498-9",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "QA76.58 .P353 2004",
  bibdate =      "Wed Apr 5 19:40:10 MDT 2006",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Minyi Guo and Laurence T. Yang and Beniamino {Di
                 Martino} and Hans P. Zima and Jack Dongarra and Feilong
                 Tang",
  booktitle =    "{Parallel and Distributed Processing and Applications:
                 4th International Symposium, ISPA 2006, Sorrento,
                 Italy, December 4--6, 2006. Proceedings}",
  title =        "{Parallel and Distributed Processing and Applications:
                 4th International Symposium, ISPA 2006, Sorrento,
                 Italy, December 4--6, 2006. Proceedings}",
  volume =       "4330",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "182 (est.)",
  year =         "2006",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-68067-5 (print), 3-540-68070-5 (e-book)",
  ISBN-13 =      "978-3-540-68067-3 (print), 978-3-540-68070-3
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:24:42 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Bernd Mohr and Jesper Larsson Tr{\"a}ff and Joachim
                 Worringen and Jack Dongarra",
  booktitle =    "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 13th European PVM\slash MPI
                 User's Group Meeting Bonn, Germany, September 17--20,
                 2006 Proceedings}",
  title =        "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 13th European PVM\slash MPI
                 User's Group Meeting Bonn, Germany, September 17--20,
                 2006 Proceedings}",
  volume =       "4192",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "104 (est.)",
  year =         "2006",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-39110-X (print), 3-540-39112-6 (e-book)",
  ISBN-13 =      "978-3-540-39110-4 (print), 978-3-540-39112-8
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:21:40 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  author =       "S. A. Shahzadeh-Fazeli and N. Emad and J. Dongarra",
  editor =       "I. Lirkov and S. Margenov and J. Wasniewski",
  booktitle =    "Large-Scale Scientific Computing",
  title =        "Eigenvalue computation with {NetSolve} global
                 computing system",
  volume =       "3743",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "446--453",
  year =         "2006",
  DOI =          "",
  ISBN =         "3-540-31994-8",
  ISBN-13 =      "978-3-540-31994-8",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  LCCN =         "????",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  classification = "Sozopol, Bulgaria",
  conference-date = "Jun 06-10, 2005",
  conference-name = "5th International Conference on Large-Scale
                 Scientific Computing (LSSC 2005)",
  sponsor =      "Bulgarian Acad Sci, Inst Parallel Proc",

  editor =       "Roman Wyrzykowski and Jack Dongarra and Norbert
                 Meyer and Jerzy Wa{\'s}niewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 6th
                 International Conference, PPAM 2005, Poznan, Poland,
                 September 11--14, 2005, Revised Selected Papers}",
  title =        "{Parallel Processing and Applied Mathematics: 6th
                 International Conference, PPAM 2005, Poznan, Poland,
                 September 11--14, 2005, Revised Selected Papers}",
  volume =       "3911",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxiii + 1126",
  year =         "2006",
  ISBN =         "3-540-34141-2 (softcover)",
  ISBN-13 =      "978-3-540-34141-3 (softcover)",
  LCCN =         "QA76.58 .P69 2005",
  bibdate =      "Tue Jun 13 16:04:54 MDT 2006",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Franck Cappello and Thomas Herault and Jack Dongarra",
  booktitle =    "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 14th European PVM\slash MPI
                 User's Group Meeting, Paris, France, September 30 ---
                 October 3, 2007. Proceedings}",
  title =        "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 14th European PVM\slash MPI
                 User's Group Meeting, Paris, France, September 30 ---
                 October 3, 2007. Proceedings}",
  volume =       "4757",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "116 (est.)",
  year =         "2007",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-75415-6 (print), 3-540-75416-4 (e-book)",
  ISBN-13 =      "978-3-540-75415-2 (print), 978-3-540-75416-9
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:25:09 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Andrew Oram and Greg Wilson",
  booktitle =    "Beautiful Code",
  title =        "Beautiful Code",
  publisher =    pub-ORA,
  address =      pub-ORA:adr,
  pages =        "xxi + 593",
  year =         "2007",
  ISBN =         "0-596-51004-7 (paperback)",
  ISBN-13 =      "978-0-596-51004-6 (paperback)",
  LCCN =         "QA76.758 .B428 2007; QA76.758 .B43 2007; QA76.758 .B48
                 2007",
  bibdate =      "Tue Aug 5 17:53:37 MDT 2008",
  bibsource =    "",
  series =       "Theory in practice",
  URL =          "",
  acknowledgement = ack-nhfb,
  subject =      "Software engineering",
  tableofcontents = "Foreword / Greg Wilson / xv \\
                 Preface / xvii \\
                 1 A Regular Expression Matcher / Brian Kernighan \\
                 The Practice of Programming / 2 \\
                 Implementation / 3 \\
                 Discussion / 4 \\
                 Alternatives / 5 \\
                 Building on It / 6 \\
                 Conclusion / 8 \\
                 2 Subversion's Delta Editor: Interface as Ontology /
                 Karl Fogel / 11 \\
                 Version Control and Tree Transformation / 12 \\
                 Expressing Tree Differences / 16 \\
                 The Delta Editor Interface / 17 \\
                 But Is It Art? / 23 \\
                 Abstraction As a Spectator Sport / 25 \\
                 Conclusions / 27 \\
                 3 The Most Beautiful Code I Never Wrote / Jon Bentley /
                 29 \\
                 The Most Beautiful Code I Ever Wrote / 30 \\
                 More and More with Less and Less / 31 \\
                 Perspective / 36 \\
                 What Is Writing? / 38 \\
                 Conclusion / 39 \\
                 Acknowledgments / 40 \\
                 4 Finding Things / Tim Bray / 41 \\
                 On Time / 41 \\
                 Problem: Weblog Data / 42 \\
                 Problem: Who Fetched What, When? / 50 \\
                 Search in the Large / 55 \\
                 Conclusion / 57 \\
                 5 Correct, Beautiful, Fast (in That Order): Lessons
                 From Designing XML Verifiers / Elliotte Rusty Harold /
                 59 \\
                 The Role of XML Validation / 59 \\
                 The Problem / 60 \\
                 Version 1: The Na{\"\i}ve Implementation / 62 \\
                 Version 2: Imitating the BNF Grammar O(N) / 63 \\
                 Version 3: First Optimization O(log N) / 64 \\
                 Version 4: Second Optimization: Don't Check Twice / 66
                 \\
                 Version 5: Third Optimization O(1) / 68 \\
                 Version 6: Fourth Optimization: Caching / 72 \\
                 The Moral of the Story / 74 \\
                 6 Framework for Integrated Test: Beauty Through
                 Fragility / Michael Feathers / 75 \\
                 An Acceptance Testing Framework In Three Classes / 76
                 \\
                 The Challenge of Framework Design / 78 \\
                 An Open Framework / 79 \\
                 How Simple Can an HTML Parser Be? / 80 \\
                 Conclusion / 83 \\
                 7 Beautiful Tests / Alberto Savoia / 85 \\
                 That Pesky Binary Search / 87 \\
                 Introducing JUnit / 89 \\
                 Nailing Binary Search / 90 \\
                 Conclusion / 102 \\
                 8 On-the-Fly Code Generation for Image Processing /
                 Charles Petzold / 105 \\
                 9 Top Down Operator Precedence / Douglas Crockford /
                 129 \\
                 JavaScript / 130 \\
                 Symbol Table / 131 \\
                 Tokens / 132 \\
                 Precedence / 133 \\
                 Expressions / 134 \\
                 Infix Operators / 134 \\
                 Prefix Operators / 136 \\
                 Assignment Operators / 137 \\
                 Constants / 138 \\
                 Scope / 138 \\
                 Statements / 140 \\
                 Functions / 143 \\
                 Array and Object Literals / 144 \\
                 Things to Do and Think About / 145 \\
                 10 The Quest for an Accelerated Population Count /
                 Henry S. Warren, Jr. / 147 \\
                 Basic Methods / 148 \\
                 Divide and Conquer / 149 \\
                 Other Methods / 151 \\
                 Sum and Difference of Population Counts of Two Words /
                 152 \\
                 Comparing the Population Counts of Two Words / 153 \\
                 Counting the 1-Bits in an Array / 154 \\
                 Applications / 158 \\
                 11 Secure Communication: the Technology of Freedom /
                 Ashish Gulhati / 161 \\
                 The Heart of the Start / 162 \\
                 Untangling the Complexity of Secure Messaging / 163 \\
                 Usability Is the Key / 165 \\
                 The Foundation / 167 \\
                 The Test Suite / 172 \\
                 The Functioning Prototype / 172 \\
                 Cleanup, Plug In, Rock On / 173 \\
                 Hacking in the Himalayas / 177 \\
                 The Invisible Hand Moves / 182 \\
                 Speed Does Matter / 184 \\
                 Communications Privacy for Individual Rights / 185 \\
                 Hacking the Civilization / 185 \\
                 12 Growing Beautiful Code in Bioperl / Lincoln Stein /
                 187 \\
                 BioPerl and the Bio::Graphics Module / 188 \\
                 The Bio::Graphics Design Process / 192 \\
                 Extending Bio::Graphics / 210 \\
                 Conclusions and Lessons Learned / 214 \\
                 13 The Design of the Gene Sorter / Jim Kent / 217 \\
                 The User Interface of the Gene Sorter / 218 \\
                 Maintaining a Dialog with the User over the Web / 219 \\
                 A Little Polymorphism Can Go a Long Way / 221 \\
                 Filtering Down to Just the Relevant Genes / 224 \\
                 Theory of Beautiful Code in the Large / 225 \\
                 Conclusion / 228 \\
                 14 How Elegant Code Evolves With Hardware: The Case of
                 Gaussian Elimination / Jack Dongarra and Piotr Luszczek
                 / 229 \\
                 The Effects of Computer Architectures on Matrix
                 Algorithms / 230 \\
                 A Decompositional Approach / 232 \\
                 A Simple Version / 233 \\
                 Linpack's DGEFA Subroutine / 235 \\
                 Lapack DGETRF / 237 \\
                 Recursive LU / 240 \\
                 ScaLAPACK PDGETRF / 243 \\
                 Multithreading for Multi-Core Systems / 247 \\
                 A Word About the Error Analysis and Operation Count /
                 250 \\
                 Future Directions for Research / 251 \\
                 Further Reading / 252 \\
                 15 The Long-Term Benefits of Beautiful Design / Adam
                 Kolawa / 253 \\
                 My Idea of Beautiful Code / 253 \\
                 Introducing the CERN Library / 254 \\
                 Outer Beauty / 255 \\
                 Inner Beauty / 261 \\
                 Conclusion / 266 \\
                 16 The Linux Kernel Driver Model: the Benefits of
                 Working Together / Greg Kroah-Hartman / 267 \\
                 Humble Beginnings / 268 \\
                 Reduced to Even Smaller Bits / 273 \\
                 Scaling Up to Thousands of Devices / 276 \\
                 Small Objects Loosely Joined / 277 \\
                 17 Another Level of Indirection / Diomidis Spinellis /
                 279 \\
                 From Code to Pointers / 280 \\
                 From Function Arguments to Argument Pointers / 282 \\
                 From Filesystems to Filesystem Layers / 285 \\
                 From Code to a Domain-Specific Language / 287 \\
                 Multiplexing and Demultiplexing / 289 \\
                 Layers Forever? / 290 \\
                 18 Python's Dictionary Implementation: Being All Things
                 To All People / Andrew Kuchling / 293 \\
                 Inside the Dictionary / 295 \\
                 Special Accommodations / 296 \\
                 Collisions / 298 \\
                 Resizing / 299 \\
                 Iterations and Dynamic Changes / 300 \\
                 Conclusion / 301 \\
                 Acknowledgments / 301 \\
                 19 Multidimensional Iterators in NumPy / Travis T.
                 Oliphant / 303 \\
                 Key Challenges in N-Dimensional Array Operations / 304 \\
                 Memory Models for an N-Dimensional Array / 305 \\
                 NumPy Iterator Origins / 307 \\
                 Iterator Design / 307 \\
                 Iterator Interface / 313 \\
                 Iterator Use / 314 \\
                 Conclusion / 318 \\
                 20 A Highly Reliable Enterprise System for NASA's Mars
                 Rover Mission / Ronald Mak / 319 \\
                 The Mission and the Collaborative Information Portal /
                 320 \\
                 Mission Needs / 321 \\
                 System Architecture / 322 \\
                 Case Study: The Streamer Service / 325 \\
                 Reliability / 328 \\
                 Robustness / 336 \\
                 Conclusion / 338 \\
                 21 ERP5: Designing for Maximum Adaptability / Rogerio
                 Atem de Carvalho and Rafael Monnerat / 339 \\
                 General Goals of ERP / 340 \\
                 ERP5 / 340 \\
                 The Underlying Zope Platform / 342 \\
                 ERP5 Project Concepts / 346 \\
                 Coding the ERP5 Project / 347 \\
                 Conclusion / 351 \\
                 22 A Spoonful of Sewage / Bryan Cantrill / 353 \\
                 23 Distributed Programming With Mapreduce / Jeffrey
                 Dean and Sanjay Ghemawat / 371 \\
                 A Motivating Example / 371 \\
                 The MapReduce Programming Model / 374 \\
                 Other MapReduce Examples / 375 \\
                 A Distributed MapReduce Implementation / 377 \\
                 Extensions to the Model / 380 \\
                 Conclusion / 381 \\
                 Further Reading / 381 \\
                 Acknowledgments / 382 \\
                 Appendix: Word Count Solution / 382 \\
                 24 Beautiful Concurrency / Simon Peyton Jones / 385 \\
                 A Simple Example: Bank Accounts / 386 \\
                 Software Transactional Memory / 388 \\
                 The Santa Claus Problem / 396 \\
                 Reflections on Haskell / 404 \\
                 Conclusion / 404 \\
                 Acknowledgments / 406 \\
                 25 Syntactic Abstraction: the Syntax-Case Expander / R.
                 Kent Dybvig / 407 \\
                 Brief Introduction to syntax-case / 411 \\
                 Expansion Algorithm / 413 \\
                 Example / 425 \\
                 Conclusion / 428 \\
                 26 Labor-Saving Architecture: an Object-Oriented
                 Framework for Networked Software / William R. Otte and
                 Douglas C. Schmidt / 429 \\
                 Sample Application: Logging Service / 431 \\
                 Object-Oriented Design of the Logging Server Framework
                 / 433 \\
                 Implementing Sequential Logging Servers / 439 \\
                 Implementing Concurrent Logging Servers / 444 \\
                 Conclusion / 450 \\
                 27 Integrating Business Partners the Restful Way /
                 Andrew Patzer / 451 \\
                 Project Background / 452 \\
                 Exposing Services to External Clients / 452 \\
                 Routing the Service Using the Factory Pattern / 456 \\
                 Exchanging Data Using E-Business Protocols / 457 \\
                 Conclusion / 462 \\
                 28 Beautiful Debugging / Andreas Zeller / 463 \\
                 Debugging a Debugger / 464 \\
                 A Systematic Process / 466 \\
                 A Search Problem / 467 \\
                 Finding the Failure Cause Automatically / 468 \\
                 Delta Debugging / 470 \\
                 Minimizing Input / 472 \\
                 Hunting the Defect / 473 \\
                 A Prototype Problem / 475 \\
                 Conclusion / 476 \\
                 Acknowledgments / 476 \\
                 Further Reading / 476 \\
                 29 Treating Code as an Essay / Yukihiro Matsumoto / 477 \\
                 30 When A Button Is All That Connects You to the World
                 / Arun Mehta / 483 \\
                 Basic Design Model / 484 \\
                 Input Interface / 487 \\
                 Efficiency of the User Interface / 500 \\
                 Download / 500 \\
                 Future Directions / 500 \\
                 31 Emacspeak: the Complete Audio Desktop / T. V. Raman
                 / 503 \\
                 Producing Spoken Output / 504 \\
                 Speech-Enabling Emacs / 505 \\
                 Painless Access to Online Information / 516 \\
                 Summary / 522 \\
                 Acknowledgments / 525 \\
                 32 Code in Motion / Laura Wingerd and Christopher
                 Seiwald / 527 \\
                 On Being ``Bookish'' / 528 \\
                 Alike Looking Alike / 529 \\
                 The Perils of Indentation / 530 \\
                 Navigating Code / 531 \\
                 The Tools We Use / 532 \\
                 DiffMerge's Checkered Past / 534 \\
                 Conclusion / 536 \\
                 Acknowledgments / 536 \\
                 Further Reading / 536 \\
                 33 Writing Programs for ``The Book'' / Brian Hayes /
                 539 \\
                 The Nonroyal Road / 540 \\
                 Warning to Parenthophobes / 540 \\
                 Three in a Row / 541 \\
                 The Slippery Slope / 544 \\
                 The Triangle Inequality / 545 \\
                 Meandering On / 547 \\
                 ``Duh!'' --- I Mean ``Aha!'' / 548 \\
                 Conclusion / 550 \\
                 Further Reading / 550 \\
                 Afterword / Andy Oram / 553 \\
                 Contributors / 555 \\
                 Index / 565",

  editor =       "Leslie Hogben",
  booktitle =    "Handbook of Linear Algebra",
  title =        "Handbook of Linear Algebra",
  publisher =    pub-CHAPMAN-HALL-CRC,
  address =      pub-CHAPMAN-HALL-CRC:adr,
  pages =        "xxx + 1370",
  year =         "2007",
  ISBN =         "1-58488-510-6 (hardcover), 1-4200-1057-3 (e-book)",
  ISBN-13 =      "978-1-58488-510-8 (hardcover), 978-1-4200-1057-2
                 (e-book)",
  LCCN =         "QA184.2 .H36 2007",
  MRclass =      "15-00 (00A20)",
  MRnumber =     "2279160 (2007j:15001)",
  bibdate =      "Fri Nov 21 06:49:56 2014",
  bibsource =    "",
  note =         "Associate editors: Richard Brualdi, Anne Greenbaum and
                 Roy Mathias.",
  series =       "Discrete Mathematics and its Applications (Boca
                 Raton)",
  URL =          "",
  abstract =     "\booktitle{Handbook of Linear Algebra} covers all
                 aspects of linear algebra, including fundamentals,
                 numerical linear algebra, software packages for
                 computation in linear algebra, and various
                 applications, such as quantum computing, control
                 theory, image compression, and computational biology.
                 The author addresses combinatorial Matrix theory and
                 features Matrix notation throughout the text. The book
                 includes a chapter on software that provides extensive
                 coverage of MATLAB, Maple, and Mathematica and contains
                 details of Fortran subroutines available for linear
                 algebra such as LAPACK and ARPACK. Rather than
                 presenting long mathematical proofs, the text provides
                 numerous references for additional information.",
  acknowledgement = ack-nhfb # " and " # ack-rah,
  keywords =     "Maple",
  remark =       "Associate editors: Richard Brualdi, Anne Greenbaum,
                 and Roy Mathias.",
  subject =      "Algebras, Linear",
  tableofcontents = "Preliminaries \\
                 I. Linear algebra \\
                 1: Vectors, matrices and systems of linear equations /
                 Jane Day \\
                 2: Linear independence, span, and bases / Mark Mills \\
                 3: Linear transformations / Francesco Barioli \\
                 4: Determinants and eigenvalues / Luz M. DeAlba \\
                 5: Inner product spaces, orthogonal projection, least
                 squares and singular value decomposition / Lixing Han
                 and Michael Neumann \\
                 6: Canonical forms / Leslie Hogben \\
                 7: Unitary similarity, normal matrices, and spectral
                 theory / Helene Shapiro \\
                 8: Hermitian and positive definite matrices / Wayne
                 Barrett \\
                 9: Nonnegative and stochastic matrices / Uriel G.
                 Rothblum \\
                 10: Partitioned matrices / Robert Reams \\
                 11: Functions of matrices / Nicholas J. Higham \\
                 12: Quadratic, bilinear and sesquilinear forms /
                 Raphael Loewy \\
                 13: Multilinear algebra / J. A. Dias da Silva and
                 Armando Machado \\
                 14: Matrix equalities and inequalities / Michael
                 Tsatsomeros \\
                 15: Matrix perturbation theory / Ren-Cang Li \\
                 16: Pseudospectra / Mark Embree \\
                 17: Singular values and singular value inequalities /
                 Roy Mathias \\
                 18: Numerical range / Chi-Kwong Li \\
                 19: Matrix stability and inertia / Daniel Hershkowitz \\
                 20: Inverse eigenvalue problems / Alberto Borobia \\
                 21: Totally positive and totally negative matrices /
                 Shaun M. Fallat \\
                 22: Linear preserver problems / Peter \v Semrl \\
                 23: Matrices over integral domains / Shmuel Friedland \\
                 24: Similarities of families of matrices / Shmuel
                 Friedland \\
                 25: Max-plus algebra / Marianne Akian, Ravindra Bapat,
                 St{\'e}phane Gaubert \\
                 26: Matrices leaving a cone invariant / Bit-Shun Tam
                 and Hans Schneider \\
                 II. Combinatorial matrix theory and graphs \\
                 27: Combinatorial matrix theory / Richard A. Brualdi \\
                 28: Matrices and graphs / Willem H. Haemers \\
                 29: Digraphs and matrices / Jeffrey L. Stuart \\
                 30: Bipartite graphs and matrices / Bryan L. Shader \\
                 31: Permanents / Ian M. Wanless \\
                 32: D-optimal designs / Michael G. Neubauer and William
                 Watkins \\
                 33: Sign pattern matrices / Frank J. Hall and Zhongshan
                 Li \\
                 34: Multiplicity lists for the eigenvalues of symmetric
                 matrices with a given graph / Charles R. Johnson,
                 Ant{\'o}nio Leal Duarte, and Carlos M. Saiago \\
                 35: Matrix completion problems / Leslie Hogben and Amy
                 Wangsness \\
                 36: Algebraic connectivity / Steve Kirkland \\
                 III. Numerical methods \\
                 37: Vector and matrix norms, error analysis, efficiency
                 and stability / Ralph Byers and Biswa Nath Datta \\
                 38: Matrix factorizations, and direct solution of
                 linear systems / Christopher Beattie \\
                 39: Least squares solution of linear systems / Per
                 Christian Hansen and Hans Bruun Nielsen \\
                 40: Sparse matrix methods / Esmond G. Ng \\
                 41: Iterative solution methods for linear systems /
                 Anne Greenbaum \\
                 42: Symmetric matrix eigenvalue techniques / Ivan
                 Slapni\v car \\
                 43: Unsymmetric matrix eigenvalue techniques / David S.
                 Watkins \\
                 44: The implicitly restarted Arnoldi method / D. C.
                 Sorensen \\
                 45: Computation of the singular value decomposition /
                 Alan Kaylor Cline and Inderjit S. Dhillon \\
                 46: Computing eigenvalues and singular values to high
                 relative accuracy / Zlatko Drma{\v{c}} \\
                 47: Fast matrix multiplication / Dario A. Bini \\
                 48: Structured matrix computations / Michael Ng \\
                 49: Large-scale matrix computations / Roland W. Freund \\
                 IV. Applications \\
                 50: Linear programming / Leonid S. Vaserstein \\
                 51: Semidefinite programming / Henry Wolkowicz \\
                 52: Random vectors and linear statistical models / Simo
                 Puntanen and George P. H. Styan \\
                 53: Multivariate statistical analysis / Simo Puntanen,
                 George A. F. Seber, and George P. H. Styan \\
                 54: Markov chains / Beatrice Meini \\
                 55: Differential equations and stability / Volker
                 Mehrmann and Tatjana Stykel \\
                 56: Dynamical systems and linear algebra / Fritz
                 Colonius and Wolfgang Kliemann \\
                 57: Control theory / Peter Benner \\
                 58: Fourier analysis / Kenneth Howell \\
                 59: Linear algebra and mathematical physics / Lorenzo
                 Sadun \\
                 60: Linear algebra in biomolecular modeling / Zhijun Wu \\
                 61: Coding theory / Joachim Rosenthal and Paul Weiner \\
                 62: Quantum computation / Zijian Diao \\
                 63: Information retrieval and web search / Amy
                 Langville and Carl Meyer \\
                 64: Signal processing / Michael Stewart \\
                 65: Geometry / Mark Hunacek \\
                 66: Some applications of matrices and graphs in
                 Euclidean geometry / Miroslav Fiedler \\
                 67: Matrix groups / Peter J. Cameron \\
                 68: Group representations / Randall Holmes and T. Y.
                 Tam \\
                 69: Nonassociative algebras / Murray R. Bremner, Lucia
                 I. Murakami and Ivan P. Shestakov \\
                 70: Lie algebras / Robert Wilson \\
                 V. Computational software \\
                 71: MATLAB / Steven J. Leon \\
                 72: Linear algebra in Maple / David J. Jeffrey and
                 Robert M. Corless \\
                 73: Mathematica / Heikki Ruskeep{\"a}{\"a} \\
                 74: BLAS / Jack Dongarra, Victor Eijkhout, and Julien
                 Langou \\
                 75: LAPACK / Zhaojun Bai \\
                 76: Use of ARPACK and EIGS / D. C. Sorensen \\
                 77: Summary of Software for Linear Algebra Freely
                 Available on the Web / Jack Dongarra, Victor Eijkhout,
                 Julien Langou \\
                 G-1: Glossary \\
                 H-1: Notation Index",

  editor =       "Bo K{\aa}gstr{\"o}m and Erik Elmroth and Jack Dongarra
                 and Jerzy Wa{\'s}niewski",
  booktitle =    "{Applied Parallel Computing. State of the Art in
                 Scientific Computing: 8th International Workshop, PARA
                 2006, Ume{\aa}, Sweden, June 18--21, 2006, Revised
                 Selected Papers}",
  title =        "{Applied Parallel Computing. State of the Art in
                 Scientific Computing: 8th International Workshop, PARA
                 2006, Ume{\aa}, Sweden, June 18--21, 2006, Revised
                 Selected Papers}",
  volume =       "4699",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "167 (est.)",
  year =         "2007",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-75754-6 (print), 3-540-75755-4 (e-book)",
  ISBN-13 =      "978-3-540-75754-2 (print), 978-3-540-75755-9
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:23:58 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Yong Shi and Geert Dick van Albada and Jack Dongarra
                 and Peter M. A. Sloot",
  booktitle =    "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part I}",
  title =        "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part I}",
  volume =       "4487",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxxvi + 1275 (volume 1 of 4)",
  year =         "2007",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-72583-0 (print), 3-540-72584-9 (e-book)",
  ISBN-13 =      "978-3-540-72583-1 (print), 978-3-540-72584-8
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:19:25 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Yong Shi and Geert Dick van Albada and Jack Dongarra
                 and Peter M. A. Sloot",
  booktitle =    "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part II}",
  title =        "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part II}",
  volume =       "4488",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "153 (est.)",
  year =         "2007",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-72585-7 (print), 3-540-72586-5 (e-book)",
  ISBN-13 =      "978-3-540-72585-5 (print), 978-3-540-72586-2
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:19:26 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Yong Shi and Geert Dick van Albada and Jack Dongarra
                 and Peter M. A. Sloot",
  booktitle =    "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part III}",
  title =        "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part III}",
  volume =       "4489",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "132 (est.)",
  year =         "2007",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-72587-3 (print), 3-540-72588-1 (e-book)",
  ISBN-13 =      "978-3-540-72587-9 (print), 978-3-540-72588-6
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:19:27 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Yong Shi and Geert Dick van Albada and Jack Dongarra
                 and Peter M. A. Sloot",
  booktitle =    "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part IV}",
  title =        "{Computational Science -- ICCS 2007: 7th International
                 Conference, Beijing, China, May 27 --- 30, 2007,
                 Proceedings, Part IV}",
  volume =       "4490",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "149 (est.)",
  year =         "2007",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-72589-X (print), 3-540-72590-3 (e-book)",
  ISBN-13 =      "978-3-540-72589-3 (print), 978-3-540-72590-9
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:19:28 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Marian Bubak and Geert Dick van Albada and Jack
                 Dongarra and Peter M. A. Sloot",
  booktitle =    "{Computational Science -- ICCS 2008: 8th International
                 Conference, Krak{\'o}w, Poland, June 23--25, 2008,
                 Proceedings, Part I}",
  title =        "{Computational Science -- ICCS 2008: 8th International
                 Conference, Krak{\'o}w, Poland, June 23--25, 2008,
                 Proceedings, Part I}",
  volume =       "5101",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "153 (est.)",
  year =         "2008",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-69383-1 (print), 3-540-69384-X (e-book)",
  ISBN-13 =      "978-3-540-69383-3 (print), 978-3-540-69384-0
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:24:07 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Marian Bubak and Geert Dick van Albada and Jack
                 Dongarra and Peter M. A. Sloot",
  booktitle =    "{Computational Science -- ICCS 2008: 8th International
                 Conference, Krak{\'o}w, Poland, June 23--25, 2008,
                 Proceedings, Part II}",
  title =        "{Computational Science -- ICCS 2008: 8th International
                 Conference, Krak{\'o}w, Poland, June 23--25, 2008,
                 Proceedings, Part II}",
  volume =       "5102",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "186 (est.)",
  year =         "2008",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-69386-6 (print), 3-540-69387-4 (e-book)",
  ISBN-13 =      "978-3-540-69386-4 (print), 978-3-540-69387-1
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:24:09 MST 2012",
  bibsource =    "",
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Marian Bubak and Geert Dick van Albada and Jack
                 Dongarra and Peter M. A. Sloot",
  booktitle =    "{Computational science -- ICCS 2008. 8th international
                 conference, Krak{\'o}w, Poland, June 23--25, 2008.
                 Proceedings, Part III}",
  title =        "{Computational science -- ICCS 2008. 8th international
                 conference, Krak{\'o}w, Poland, June 23--25, 2008.
                 Proceedings, Part III}",
  volume =       "5103",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxviii + 758",
  year =         "2008",
  DOI =          "",
  bibdate =      "Sat Sep 4 17:11:23 2010",
  bibsource =    "",
  series =       ser-LNCS,
  ZMnumber =     "1139.68302",
  acknowledgement = ack-nhfb,
  classmath =    "68-06 (Proceedings of conferences (computer science))
                 00B25 (Proceedings of conferences of miscellaneous
                 specific interest)",
  remark =       "For the preceding conference see Zbl 1137.68307, Zbl
                 1137.68308, Zbl 1137.68309 and Zbl 1137.68310.",

  editor =       "Siddhartha Chatterjee",
  booktitle =    "{PPoPP '08: proceedings of the 2008 ACM SIGPLAN
                 Symposium on Principles and Practice of Parallel
                 Programming: Salt Lake City, Utah, USA, February
                 20--23, 2008}",
  title =        "{PPoPP '08: proceedings of the 2008 ACM SIGPLAN
                 Symposium on Principles and Practice of Parallel
                 Programming: Salt Lake City, Utah, USA, February
                 20--23, 2008}",
  publisher =    pub-ACM,
  address =      pub-ACM:adr,
  year =         "2008",
  ISBN =         "1-59593-795-1",
  ISBN-13 =      "978-1-59593-795-7",
  LCCN =         "QA76.642 .A27 2008",
  bibdate =      "Sat Dec 2 07:09:45 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  ajournal =     "PPOPP '08",
  remark =       "Bibliographic Level Mode of Issuance: Monograph.",
  subject =      "Engineering and Applied Sciences; Computer Science",

  author =       "Jack Dongarra and Robert Graybill and William Harrod
                 and Robert Lucas and Ewing Lusk and Piotr Luszczek and
                 Janice Mcmahon and Allan Snavely and Jeffrey Vetter and
                 Katherine Yelick and Sadaf Alam and Omid Khalili and
                 Jeremy Meredith and Mustafa Tikir",
  editor =       "M. V. Zelkowitz",
  booktitle =    "High Performance Computing",
  title =        "{DARPA's HPCS} program: History, models, tools,
                 languages",
  volume =       "72",
  publisher =    pub-ACADEMIC,
  address =      pub-ACADEMIC:adr,
  pages =        "1--100",
  year =         "2008",
  DOI =          "",
  ISBN =         "0-12-374411-3",
  ISBN-13 =      "978-0-12-374411-1",
  ISSN =         "0065-2458",
  LCCN =         "????",
  bibdate =      "Tue Jun 4 08:20:03 MDT 2013",
  bibsource =    "",
  series =       "Advances in Computers",
  acknowledgement = ack-nhfb,

  editor =       "Alexey Lastovetsky and Tahar Kechadi and Jack
                 Dongarra",
  booktitle =    "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 15th European PVM\slash MPI
                 Users' Group Meeting, Dublin, Ireland, September 7--10,
                 2008. Proceedings}",
  title =        "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 15th European PVM\slash MPI
                 Users' Group Meeting, Dublin, Ireland, September 7--10,
                 2008. Proceedings}",
  volume =       "5205",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "129 (est.)",
  year =         "2008",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-87474-7 (print), 3-540-87475-5 (e-book)",
  ISBN-13 =      "978-3-540-87474-4 (print), 978-3-540-87475-1
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:17:37 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Roman Wyrzykowski and Jack Dongarra and Konrad
                 Karczewski and Jerzy Wasniewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 7th
                 International Conference, PPAM 2007, Gdansk, Poland,
                 September 9--12, 2007 Revised Selected Papers}",
  title =        "{Parallel Processing and Applied Mathematics: 7th
                 International Conference, PPAM 2007, Gdansk, Poland,
                 September 9--12, 2007 Revised Selected Papers}",
  volume =       "4967",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "188 (est.)",
  year =         "2008",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-540-68105-1 (print), 3-540-68111-6 (e-book)",
  ISBN-13 =      "978-3-540-68105-2 (print), 978-3-540-68111-3
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:21:08 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Gabrielle Allen and Jaros{\l}aw Nabrzyski and Edward
                 Seidel and Geert Dick van Albada and Jack Dongarra and
                 Peter M. A. Sloot",
  booktitle =    "{Computational science -- ICCS 2009. 9th international
                 conference Baton Rouge, LA, USA, May 25--27, 2009.
                 Proceedings, Part I}",
  title =        "{Computational science -- ICCS 2009. 9th international
                 conference Baton Rouge, LA, USA, May 25--27, 2009.
                 Proceedings, Part I}",
  volume =       "5544",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  year =         "2009",
  DOI =          "",
  bibdate =      "Sat Sep 4 17:11:27 2010",
  bibsource =    "",
  series =       ser-LNCS,
  ZMnumber =     "1162.68300",
  acknowledgement = ack-nhfb,
  classmath =    "{*68-06 (Proceedings of conferences (computer
                 science)) 00B25 (Proceedings of conferences of
                 miscellaneous specific interest) }",
  remark =       "For the preceding conference see Zbl 1139.68300, Zbl
                 1139.68301 and Zbl 1139.68302. For Part II of the
                 proceedings of ICCS 2009 see Zbl 1162.68302.",

  editor =       "Gabrielle Allen and Jaros{\l}aw Nabrzyski and Edward
                 Seidel and Geert Dick van Albada and Jack Dongarra and
                 Peter M. A. Sloot",
  booktitle =    "{Computational science -- ICCS 2009. 9th international
                 conference Baton Rouge, LA, USA, May 25--27, 2009.
                 Proceedings, Part II}",
  title =        "{Computational science -- ICCS 2009. 9th international
                 conference Baton Rouge, LA, USA, May 25--27, 2009.
                 Proceedings, Part II}",
  volume =       "5545",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xxxvii + 921",
  year =         "2009",
  DOI =          "",
  bibdate =      "Sat Sep 4 17:11:30 2010",
  bibsource =    "",
  series =       ser-LNCS,
  ZMnumber =     "1162.68302",
  acknowledgement = ack-nhfb,
  classmath =    "*68-06 (Proceedings of conferences (computer science))
                 00B25 (Proceedings of conferences of miscellaneous
                 specific interest)",
  remark =       "For the preceding conference see Zbl 1139.68300, Zbl
                 1139.68301 and Zbl 1139.68302. For Part I of the
                 proceedings of ICCS 2009 see Zbl 1162.68301.",

  editor =       "Matti Ropo and Jan Westerholm and Jack Dongarra",
  booktitle =    "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 16th European PVM\slash MPI
                 Users' Group Meeting, Espoo, Finland, September 7--10,
                 2009. Proceedings}",
  title =        "{Recent Advances in Parallel Virtual Machine and
                 Message Passing Interface: 16th European PVM\slash MPI
                 Users' Group Meeting, Espoo, Finland, September 7--10,
                 2009. Proceedings}",
  volume =       "5759",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "142 (est.)",
  year =         "2009",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-03769-0 (print), 3-642-03770-4 (e-book)",
  ISBN-13 =      "978-3-642-03769-6 (print), 978-3-642-03770-2
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:20:58 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Adhemar Bultheel and Ronald Cools",
  booktitle =    "{The birth of numerical analysis}",
  title =        "{The birth of numerical analysis}",
  publisher =    pub-WORLD-SCI,
  address =      pub-WORLD-SCI:adr,
  pages =        "xvii + 221",
  year =         "2010",
  ISBN =         "981-283-625-X",
  ISBN-13 =      "978-981-283-625-0",
  LCCN =         "QA297 .B54 2010",
  bibdate =      "Mon Aug 23 11:06:23 MDT 2010",
  bibsource =    ";
  abstract =     "The 1947 paper by John von Neumann and Herman
                 Goldstine, ``Numerical Inverting of Matrices of High
                 Order'' (Bulletin of the AMS, Nov. 1947), is considered
                 as the birth certificate of numerical analysis. Since
                 its publication, the evolution of this domain has been
                 enormous. This book is a unique collection of
                 contributions by researchers who have lived through
                 this evolution, testifying about their personal
                 experiences and sketching the evolution of their
                 respective subdomains since the early years.",
  acknowledgement = ack-nhfb,
  remark =       "Proceedings of a symposium held at the Department of
                 Computer Science of the K.U. Leuven, October 29--30,
                 2007.",
  subject =      "numerical analysis; congresses; history",

  editor =       "Rainer Keller and Edgar Gabriel and Michael Resch and
                 Jack Dongarra",
  booktitle =    "{Recent Advances in the Message Passing Interface:
                 17th European MPI Users' Group Meeting, EuroMPI 2010,
                 Stuttgart, Germany, September 12--15, 2010.
                 Proceedings}",
  title =        "{Recent Advances in the Message Passing Interface:
                 17th European MPI Users' Group Meeting, EuroMPI 2010,
                 Stuttgart, Germany, September 12--15, 2010.
                 Proceedings}",
  volume =       "6305",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "197 (est.)",
  year =         "2010",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-15645-2 (print), 3-642-15646-0 (e-book)",
  ISBN-13 =      "978-3-642-15645-8 (print), 978-3-642-15646-5
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:24:14 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Roman Wyrzykowski and Jack Dongarra and Konrad
                 Karczewski and Jerzy Wasniewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 8th
                 International Conference, PPAM 2009, Wroclaw, Poland,
                 September 13--16, 2009. Revised Selected Papers, Part
                 I}",
  title =        "{Parallel Processing and Applied Mathematics: 8th
                 International Conference, PPAM 2009, Wroclaw, Poland,
                 September 13--16, 2009. Revised Selected Papers, Part
                 I}",
  volume =       "6067",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "195 (est.)",
  year =         "2010",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-14389-X (print), 3-642-14390-3 (e-book)",
  ISBN-13 =      "978-3-642-14389-2 (print), 978-3-642-14390-8
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:19:01 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Roman Wyrzykowski and Jack Dongarra and Konrad
                 Karczewski and Jerzy Wasniewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 8th
                 International Conference, PPAM 2009, Wroclaw, Poland,
                 September 13--16, 2009, Revised Selected Papers, Part
                 II}",
  title =        "{Parallel Processing and Applied Mathematics: 8th
                 International Conference, PPAM 2009, Wroclaw, Poland,
                 September 13--16, 2009, Revised Selected Papers, Part
                 II}",
  volume =       "6068",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "193 (est.)",
  year =         "2010",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-14402-0 (print), 3-642-14403-9 (e-book)",
  ISBN-13 =      "978-3-642-14402-8 (print), 978-3-642-14403-5
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:19:02 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Yiannis Cotronis and Anthony Danalis and Dimitrios S.
                 Nikolopoulos and Jack Dongarra",
  booktitle =    "{Recent Advances in the Message Passing Interface:
                 18th European MPI Users' Group Meeting, EuroMPI 2011,
                 Santorini, Greece, September 18--21, 2011.
                 Proceedings}",
  title =        "{Recent Advances in the Message Passing Interface:
                 18th European MPI Users' Group Meeting, EuroMPI 2011,
                 Santorini, Greece, September 18--21, 2011.
                 Proceedings}",
  volume =       "6960",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "177 (est.)",
  year =         "2011",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-24448-3 (print), 3-642-24449-1 (e-book)",
  ISBN-13 =      "978-3-642-24448-3 (print), 978-3-642-24449-0
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:21:14 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Scott Lathrop and Jim Costa and William Kramer",
  booktitle =    "{SC'11: Proceedings of 2011 International Conference
                 for High Performance Computing, Networking, Storage and
                 Analysis, Seattle, WA, November 12--18 2011}",
  title =        "{SC'11: Proceedings of 2011 International Conference
                 for High Performance Computing, Networking, Storage and
                 Analysis, Seattle, WA, November 12--18 2011}",
  publisher =    pub-ACM # " and " # pub-IEEE,
  address =      pub-ACM:adr # " and " # pub-IEEE:adr,
  pages =        "????",
  year =         "2011",
  ISBN =         "1-4503-0771-X",
  ISBN-13 =      "978-1-4503-0771-0",
  LCCN =         "????",
  bibdate =      "Fri Dec 16 11:11:35 2011",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  xxeditor =     "{ACM}",

  editor =       "Jeffrey Hollingsworth",
  booktitle =    "{SC '12: Proceedings of the International Conference
                 on High Performance Computing, Networking, Storage and
                 Analysis, Salt Lake Convention Center, Salt Lake City,
                 UT, USA, November 10--16, 2012}",
  title =        "{SC '12: Proceedings of the International Conference
                 on High Performance Computing, Networking, Storage and
                 Analysis, Salt Lake Convention Center, Salt Lake City,
                 UT, USA, November 10--16, 2012}",
  publisher =    pub-IEEE,
  address =      pub-IEEE:adr,
  year =         "2012",
  ISBN =         "1-4673-0804-8",
  ISBN-13 =      "978-1-4673-0804-5",
  bibdate =      "Thu Nov 15 07:35:55 2012",
  bibsource =    ";
  acknowledgement = ack-nhfb,

  editor =       "Jesper Larsson Tr{\"a}ff and Siegfried Benkner and
                 Jack J. Dongarra",
  booktitle =    "{Recent Advances in the Message Passing Interface:
                 19th European MPI Users' Group Meeting, EuroMPI 2012,
                 Vienna, Austria, September 23--26, 2012. Proceedings}",
  title =        "{Recent Advances in the Message Passing Interface:
                 19th European MPI Users' Group Meeting, EuroMPI 2012,
                 Vienna, Austria, September 23--26, 2012. Proceedings}",
  volume =       "7490",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "162 (est.)",
  year =         "2012",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-33517-9 (print), 3-642-33518-7 (e-book)",
  ISBN-13 =      "978-3-642-33517-4 (print), 978-3-642-33518-1
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:23:42 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,

  editor =       "Roman Wyrzykowski and Jack Dongarra and Konrad
                 Karczewski and Jerzy Wa{\'s}niewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 9th
                 International Conference, PPAM 2011, Torun, Poland,
                 September 11--14, 2011. Revised Selected Papers, Part
                 I}",
  title =        "{Parallel Processing and Applied Mathematics: 9th
                 International Conference, PPAM 2011, Torun, Poland,
                 September 11--14, 2011. Revised Selected Papers, Part
                 I}",
  volume =       "7203",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "205 (est.)",
  year =         "2012",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-31463-5 (print), 3-642-31464-3 (e-book)",
  ISBN-13 =      "978-3-642-31463-6 (print), 978-3-642-31464-3
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:26:13 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Roman Wyrzykowski and Jack Dongarra and Konrad
                 Karczewski and Jerzy Wa{\'s}niewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 9th
                 International Conference, PPAM 2011, Torun, Poland,
                 September 11--14, 2011. Revised Selected Papers, Part
                 II}",
  title =        "{Parallel Processing and Applied Mathematics: 9th
                 International Conference, PPAM 2011, Torun, Poland,
                 September 11--14, 2011. Revised Selected Papers, Part
                 II}",
  volume =       "7204",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "200 (est.)",
  year =         "2012",
  CODEN =        "LNCSD9",
  DOI =          "",
  ISBN =         "3-642-31499-6 (print), 3-642-31500-3 (e-book)",
  ISBN-13 =      "978-3-642-31499-5 (print), 978-3-642-31500-8
                 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  LCCN =         "????",
  bibdate =      "Wed Dec 19 15:26:14 MST 2012",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  ORCID-numbers = "Dongarra, Jack/0000-0003-3247-1782",

  editor =       "Valeria V. Krzhizhanovskaya and G{\'a}bor
                 Z{\'a}vodszky and Michael H. Lees and Jack J. Dongarra
                 and Peter M. A. Sloot and S{\'e}rgio Brissos and
                 Jo{\~a}o Teixeira",
  booktitle =    "{Computational Science --- ICCS 2020 20th
                 International Conference, Amsterdam, The Netherlands,
                 June 3--5, 2020, Proceedings, Part II}",
  title =        "{Computational Science --- ICCS 2020 20th
                 International Conference, Amsterdam, The Netherlands,
                 June 3--5, 2020, Proceedings, Part II}",
  volume =       "12138",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "xix + 697",
  year =         "2020",
  DOI =          "",
  ISBN =         "3-030-50416-6, 3-030-50417-4 (e-book)",
  ISBN-13 =      "978-3-030-50416-8, 978-3-030-50417-5 (e-book)",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  bibdate =      "Thu Jun 25 08:21:10 2020",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  tableofcontents = "Front Matter / / i--xix \\
                 Modified Binary Tree in the Fast PIES for 2D Problems
                 with Complex Shapes / Andrzej Ku{\.z}elewski, Eugeniusz
                 Zieniuk, Agnieszka Bo{\l}tu{\'c}, Krzysztof Szersze{\'n}
                 / 1--14 \\
                 Generating Random Floating--Point Numbers by Dividing
                 Integers: A Case Study / Fr{\'e}d{\'e}ric Goualard /
                 15--28 \\
                 An Effective Stable Numerical Method for Integrating
                 Highly Oscillating Functions with a Linear Phase /
                 Leonid A. Sevastianov, Konstantin P. Lovetskiy, Dmitry
                 S. Kulyabov / 29--43 \\
                 Fitting Penalized Logistic Regression Models Using QR
                 Factorization / Jacek Klimaszewski, Marcin Korze{\'n} /
                 44--57 \\
                 Uncertainty Quantification in Fractional Stochastic
                 Integro--Differential Equations Using Legendre Wavelet
                 Collocation Method / Abhishek Kumar Singh, Mani Mehra /
                 58--71 \\
                 A Direct High--Order Curvilinear Triangular Mesh
                 Generation Method Using an Advancing Front Technique /
                 Fariba Mohammadi, Shusil Dangi, Suzanne M. Shontz,
                 Cristian A. Linte / 72--85 \\
                 Data--Driven Partial Differential Equations Discovery
                 Approach for the Noised Multi--dimensional Data /
                 Mikhail Maslyaev, Alexander Hvatov, Anna Kalyuzhnaya /
                 86--100 \\
                 Preconditioning Jacobian Systems by Superimposing
                 Diagonal Blocks / M. Ali Rostami, H. Martin B{\"u}cker
                 / 101--115 \\
                 NURBS Curves in Parametric Integral Equations System
                 for Modeling and Solving Boundary Value Problems in
                 Elasticity / Marta Kapturczak, Eugeniusz Zieniuk,
                 Andrzej Ku{\.z}elewski / 116--123 \\
                 Parameterizations and Lagrange Cubics for Fitting
                 Multidimensional Data / Ryszard Kozera, Lyle Noakes,
                 Magdalena Wilko{\l}azka / 124--140 \\
                 Loop Aggregation for Approximate Scientific Computing /
                 June Sallou, Alexandre Gauvain, Johann Bourcier, Benoit
                 Combemale, Jean--Raynald de Dreuzy / 141--155 \\
                 Numerical Computation for a Flow Caused by a
                 High--Speed Traveling Train and a Stationary Overpass /
                 Shotaro Hamato, Masashi Yamakawa, Yongmann M. Chung,
                 Shinichi Asao / 156--169 \\
                 B{\'e}zier Surfaces for Modeling Inclusions in PIES /
                 Agnieszka Bo{\l}tu{\'c}, Eugeniusz Zieniuk, Krzysztof
                 Szersze{\'n}, Andrzej Ku{\.z}elewski / 170--183 \\
                 Impact of Water on Methane Adsorption in Nanopores: A
                 Hybrid GCMC--MD Simulation Study / Ji Zhou, Wenbin
                 Jiang, Mian Lin, Lili Ji, Gaohui Cao / 184--196 \\
                 A Stable Discontinuous Galerkin Based Isogeometric
                 Residual Minimization for the Stokes Problem / Marcin
                 {\L}o{\'s}, Sergio Rojas, Maciej Paszy{\'n}ski, Ignacio
                 Muga, Victor M. Calo / 197--211 \\
                 Numerical Modeling of the Two--Phase Flow of Water with
                 Ice in the Tom River / Vladislava Churuksaeva,
                 Alexander Starchenko / 212--224 \\
                 Remarks on Kaczmarz Algorithm for Solving Consistent
                 and Inconsistent System of Linear Equations / Xinyin
                 Huang, Gang Liu, Qiang Niu / 225--236 \\
                 Investigating the Benefit of FP16--Enabled
                 Mixed--Precision Solvers for Symmetric Positive
                 Definite Matrices Using GPUs / Ahmad Abdelfattah, Stan
                 Tomov, Jack Dongarra / 237--250 \\
                 Simulation Versus an Ordered Fuzzy--Numbers--Driven
                 Approach to the Multi--depot Vehicle Cyclic Routing and
                 Scheduling Problem / Grzegorz Bocewicz, Zbigniew
                 Banaszak, Czeslaw Smutnicki, Katarzyna Rudnik, Marcin
                 Witczak, Robert W{\'o}jcik / 251--266 \\
                 Epigenetic Modification of Genetic Algorithm / Kornel
                 Chrominski, Magdalena Tkacz, Mariusz Boryczka /
                 267--278 \\
                 ITP--KNN: Encrypted Video Flow Identification Based on
                 the Intermittent Traffic Pattern of Video and
                 $K$-Nearest Neighbors Classification / Youting Liu, Shu
                 Li, Chengwei Zhang, Chao Zheng, Yong Sun, Qingyun Liu /
                 279--293 \\
                 DeepAD: A Joint Embedding Approach for Anomaly
                 Detection on Attributed Networks / Dali Zhu, Yuchen Ma,
                 Yinlong Liu / 294--307 \\
                 SciNER: Extracting Named Entities from Scientific
                 Literature / Zhi Hong, Roselyne Tchoua, Kyle Chard, Ian
                 Foster / 308--321 \\
                 GPU--Embedding of kNN--Graph Representing Large and
                 High--Dimensional Data / Bartosz Minch, Mateusz Nowak,
                 Rafa{\l} Wcis{\l}o, Witold Dzwinel / 322--336 \\
                 Evolving Long Short--Term Memory Networks / Vicente
                 Coelho Lobo Neto, Leandro Aparecido Passos, Jo{\~a}o
                 Paulo Papa / 337--350 \\
                 Personality Recognition from Source Code Based on
                 Lexical, Syntactic and Semantic Features / Miko{\l}aj
                 Biel, Marcin Kuta, Jacek Kitowski / 351--363 \\
                 Data Fitting by Exponential Sums with Equal Weights /
                 Petr Chunaev, Ildar Safiullin / 364--371 \\
                 A Combination of Moment Descriptors, Fourier Transform
                 and Matching Measures for Action Recognition Based on
                 Shape / Katarzyna Go{\'s}ciewska, Dariusz Frejlichowski
                 / 372--386 \\
                 Improving Accuracy and Speeding Up Document Image
                 Classification Through Parallel Systems / Javier
                 Ferrando, Juan Luis Dom{\'\i}nguez, Jordi Torres,
                 Ra{\'u}l Garc{\'\i}a, David Garc{\'\i}a, Daniel Garrido
                 et al. / 387--400 \\
                 Computation of the Airborne Contaminant Transport in
                 Urban Area by the Artificial Neural Network / Anna
                 Wawrzynczak, Monika Berendt--Marchel / 401--413 \\
                 Exploring Musical Structure Using Tonnetz Lattice
                 Geometry and LSTMs / Manuchehr Aminian, Eric Kehoe,
                 Xiaofeng Ma, Amy Peterson, Michael Kirby / 414--424 \\
                 Modeling of Anti--tracking Network Based on
                 Convex--Polytope Topology / Changbo Tian, Yongzheng
                 Zhang, Tao Yin / 425--438 \\
                 A Workload Division Differential Privacy Algorithm to
                 Improve the Accuracy for Linear Computations / Jun Li,
                 Huan Ma, Guangjun Wu, Yanqin Zhang, Bingnan Ma, Zhen
                 Hui et al. / 439--452 \\
                 On the Automated Assessment of Open--Source Cyber
                 Threat Intelligence Sources / Andrea Tundis, Samuel
                 Ruppert, Max M{\"u}hlh{\"a}user / 453--467 \\
                 Malicious Domain Detection Based on K--means and SMOTE
                 / Qing Wang, Linyu Li, Bo Jiang, Zhigang Lu, Junrong
                 Liu, Shijie Jian / 468--481 \\
                 Microservice Disaster Crash Recovery: A Weak Global
                 Referential Integrity Management / Maude Manouvrier,
                 Cesare Pautasso, Marta Rukoz / 482--495 \\
                 Hashing Based Prediction for Large--Scale Kernel
                 Machine / Lijing Lu, Rong Yin, Yong Liu, Weiping Wang /
                 496--509 \\
                 Picking Peaches or Squeezing Lemons: Selecting
                 Crowdsourcing Workers for Reducing Cost of Redundancy /
                 Paulina Adamska, Marta Ju{\'z}win, Adam Wierzbicki /
                 510--523 \\
                 Are $n$-gram Categories Helpful in Text Classification?
                 / Jakub Kruczek, Paulina Kruczek, Marcin Kuta /
                 524--537 \\
                 Calculating Reactive Power Compensation for
                 Large--Scale Street Lighting / Sebastian Ernst, Leszek
                 Kotulski, Tomasz Lerch, Micha{\l} Rad, Adam
                 S{\k{e}}dziwy, Igor Wojnicki / 538--550 \\
                 Developing a Decision Support App for Computational
                 Agriculture / Andrew Lewis, Marcus Randall, Ben
                 Stewart--Koster / 551--561 \\
                 Optimal Location of Sensors for Early Detection of
                 Tsunami Waves / Angelie R. Ferrolino, Jose Ernie C.
                 Lope, Renier G. Mendoza / 562--575 \\
                 A Novel Formulation for Inverse Distance Weighting from
                 Weighted Linear Regression / Leonardo Ramos
                 Emmendorfer, Gra{\c{c}}aliz Pereira Dimuro / 576--589
                 \\
                 Addressing the Robustness of Resource Allocation in the
                 Presence of Application and System Irregularities via
                 PEPA Based Modeling / Srishti Srivastava, Ioana
                 Banicescu, William S. Sanders / 590--603 \\
                 An Adaptive Computational Network Model for Strange
                 Loops in Political Evolution in Society / Julia Anten,
                 Jordan Earle, Jan Treur / 604--617 \\
                 Joint Entity Linking for Web Tables with Hybrid
                 Semantic Matching / Jie Xie, Yuhai Lu, Cong Cao,
                 Zhenzhen Li, Yangyang Guan, Yanbing Liu / 618--631 \\
                 A New Coefficient of Rankings Similarity in
                 Decision--Making Problems / Wojciech Sa{\l}abun, Karol
                 Urbaniak / 632--645 \\
                 Innovativeness Analysis of Scholarly Publications by
                 Age Prediction Using Ordinal Regression / Pavel Savov,
                 Adam Jatowt, Radoslaw Nielek / 646--660 \\
                 Advantage of Using Spherical over Cartesian Coordinates
                 in the Chromosome Territories 3D Modeling / Magdalena
                 A. Tkacz, Kornel Chromi{\'n}ski / 661--673 \\
                 Adaptive and Efficient Transfer for Online Remote
                 Visualization of Critical Weather Applications / Preeti
                 Malakar, Vijay Natarajan, Sathish S. Vadhiyar /
                 674--693 \\
                 Back Matter / / 695--697",

  editor =       "Roman Wyrzykowski and Ewa Deelman and Jack Dongarra
                 and Konrad Karczewski",
  booktitle =    "Parallel Processing and Applied Mathematics: {13th
                 International Conference, PPAM 2019, Bialystok, Poland,
                 September 8--11, 2019, Revised Selected Papers, Part
                 I}",
  title =        "Parallel Processing and Applied Mathematics: {13th
                 International Conference, PPAM 2019, Bialystok, Poland,
                 September 8--11, 2019, Revised Selected Papers, Part
                 I}",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  year =         "2020",
  DOI =          "",
  ISBN =         "3-030-43229-7",
  ISBN-13 =      "978-3-030-43229-4",
  ISSN =         "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L =       "0302-9743",
  bibdate =      "Fri Dec 15 11:31:31 2023",
  bibsource =    ";
  series =       ser-LNCS,
  acknowledgement = ack-nhfb,
  keywords =     "posit arithmetic",
  tableofcontents = "Front Matter / i--xxiii \\
                 Numerical Algorithms and Parallel Scientific Computing
                 == Front Matter / 1--1 \\
                 Matthias Korch, Tim Werner / Multi-workgroup Tiling to
                 Improve the Locality of Explicit One-Step Methods for
                 ODE Systems with Limited Access Distance on GPUs /
                 3--12 \\
                 Davor Davidovi{\'c}, Enrique S. Quintana-Ort{\'\i} /
                 Structure-Aware Calculation of Many-Electron Wave
                 Function Overlaps on Multicore Processors / 13--24 \\
                 Charles D. Murray, Tobias Weinzierl / Lazy Stencil
                 Integration in Multigrid Algorithms / 25--37 \\
                 Filip Paw{\l}owski, Bora U{\c{c}}ar, Albert-Jan Yzelman
                 / High Performance Tensor Vector Multiplication on
                 Shared-Memory Systems / 38--48 \\
                 Pawe{\l} Augustynowicz, Andrzej Paszkiewicz / Efficient
                 Modular Squaring in Binary Fields on CPU Supporting AVX
                 and GPU / 49--57 \\
                 Carl Christian Kjelgaard Mikkelsen, Mirko Myllykoski /
                 Parallel Robust Computation of Generalized Eigenvectors
                 of Matrix Pencils / 58--69 \\
                 Mirko Myllykoski, Carl Christian Kjelgaard Mikkelsen /
                 Introduction to StarNEig A Task-Based Library for
                 Solving Nonsymmetric Eigenvalue Problems / 70--81 \\
                 Angelika Schwarz, Carl Christian Kjelgaard Mikkelsen /
                 Robust Task-Parallel Solution of the Triangular
                 Sylvester Equation / 82--92 \\
                 Beata Dmitruk, Przemys{\l}aw Stpiczy{\'n}ski /
                 Vectorized Parallel Solver for Tridiagonal Toeplitz
                 Systems of Linear Equations / 93--103 \\
                 Carola Kruse, Masha Sosonkina, Mario Arioli, Nicolas
                 Tardieu, Ulrich R{\"u}de / Parallel Performance of an
                 Iterative Solver Based on the Golub-Kahan
                 Bidiagonalization / 104--116 \\
                 Linus Seelinger, Anne Reinarz, Robert Scheichl / A
                 High-Performance Implementation of a Robust
                 Preconditioner for Heterogeneous Problems / 117--128
                 \\
                 Viviana Arrigoni, Annalisa Massini / Hybrid Solver for
                 Quasi Block Diagonal Linear Systems / 129--140 \\
                 Michal Krav{\v{c}}enko, Jan Zapletal, Xavier Claeys,
                 Michal Merta / Parallel Adaptive Cross Approximation
                 for the Multi-trace Formulation of Scattering Problems
                 / 141--150 \\
                 Daisuke Takahashi / Implementation of Parallel 3-D Real
                 FFT with 2-D Decomposition on Intel Xeon Phi Clusters /
                 151--161 \\
                 Doru Thom Popovici, Devangi N. Parikh, Daniele G.
                 Spampinato, Tze Meng Low / Exploiting Symmetries of
                 Small Prime-Sized DFTs / 162--173 \\
                 Victor Gergel, Evgeny Kozinov / Parallel Computations
                 for Various Scalarization Schemes in Multicriteria
                 Optimization Problems / 174--184 \\
                 Emerging HPC Architectures \\
                 Front Matter / 185--185 \\
                 Enrico Calore, Alessandro Gabbana, Fabio Rinaldi,
                 Sebastiano Fabio Schifano, Raffaele Tripiccione / Early
                 Performance Assessment of the ThunderX2 Processor for
                 Lattice Based Simulations / 187--198 \\
                 Emerging HPC Architectures \\
                 Mate Cobrnic, Alen Duspara, Leon Dragic, Igor Piljic,
                 Hrvoje Mlinaric, Mario Kovac / An Area Efficient and
                 Reusable HEVC 1D-DCT Hardware Accelerator / 199--208 \\
                 Performance Analysis and Scheduling in HPC Systems \\
                 Front Matter / 209--209 \\
                 M. Yusuf {\"O}zkaya, Anne Benoit, {\"U}mit V.
                 {\c{C}}ataly{\"u}rek / Improving Locality-Aware
                 Scheduling with Acyclic Directed Graph Partitioning /
                 211--223 \\
                 Maciej Drozdowski, Gaurav Singh, J{\k{e}}drzej M.
                 Marsza{\l}kowski / Isoefficiency Maps for Divisible
                 Computations in Hierarchical Memory Systems / 224--234 \\
                 Environments and Frameworks for
                 Parallel/Distributed/Cloud Computing \\
                 Front Matter / 235--235 \\
                 Tim Cramer, Manoel R{\"o}mmer, Boris Kosmynin, Erich
                 Focht, Matthias S. M{\"u}ller / OpenMP Target Device
                 Offloading for the SX-Aurora TSUBASA Vector Engine /
                 237--249 \\
                 Camille Coti, Allen D. Malony / On the Road to DiPOSH:
                 Adventures in High-Performance OpenSHMEM / 250--260 \\
                 Roman Wiatr, Vladyslav Lyutenko, Mi{\l}osz Demczuk,
                 Renata S{\l}ota, Jacek Kitowski / Click-Fraud Detection
                 for Online Advertising / 261--271 \\
                 Adam Smyk, Marek Tudruj, Lukasz Grochal / Parallel
                 Graph Partitioning Optimization Under PEGASUS DA
                 Application Global State Monitoring / 272--286 \\
                 Bartosz Balis, Michal Orzechowski, Krystian Pawlik,
                 Maciej Pawlik, Maciej Malawski / Cloud Infrastructure
                 Automation for Scientific Workflows / 287--297 \\
                 Applications of Parallel Computing \\
                 Front Matter / 299--299 \\
                 Steven W. D. Chien, Ivy B. Peng, Stefano Markidis /
                 Posit NPB: Assessing the Precision Improvement in HPC
                 Scientific Applications / 301--310 \\
                 Lukas Krenz, Leonhard Rannabauer, Michael Bader / A
                 High-Order Discontinuous Galerkin Solver with Dynamic
                 Adaptive Mesh Refinement to Simulate Cloud Formation
                 Processes / 311--323 \\
                 Evgeny Kuznetsov, Nikolay Kondratyuk, Mikhail Logunov,
                 Vsevolod Nikolskiy, Vladimir Stegailov / Performance
                 and Portability of State-of-Art Molecular Dynamics
                 Software on Modern GPUs / 324--334 \\
                 Iosif Meyerov, Alexander Panov, Sergei Bastrakov,
                 Aleksei Bashinov, Evgeny Efimenko, Elena Panova, Igor
                 Surmin, Valentin Volokitin, Arkady Gonoskov /
                 Exploiting Parallelism on Shared Memory in the QED
                 Particle-in-Cell Code PICADOR with Greedy Load
                 Balancing / 335--347 \\
                 Michael Quell, Paul Manstetten, Andreas H{\"o}ssinger,
                 Siegfried Selberherr, Josef Weinbub / Parallelized
                 Construction of Extension Velocities for the Level-Set
                 Method / 348--358 \\
                 Marcin Czajkowski, Krzysztof Jurczuk, Marek Kretowski /
                 Relative Expression Classification Tree. A Preliminary
                 GPU-Based Implementation / 359--369 \\
                 Kamil Halbiniak, Lukasz Szustak, Adam Kulawik, Pawel
                 Gepner / Performance Optimizations for Parallel
                 Modeling of Solidification with Dynamic Intensity of
                 Computation / 370--381 \\
                 Parallel Non-numerical Algorithms \\
                 Front Matter / 383--383 \\
                 Joel Fuentes, Wei-yu Chen, Guei-yuan Lueh, Arturo
                 Garza, Isaac D. Scherson / SIMD-node Transformations
                 for Non-blocking Data Structures / 385--395 \\
                 Parallel Non-numerical Algorithms \\
                 Hironobu Kobayashi, Yasuaki Ito, Koji Nakano / Stained
                 Glass Image Generation Using Voronoi Diagram and Its
                 GPU Acceleration / 396--407 \\
                 Anna Sasak-Oko{\'n} / Modifying Queries Strategy for
                 Graph-Based Speculative Query Execution for RDBMS /
                 408--418 \\
                 Soft Computing with Applications \\
                 Front Matter / 419--419 \\
                 Krzysztof Jurczuk, Marcin Czajkowski, Marek Kretowski /
                 Accelerating GPU-based Evolutionary Induction of
                 Decision Trees --- Fitness Evaluation Reuse / 421--431 \\
                 Hatem Khalloof, Phil Ostheimer, Wilfried Jakob, Shadi
                 Shahoud, Clemens Duepmeier, Veit Hagenmeyer / A
                 Distributed Modular Scalable and Generic Framework for
                 Parallelizing Population-Based Metaheuristics /
                 432--444 \\
                 Danuta Rutkowska, Krzysztof Wiaderek / Parallel
                 Processing of Images Represented by Linguistic
                 Description in Databases / 445--456 \\
                 Wojciech Kwedlo, Micha{\l} {\L}ubowicz / An OpenMP
                 Parallelization of the K-means Algorithm Accelerated
                 Using KD-trees / 457--466 \\
                 W{\l}odzimierz Funika, Pawe{\l} Koperek / Evaluating
                 the Use of Policy Gradient Optimization Approach for
                 Automatic Cloud Resource Provisioning / 467--478 \\
                 {\L}ukasz Karbowiak / Improving Efficiency of Automatic
                 Labeling by Image Transformations on CPU and GPU /
                 479--490 \\
                 Special Session on GPU Computing \\
                 Front Matter / 491--491 \\
                 Takahiro Inoue, Hiroki Tokura, Koji Nakano, Yasuaki Ito
                 / Efficient Triangular Matrix Vector Multiplication on
                 the GPU / 493--504 \\
                 Dominik Ernst, Georg Hager, Jonas Thies, Gerhard
                 Wellein / Performance Engineering for a Tall \& Skinny
                 Matrix Multiplication Kernels on GPUs / 505--515 \\
                 Daichi Mukunoki, Takeshi Ogita, Katsuhisa Ozaki /
                 Reproducible BLAS Routines with Tunable Accuracy Using
                 Ozaki Scheme for Many-Core Architectures / 516--527 \\
                 Tao Chang, Emeric Brun, Christophe Calvin / Portable
                 Monte Carlo Transport Performance Evaluation in the
                 PATMOS Prototype / 528--539 \\
                 Special Session on Parallel Matrix Factorizations \\
                 Front Matter / 541--541 \\
                 Piyush Sao, Ramakrishnan Kannan / Multifrontal
                 Non-negative Matrix Factorization / 543--554 \\
                 Martin Be{\v{c}}ka, Gabriel Ok{\v{s}}a / Preconditioned
                 Jacobi SVD Algorithm Outperforms PDGESVD / 555--566 \\
                 Marek Parfieniuk / A Parallel Factorization for
                 Generating Orthogonal Matrices / 567--578 \\
                 Back Matter / 579--581",

  author =       "Anonymous",
  title =        "{ACM Turing Award} Honors {Jack Dongarra} for
                 Pioneering Concepts and Methods Which Resulted in
                 World-Changing Computations: {Dongarra}'s Algorithms
                 and Software Fueled the Growth of High-Performance
                 Computing and Had Significant Impacts in Many Areas of
                 Computational Science from {AI} to Computer Graphics",
  howpublished = "ACM Web site",
  day =          "29",
  month =        mar,
  year =         "2022",
  bibdate =      "Sat Apr 02 06:19:57 2022",
  bibsource =    ";
  URL =          "",
  acknowledgement = ack-nhfb,

  author =       "Neil Savage",
  title =        "News: Always improving performance",
  journal =      j-CACM,
  volume =       "65",
  number =       "6",
  pages =        "16--18",
  month =        jun,
  year =         "2022",
  CODEN =        "CACMA2",
  DOI =          "",
  ISSN =         "0001-0782 (print), 1557-7317 (electronic)",
  ISSN-L =       "0001-0782",
  bibdate =      "Mon May 23 10:16:43 MDT 2022",
  bibsource =    ";
  URL =          "",
  abstract =     "Jack J. Dongarra is the recipient of the 2021 ACM A.M.
                 Turing Award for his pioneering contributions to
                 numerical algorithms and libraries that enabled
                 high-performance computational software to keep pace
                 with exponential hardware improvements for over
  acknowledgement = ack-nhfb,
  fjournal =     "Communications of the ACM",
  journal-URL =  "",

  editor =       "Roman Wyrzykowski and Jack Dongarra and Ewa Deelman
                 and Konrad Karczewski",
  booktitle =    "{Parallel Processing and Applied Mathematics: 14th
                 International Conference, PPAM 2022, Gdansk, Poland,
                 September 11--14, 2022, Revised Selected Papers, Part
  title =        "{Parallel Processing and Applied Mathematics: 14th
                 International Conference, PPAM 2022, Gdansk, Poland,
                 September 11--14, 2022, Revised Selected Papers, Part
  volume =       "13827",
  publisher =    pub-SV,
  address =      pub-SV:adr,
  pages =        "531",
  year =         "2023",
  DOI =          "",
  ISBN =         "3-031-30441-1, 3-031-30444-6, 3-031-30445-4 (e-book)",
  ISBN-13 =      "978-3-031-30441-5, 978-3-031-30444-6,
                 978-3-031-30445-3 (e-book)",
  LCCN =         "Q334-342",
  bibdate =      "Mon May 1 10:00:38 MDT 2023",
  bibsource =    ";
  series =       ser-LNCS,
  URL =          "",
  acknowledgement = ack-nhfb,
  tableofcontents = "Intro \\
                 Preface \\
                 Organization \\
                 Contents --- Part II \\
                 Contents --- Part I \\
                 I 9th Workshop on Language-Based Parallel Programming
                 (WLPP 2022) \\
                 Kokkos-Based Implementation of MPCD on Heterogeneous
                 Nodes \\
                 1 Introduction \\
                 2 Multi-Particle Collision Dynamics \\
                 3 Implementation with Cabana \\
                 3.1 Collection of Particles in Cells \\
                 3.2 Communication of Required Information \\
                 3.3 Rotation of Velocities \\
                 4 Benchmarks and Discussion \\
                 5 Conclusion and Outlook \\
                 References \\
                 Comparison of Load Balancing Schemes for Asynchronous
                 Many-Task Runtimes \\
                 1 Introduction \\
                 2 Background \\
                 2.1 Lifeline Scheme \\
                 2.2 Hybrid Scheme \\
                 2.3 Nested Fork-Join and Dynamic Independent Tasks \\
                 3 Design and Implementation of Lifeline-Pure Scheme \\
                 4 Experimental Evaluation \\
                 5 Related Work \\
                 6 Conclusions \\
                 References \\
                 New Insights on the Revised Definition of the
                 Performance Portability Metric \\
                 1 Introduction \\
                 2 Definition of the $\Phi$ Metrics \\
                 3 Proportionality \\
                 4 Smith's Article \\
                 5 The Principles \\
                 6 Lossy Metrics \\
                 7 Properties of a Good Metric \\
                 8 Conclusions \\
                 References \\
                 Inferential Statistical Analysis of Performance
                 Portability \\
                 1 Introduction \\
                 2 OpenACC Performance Portability \\
                 3 OpenACC's Observation Statistics \\
                 4 Hypothesis Testing \\
                 4.1 One-sample Wilcoxon Signed-Rank Test \\
                 4.2 Nonparametric Bootstrap \\
                 5 OpenMP, Kokkos, and Raja \\
                 6 Conclusions \\
                 References \\
                 NPDP Benchmark Suite for Loop Tiling Effectiveness
                 Evaluation \\
                 1 Introduction \\
                 2 NPDP Kernels \\
                 3 Related Work \\
                 4 Experimental Study \\
                 5 Conclusion \\
                 References \\
                 Parallel Vectorized Implementations of Compensated
                 Summation Algorithms \\
                 1 Introduction \\
                 2 Compensated Summation Algorithms \\
                 3 Implementation of Parallel Vectorized Algorithms \\
                 4 Results of Experiments \\
                 5 Conclusions and Future Work \\
                 References \\
                 References \\
                 6th Workshop on Models, Algorithms and Methodologies
                 for Hybrid Parallelism in New HPC Systems (MAMHYP 2022) \\
                 Malleability Techniques for HPC Systems \\
                 1 Introduction \\
                 2 ADMIRE Project \\
                 3 FlexMPI \\
                 4 A Malleability Use Case: WaComM++ \\
                 5 Conclusions \\
                 References \\
                 Algorithm and Software Overhead: A Theoretical Approach
                 to Performance Portability \\
                 1 Introduction \\
                 2 The Performance Evaluation Framework \\
                 2.1 Decomposition of a Problem \\
                 2.2 Algorithm",

%%% ====================================================================
%%% Additional cross-referenced works:
  author =       "Anonymous",
  title =        "Book Reviews: 26. {Barrett, Berry, Chan, Demmel,
                 Donato, Dongarra, Eijkhout, Pozo, Romine, and van der
  journal =      j-MATH-COMPUT,
  volume =       "64",
  number =       "211",
  pages =        "??--??",
  month =        jul,
  year =         "1995",
  CODEN =        "MCMPAF",
  ISSN =         "0025-5718 (print), 1088-6842 (electronic)",
  ISSN-L =       "0025-5718",
  bibdate =      "Mon Jul 26 10:22:57 1999",
  bibsource =    ";
  acknowledgement = ack-nhfb,
  fjournal =     "Mathematics of Computation",
  journal-URL =  "",

%%% Last MathSciNet search: Tue Sep 19 12:50:42 2023