IMP model for parallelism

  • A DSL for Integrative Parallel Programming pdf link
    @InProceedings{Eijkhout:ISPDC2014,
      Title                    = {A {DSL} for Integrative Parallel Programming},
      Author                   = {Eijkhout, V.},
      Booktitle                = {Parallel and Distributed Computing (ISPDC), 2014 IEEE 13th International Symposium on},
      Year                     = {2014},
      Month                    = jun,
      Pages                    = {27--34},
      Doi                      = {10.1109/ISPDC.2014.36}
    }
    
  • A Unified Approach to Parallel Programming, pdf link
    @inproceedings{Eijkhout:WCECS:2012,
      author    = {Victor Eijkhout},
      title     = {A Unified Approach to Parallel Programming},
      editor    = {S.I. Ao and Craig Douglas and W.S. Grundfest and Jon Burgstone},
      booktitle = {Proceedings of International Conference on Computer Science and Applications (ICCSA'12)},
      publisher = {Newswood Limited, International Association of Engineers},
      pages     = {78--83},
      year      = {2012},
      note      = {ISBN (Vol I): 978-988-19251-6-9, ISBN (Vol II): 978-988-19252-4-4, ISSN: 2078-0958 (Print), ISSN: 2078-0966 (Online)},
    }
    
  • A Theory of Data Movement in Parallel Computations, pdf link
    @ARTICLE{Eijkhout:ICCS2012,
      author = {Victor Eijkhout},
      title = {A Theory of Data Movement in Parallel Computations},
      journal = {Procedia Computer Science},
      year = {2012},
      volume = {9},
      pages = {236--245},
      note = {Proceedings of the International Conference on Computational
    	Science, ICCS 2012, Also published as technical report
    	TR-12-03 of the Texas Advanced Computing Center, The University of
    	Texas at Austin.},
      doi = {10.1016/j.procs.2012.04.025},
      issn = {1877-0509},
      url = {http://www.sciencedirect.com/science/article/pii/S1877050912001469}
    }
    
  • A Gentle Introduction to the Integrative Model for Parallelism, pdf link
    @techreport{IMP-11,
      author      = {Victor Eijkhout},
      title       = {A gentle introduction to the Integrative Model for Parallelism},
      institution = {Integrative Programming Lab, Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {IMP-11},
      year        = {2014},
    }
    
  • Report on NSF EAGER 1451204, pdf link
    @TechReport{IMP-19,
      Title                    = {Report on {NSF EAGER} 1451204},
      Author                   = {Victor Eijkhout},
      Institution              = {Integrative Programming Lab, Texas Advanced Computing Center,
     The University of Texas at Austin},
      Year                     = {2014},
      Number                   = {IMP-19},
    }
    
  • Definition of a ‘communication avoiding’ compiler in the integrative model, pdf link
    @techreport{IMP-06,
      author      = {Victor Eijkhout},
      title       = {Definition of a `communication avoiding' compiler in the Integrative Model},
      institution = {Integrative Programming Lab, Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {IMP-06},
      year        = {2014},
    }
    

Flame-iterative

  • download link
    FLAME Derivation of the General Minimal Residual Method, with Paolo Bientinesi
    @TECHREPORT{EijkBien:flame-gmres-report,
    author = {Victor Eijkhout and Paolo Bientinesi},
    title = {{FLAME} Derivation of the {General Minimal Residual Method}},
    institution = {Texas Advanced Computing Center, The University of Texas at Austin},
    number = {TR-13-03}
    }
    
  • Incomplete Factorizations in the FLAME Framework, with Paolo Bientinesi. download link
    @techreport{EijkhoutBientinesi2010:ILU,
      author      = {Victor Eijkhout and Paolo Bientinesi},
      title       = {Incomplete Factorizations in the {FLAME} Framework},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {TR-10-04},
      year        = {2010},
    }
    
  • Proof-driven Derivation of Krylov Solver Libraries. With Paolo Bientinesi and Robert van de Geijn. pdf file.
    @techreport{Eijkhout2010:ProofDriven,
      author      = {Victor Eijkhout and Paolo Bientinesi and Robert van de Geijn},
      title       = {Proof-Driven Derivation of {Krylov} Solver Libraries},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {TR-10-02},
      year        = {2010},
      note        = {submitted to SIAM J. Scientific Comput.},
    }
    
  • Towards Mechanical Derivation of Krylov Solver Libraries. With Paolo Bientinesi and Robert van de Geijn. Published in the proceedings of ICCS 2010; also TACC technical report TR-10-01. pdf file
    @article{Eijkhout2010ICCS-krylov,
    author = "Victor Eijkhout and Paolo Bientinesi and Robert van de Geijn",
    title = "Towards mechanical derivation of {Krylov} solver libraries",
    journal = "Procedia Computer Science",
    volume = "1",
    number = "1",
    pages = "1799--1807",
    year = "2010",
    note = "proceedings of ICCS 2010, \url{http://www.sciencedirect.com/science/publication?issn=18770509&volume=1&issue=1}",
    issn = "1877-0509",
    doi = "10.1016/j.procs.2010.04.202",
    url = 
    "http://www.sciencedirect.com/science/article/B9865-506HM1Y-75/2/0011e8957c953ac7c727d4d533ae8dd5"
    }
    
  • Formal correctness proof of mechanically derived Krylov methods, with Paolo Bientinesi, Maggie Myers, and Robert van de Geijn. TACC Technical Report 09-06. pdf file.
    @techreport{Bientinesi2009:correctness,
      author = {Paolo Bientinesi and Victor Eijkhout and Maggie Myers and Robert
    	van de Geijn},
      title = {Formal Correctness Proof of Automatically Derived {Krylov} Methods},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number = {09-06},
      year = {2009},
      keywords = {hoare triples, correctness proof, conjugate gradients, krylov methods}
    }
    
  • Formal derivation of Krylov methods, with Paolo Bientinesi and Robert van de Geijn. TACC Technical Report 08-03. pdf file.
    @techreport{Eijkhout:flame-krylov,
    title = {Formal derivation of {Krylov} methods},
    author = {Victor Eijkhout and Paolo Bientinesi and Robert {van de Geijn}},
    institution = {Texas Advanced Computing Center, The University
        of Texas at Austin},
    number = {TR-08-03}
    }
    

Test Problem Server

  • An On-demand Test Problem Server. With Bill Barth, James Kneeland, Steve Mock, John Peterson. pdf file

Self-Adapting Numerical Software

  • Application of Alternating Decision Trees in Selecting Sparse Linear Solvers. With Sanjukta Bhowmick and others. pdf file
    @INCOLLECTION{Bhowmick2010ADT,
      author = {S. Bhowmick and V. Eijkhout and Y. Freund and E. Fuentes and D. Keyes},
      title = {Application of Alternating Decision Trees in Selecting Sparse Linear
    	Solvers},
      year = {2010},
      booktitle = {Software Automatic Tuning: From Concepts to the State-of-the-Art
    	Results},
      editor = {K. Naono and K. Teranishi and J. Cavazos and R. Suda}
    }
    
  • Machine Learning for Multi-stage Selection of Numerical Methods. With Erika Fuentes. pdf file
    @incollection{EijkFuen2010:multistage,
      author    = {Victor Eijkhout and Erika Fuentes},
      title     = {Machine Learning for Multi-stage Selection of Numerical Methods},
      booktitle = {New Advances in Machine Learning},
      pages     = {117--136},
      publisher = {Intech},
      year      = {2010},
    }
    
  • Multi-stage Learning of Linear Algebra Algorithms, with Erika Fuentes. pdf file
    @inproceedings{EijkFuen:icmla2008,
      author    = {Victor Eijkhout and Erika Fuentes},
      title     = {Multi-stage Learning of Linear Algebra Algorithms},
      booktitle = {International Conference on Machine Learning and its Applications, San Diego, CA, 11-13 December 2008},
      year      = {2008},
    }
    
  • Software Architecture of an Intelligent Recommender System. With Erika Fuentes. pdf file
    @techreport{EijkFuen:architecture,
      author      = {Victor Eijkhout and Erika Fuentes},
      title       = {Software Architecture of an Intelligent Recommender System},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {TR-08-01},
      year        = {2008},
    }
    
  • Application of Machine Learning to the Selection of Sparse Linear Solvers. With Sanjukta Bhowmick et al. pdf file
    @article{Bhowmicketal:application,
      author  = {S. Bhowmick and V. Eijkhout and Y. Freund and E. Fuentes and D. Keyes},
      title   = {Application of Machine Learning to the Selection of Sparse Linear Solvers},
      journal = IJHPCA,
      year    = {2006},
      note    = {submitted},
    }
    
  • A Standard and Software for Numerical Metadata. With Erika Fuentes. pdf file
    @techreport{EijkFuentes:TOMSmetadata,
      author      = {Victor Eijkhout and Erika Fuentes},
      title       = {A Proposed Standard for Numerical Metadata},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {TR-07-01},
      note        = {submitted to ACM TOMS},
    }
    
  • The Component Structure of a Self-Adapting Numerical Software System, with Tom Eidson, Jack Dongarra, Erika Fuentes. pdf file
    @article{EijkFuenEidDong:components2005,
    title = {The Component Structure of a Self-Adapting Numerical Software
      System},
    author = {Victor Eijkhout and Erika Fuentes and
        Thomas Eidson and Jack Dongarra},
    journal = IJPP,
    volume = {33},
    number = {2},
    month = jun,
    year = {2005}
    }
    
  • Self Adapting Linear Algebra Algorithms and Software. With Jim Demmel et al. pdf file
    @article{DemEtAl:ieeeproc2004,
    title = {Self Adapting Linear Algebra Algorithms and Software},
    author = {Jim Demmel and Jack Dongarra and Victor Eijkhout and Erika Fuentes
      and Antoine Petitet and Rich Vuduc and R. Clint Whaley and Katherine Yelick},
    journal = {Proceedings of the IEEE},
    volume = {93},
    number = {2},
    month = feb,
    year =  {2005},
    pages = {293--312},
    issn  = {0018-9219}
    }
    
  • Self-adapting Numerical Software and Automatic Tuning of Heuristics. With Jack Dongarra.
    @inproceedings{DonEij:iccs2003,
      author    = {Jack Dongarra and Victor Eijkhout},
      title     = {Self-adapting Numerical Software and Automatic Tuning of Heuristics},
      booktitle = {Proceedings of the International Conference on Computational Science, June 2--4 2003, St.\ Petersburg (Russia) and Melbourne (Australia)},
      year      = {2003},
    }
    
  • Applying Aspect-Orient Programming Concepts to a Component-based Programming Model. With Tom Eidson and Jack Dongarra. pdf file
    @inproceedings{EidDonEij:ipdps2003,
      author    = {Thomas Eidson and Jack Dongarra and Victor Eijkhout},
      title     = {Applying Aspect-Orient Programming Concepts to a Component-based Programming Model},
      booktitle = {Proceedings of the 17th International Parallel and Distributed Processing Symposium (IPDPS) April 22--26, 2003, Nice, France},
      year      = {2003},
    }
    
  • Self-Adapting Numerical Software for Next Generation Applications. With Jack Dongarra. pdf file
    @article{DonEijk:sans,
    author = {Jack Dongarra and Victor Eijkhout},
    title = {Self-adapting Numerical Software for Next Generation Applications},
    institution = {Innovative Computing Lab, University of Tennessee},
    journal = {Int. J. High Perf. Comput. Appl.},
    volume = {17},
    number = {2},
    pages = {125--131},
    note = {also Lapack Working Note 157, ICL-UT-02-07}
    }
    
  • Seamless access to adaptive solver algorithms. With Dorian Arnold, Jack Dongarra, Susan Blackford, Tinghua Xu. ps file
    @INPROCEEDINGS{Aretal:seamless-sgi,
      AUTHOR={D.C. Arnold and S. Blackford and J. Dongarra and V. Eijkhout
              and T. Xu},
      TITLE={Seamless Access to Adaptive Solver Algorithms},
      BOOKTITLE={SGI Users' Conference},
      PUBLISHER={Academic Computer Center CYFRONET},
      EDITOR={Bubak, M. and Moscinski, J. and Noga, M.},
      MONTH=oct,
      YEAR = {2000},
      PAGES = {23--30}
    }
    

Sparse direct factorizations

  • A Parallel Sparse Direct Solver via Hierarchical DAG Scheduling, with Kyungjoo Kim, pdf file
     
    @techreport{KimEijkhout:2012Sparse,
      author      = {Kyungjoo Kim and Victor Eijkhout},
      title       = {A Parallel Sparse Direct Solver via Hierarchical DAG Scheduling},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {TR-12-05},
      year        = {2012},
    }
    
  • Dense Matrix Computation on a Heterogenous Architecture: A Block Synchronous Approach, with Kyungjoo Kim and Robert van de Geijn, pdf file
     
    @techreport{KimEijkhoutVDG:2012GPU,
      author      = {Kyungjoo Kim and Victor Eijkhout and Robert A. van de Geijn},
      title       = {Dense Matrix Computation on a Heterogenous Architecture: A Block Synchronous Approach},
      institution = {Texas Advanced Computing Center, The University of Texas at Austin},
      number      = {TR-12-04},
      year        = {2012},
    }
    
  • Sparse Direct Factorizations through Unassembled Hyper-Matrices. With Paolo Bientinesi, Kyungjoo Kim, Jason Kurtz, Robert van de Geijn. TACC Technical Report TR-07-2. Submitted to Computer Methods in Applied Mechanics and Engineering. pdf file
    @ARTICLE{Bientinesi:2010uhm,
      author = {Paolo Bientinesi and Victor Eijkhout and Kyungjoo Kim and Jason Kurtz
    	and Robert van de Geijn},
      title = {Sparse Direct Factorizations through Unassembled Hyper-Matrices},
      journal = {Computer Methods in Applied Mechanics and Engineering},
      year = {2010},
      volume = {199},
      pages = {430--438},
      doi = {10.1016/j.cma.2009.07.012}
    }
    

Performance optimization

  • Performance Optimization and Modeling of Blocked Sparse Kernels. With Alfredo Buttari, Julien Langou, Salvatore Filippone. Intl. J. High Perf. Comp. Appls., 2007. Also report number ICL-UT-04-05. pdf file
    @article{ButtEijkLang:spmvp,
      author  = {Alfredo Buttari and Victor Eijkhout and Julien Langou and Salvatore Filippone},
      title   = {Performance Optimization and Modeling of Blocked Sparse Kernels},
      journal = IJHPCA,
      volume  = {21},
      pages   = {467--484},
      year    = {2007},
    }
    

Numerical Linear Algebra

  • The Spike factorization as domain decomposition method; equivalent and variant approaches. With Robert van de Geijn. To appear in a Springer volume dedicated to Ahmed Sameh. pdf file
    @INCOLLECTION{EvdG2011:spike-springer,
      author = {Victor Eijkhout and Robert {van de Geijn}},
      title = {The {Spike} Factorization as Domain Decomposition Method: 
        equivalent and variant approaches},
      booktitle = {High-Performance Scientific Computing: 
        Algorithms and Applications},
      publisher = {Springer Verlag},
      year = {2011},
      editor = {Efstratios Gallopoulos}
    }
    
  • The role of the strengthened Cauchy-Buniakowskii-Schwarz inequality in multilevel methods. With Panayot Vassilevski. In SIAM Review 1991. ps file.
    @article{EijVa:cbs,
    author = {Victor Eijkhout and Panayot Vassilevski},
    title = {The role of the strengthened {Cauchy-Buniakowskii-Schwarz}
        inequality in multilevel methods},
    journal = {SIAM Review},
    year = {1991},
    volume = {33},
    pages = {405--419},
    keywords = {algebraic multilevel, Cauchy-Schwarz inequality,
    	finite elements}
    }
    
  • A matrix framework for Conjugate Gradients methods and some variants of CG with less synchronization overhead. With Ed D'Azevedo and Chuck Romine. In SIAM Parallel Processing proceedings, 1993. pdf file
    @inproceedings{DAzEijRo:ppscicomp,
    author = {E.F. D'Azevedo and V.L. Eijkhout and C.H. Romine},
    title = {A Matrix Framework for Conjugate Gradient Methods and
             Some Variants of CG with Less Synchronization Overhead},
    booktitle = {Proceedings of the Sixth SIAM Conference
             on Parallel Processing for Scientific Computing},
    publisher = {SIAM},
    address = {Philadelphia},
    year = {1993},
    pages = {644--646},
    keywords = {iterative methods, parallelism, communication cost}
    }
    
  • Reducing communication costs in the conjugate gradient algorithm on distributed memory multiprocessors. With Ed D'Azevedo and Chuck Romine. UTK CS report CS-93-185, Lapack Working Note 56. ps file
    @techreport{DAzEijRo:lawn56,
    author = {E.F. D'Azevedo and V.L. Eijkhout and C.H. Romine},
    title = {Lapack Working Note 56:
    	Reducing communication costs in the conjugate gradient
    	algorithm on distributed memory multiprocessors},
    institution = {Computer Science Department, 
    	University of Tennessee, Knoxville},
    number = {CS-93-185},
    year = {1993},
    keywords = {iterative methods, parallelism, communication cost}
    }
    
  • Computational variants of the CGS and BiCGstab methods. Lapack working note 78, 1994. ps file
    @techreport{Eij:cgs3t,
      author      = {Victor Eijkhout},
      title       = {Lapack Working Note 78, {C}omputational variants of the {CGS} and {BiCGstab} methods},
      institution = {Computer Science Department, University of Tennessee, Knoxville},
      number      = {CS-94-241},
      year        = {1994},
    }
    
  • On the existence problem of incomplete factorisation methods. Lapack working note 144, 1999. ps file
    @techreport{Eijk:ilu-overview,
      author      = {Victor Eijkhout},
      title       = {On the Existence Problem of Incomplete Factorisation Methods},
      institution = {Computer Science Department, University of Tennessee},
      number      = {Lapack working note 144, UT-CS-99-435},
      year        = {1999},
    }
    
  • The `weighted modification' incomplete factorisation method. Lapack working note 145, 1999. ps file
    @techreport{Eijk:weighted-ilu,
      author      = {Victor Eijkhout},
      title       = {The `weighted modification' incomplete factorisation method},
      institution = {Computer Science Department, University of Tennessee},
      number      = {Lapack working note 145, UT-CS-99-436},
      year        = {1999},
    }
    
  • Recursive approach in sparse matrix LU factorization, with Jack Dongarra and Piotr Luszczek, Scientific Programming 2001 pdf file
    @ARTICLE{DonEijkLus:recursive2001,
      AUTHOR = "Jack J. Dongarra and Victor Eijkhout and Piotr Luszczek",
      TITLE = "Recursive approach in sparse matrix {LU} factorization",
      JOURNAL = "Scientific Programming",
      VOLUME = "9",
      NUMBER = "1",
      PAGES = "51--60",
      YEAR = "2001"
    }
    
  • Automatic determination of matrix blocks. Lapack working note 151, 2001; submitted to Scientific Programming. ps file
    @techreport{Eijk:auto-block,
      author      = {Victor Eijkhout},
      title       = {Automatic Determination of Matrix Blocks},
      institution = {Department of Computer Science, University of Tennessee},
      number      = {ut-cs-01-458},
      year        = {2001},
      note        = {Lapack Working Note 151},
    }
    
  • An iterative solver benchmark. With Jack Dongarra and Henk van der Vorst. Lapack working note 152. Scientific Programming, 2001. pdf file
    @article{DonEijkVDV:benchmark,
    author = {Jack Dongarra and Victor Eijkhout and Henk {van der Vorst}},
    title = {An Iterative Solver Benchmark},
    journal = {Scientific Programming},
    volume = {9},
    number = {4},
    year = {2001},
    pages = {223--231},
    note = {also Lapack Working Note 152}
    }
    

Overview articles

  • Overview of iterative linear solver packages. In NHSE Review, 1998. ps file
    @article{Eijk:nhse-iterative-survey,
    author = {Victor Eijkhout},
    title = {Overview of Iterative Linear System Solver Packages},
    year = {1998},
    journal = {NHSE review},
    volume = {3},
    number = {1},
    note = {available at {\tt http://\discretionary{}{}{}%
    www.nhse.org/\discretionary{}{}{}%
    NHSEreview/ILS/\discretionary{}{}{}%
    ILStoc.html},
                    also UT Lapack Working Note 141}
    }
    
  • Numerical Linear Algebra. With Jack Dongarra. In Encyclopaedia of computer science and technology, volume 41; 1999. ps file
    @incollection{DonEijk:ency,
      author    = {Jack J. Dongarra and Victor Eijkhout},
      title     = {Numerical Linear Algebra},
      editor    = {Allen Kent and James G. Williams},
      booktitle = {Encyclopaedia of Computer Science and Technology},
      volume    = {41},
      pages     = {207--234},
      publisher = {Marcel Dekker, Inc.},
      year      = {1999},
    }