sandialabs
diff --git a/‎COPYING
+6-4 b/‎COPYING
+6-4
diff --git a/‎configure.in
+11-4 b/‎configure.in
+11-4
diff --git a/‎test/benchmarks/Makefile.am
+3 b/‎test/benchmarks/Makefile.am
+3
diff --git a/‎test/benchmarks/mantevo/Makefile.am
+19 b/‎test/benchmarks/mantevo/Makefile.am
+19
diff --git a/‎test/benchmarks/mantevo/hpccg/HPCCG.cpp
+149 b/‎test/benchmarks/mantevo/hpccg/HPCCG.cpp
+149
diff --git a/‎test/benchmarks/mantevo/hpccg/HPCCG.hpp
+59 b/‎test/benchmarks/mantevo/hpccg/HPCCG.hpp
+59
diff --git a/‎test/benchmarks/mantevo/hpccg/HPC_Sparse_Matrix.hpp
+70 b/‎test/benchmarks/mantevo/hpccg/HPC_Sparse_Matrix.hpp
+70
@@ -27,17 +27,17 @@ certain rights in this software.
 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-The qthreads library contains parts of an earlier library (libtask, by Russ
-Cox) that requires the propogation of its copyright information. This sofware
-is in the fastcontext directory, namely the files:
+The qthreads library contains heavily modified parts of an earlier library
+(libtask, by Russ Cox) that requires the propagation of its copyright
+information. This software is in the fastcontext directory, namely the files:
 
 	asm.S
 	power-ucontext.h
 	386-ucontext.h
 	context.c
 	taskimpl.h
 
-However, those files have been extensively modified.
+However, as noted above, those files have been extensively modified, and do not resemble the original very much.
 
 The rest of the qthread library, which will function on any Unix system with
 the makecontext()-family of functions, can stand alone. Those files are simply
@@ -50,6 +50,8 @@ used only by the UTS implementation in test/benchmarks/uts. The license for the
 random number generator code is in the LICENSE file in the
 test/benchmarks/uts/rng directory.
 
+The benchmark suite also contains some code from the Sandia Mantevo project, located in the test/benchmarks/mantevo directory. The licenses for those codes reside in their respective directories. For example, the HPCCG code license is in test/benchmarks/mantevo/hpccg/README.
+
 ~~~~~~~~~~~~~
 
 The libtask copyright is as follows:
 
@@ -1042,10 +1042,15 @@ AS_IF([test "x$enable_multinode" = "xyes"],
        esac],
       [enable_multinode="no"])
 
-AS_IF([test "x$enable_lf_febs" == "xyes"],
-      [enable_lf_febs=yes
-       AC_DEFINE([LOCK_FREE_FEBS], [1], [Define to use a lock-free hash table for FEB metadata.])],
+AS_IF([test "x$enable_lf_febs" = "xyes"],
+      [AC_DEFINE([LOCK_FREE_FEBS], [1], [Define to use a lock-free hash table for FEB metadata.])],
       [enable_lf_febs=no])
+dnl AS_IF([test "x$enable_lf_febs" != "xno"],
+dnl       [AS_IF([test "x$enable_hardware_atomics" = "xyes" -a "x$qthread_cv_atomic_CASptr" = "xyes"],
+dnl              [enable_lf_febs=yes
+dnl               AC_DEFINE([LOCK_FREE_FEBS], [1], [Define to use a lock-free hash table for FEB metadata.])],
+dnl              [enable_lf_febs=no])],
+dnl       [enable_lf_febs=no])
 
 ## --------------- ##
 ## Output and done ##
@@ -1097,9 +1102,11 @@ AC_CONFIG_FILES([Makefile
                  test/features/Makefile
                  test/stress/Makefile
                  test/benchmarks/Makefile
+                 test/benchmarks/mantevo/Makefile
+                 test/benchmarks/mantevo/hpccg/Makefile
                  test/benchmarks/rose_bots/Makefile])
 AS_IF([test "enable_multinode" = "yes"],
-                 [AC_CONFIG_FILES([test/multinode/Makefile])])
+      [AC_CONFIG_FILES([test/multinode/Makefile])])
 AC_OUTPUT
 
 case "$qthread_cv_stack_size" in
 
@@ -1,3 +1,4 @@
+SUBDIRS = mantevo
 
 .PHONY: buildall buildtests buildextra benchmarks
 
@@ -135,9 +136,11 @@ buildall: $(benchmarks)
 	$(MAKE) -C rose_bots buildall
 buildextra: $(benchmarks)
 	$(MAKE) -C rose_bots buildextra
+	$(MAKE) -C mantevo buildextra
 else
 buildall: $(benchmarks)
 buildextra: $(benchmarks)
+	$(MAKE) -C mantevo buildextra
 endif
 
 benchmarks: buildextra
 
@@ -0,0 +1,19 @@
+# Benchmarks taken from the Sandia Mantevo project.
+SUBDIRS = hpccg
+
+mantevo_benchmarks = hpccg
+
+# Headers come from the top-level include directory; link against the
+# libtool archive of the qthread library.
+qthreadlib = $(top_builddir)/src/libqthread.la
+INCLUDES = -I$(top_srcdir)/include
+LDADD = $(qthreadlib)
+
+.PHONY: benchmarks buildall buildextra
+
+# Both convenience targets simply forward to buildextra.
+buildall benchmarks: buildextra
+
+# Build the hpccg target inside the hpccg subdirectory.
+buildextra:
+	$(MAKE) -C hpccg hpccg
+
+# Have the top-level src directory build the qthread library on demand.
+$(qthreadlib):
+	$(MAKE) -C $(top_builddir)/src libqthread.la
@@ -0,0 +1,149 @@
+
+//@HEADER
+// ************************************************************************
+// 
+//               HPCCG: Simple Conjugate Gradient Benchmark Code
+//                 Copyright (2006) Sandia Corporation
+// 
+// Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
+// license for use of this work by or on behalf of the U.S. Government.
+// 
+// This library is free software; you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as
+// published by the Free Software Foundation; either version 2.1 of the
+// License, or (at your option) any later version.
+//  
+// This library is distributed in the hope that it will be useful, but
+// WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+// Lesser General Public License for more details.
+//  
+// You should have received a copy of the GNU Lesser General Public
+// License along with this library; if not, write to the Free Software
+// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
+// USA
+// Questions? Contact Michael A. Heroux ([email protected]) 
+// 
+// ************************************************************************
+//@HEADER
+
+/////////////////////////////////////////////////////////////////////////
+
+// Routine to compute an approximate solution to Ax = b where:
+
+// A - known matrix stored as an HPC_Sparse_Matrix struct
+
+// b - known right hand side vector
+
+// x - On entry is initial guess, on exit new approximate solution
+
+// max_iter - Maximum number of iterations to perform, even if
+//            tolerance is not met.
+
+// tolerance - Stop and assert convergence if the norm of the residual
+//             is <= tolerance.
+
+// niters - On output, the number of iterations actually performed.
+
+/////////////////////////////////////////////////////////////////////////
+
+#include <iostream>
+#include <cstdio>
+#include <cmath>
+#include "mytimer.hpp"
+#include "HPCCG.hpp"
+
+#define TICK()  t0 = mytimer() // Use TICK and TOCK to time a code section
+#define TOCK(t) t += mytimer() - t0
+// Conjugate gradient iteration for A x = b.  The meaning of each solver
+// parameter is listed in the comment block at the top of this file.
+//
+// times - output array filled with the timing breakdown:
+//           [0] total, [1] ddot, [2] waxpby, [3] sparsemv, [4] AllReduce,
+//           and, only when built with USING_MPI, [5] exchange boundary.
+//
+// Always returns 0.
+int HPCCG(HPC_Sparse_Matrix * A,
+	  const double * const b, double * const x,
+	  const int max_iter, const double tolerance, int &niters, double & normr,
+	  double * times)
+
+{
+  double t_begin = mytimer();  // Start timing right away
+
+  // t0 is the scratch start time used by TICK/TOCK; t1..t5 accumulate the
+  // time spent in each kind of kernel.
+  double t0 = 0.0, t1 = 0.0, t2 = 0.0, t3 = 0.0, t4 = 0.0;
+#ifdef USING_MPI
+  double t5 = 0.0;
+#endif
+  int nrow = A->local_nrow;
+  int ncol = A->local_ncol;
+
+  double * r = new double [nrow];
+  double * p = new double [ncol]; // In parallel case, A is rectangular
+  double * Ap = new double [nrow];
+
+  // Give both outputs defined values up front: the iteration loop below may
+  // execute zero times (max_iter <= 1, or the initial residual already
+  // satisfies the tolerance) and niters is otherwise only assigned inside it.
+  niters = 0;
+  normr = 0.0;
+  double rtrans = 0.0;
+  double oldrtrans = 0.0;
+
+#ifdef USING_MPI
+  int size, rank; // Number of MPI processes, My process ID
+  MPI_Comm_size(MPI_COMM_WORLD, &size);
+  MPI_Comm_rank(MPI_COMM_WORLD, &rank);
+#else
+  //int size = 1; // Serial case (not using MPI)
+  int rank = 0;
+#endif
+
+  // Report progress roughly ten times per run, but at least every 50
+  // iterations and never with a frequency below 1.
+  int print_freq = max_iter/10;
+  if (print_freq>50) print_freq=50;
+  if (print_freq<1)  print_freq=1;
+
+  // p is of length ncols, copy x to p for sparse MV operation
+  TICK(); waxpby(nrow, 1.0, x, 0.0, x, p); TOCK(t2);
+#ifdef USING_MPI
+  TICK(); exchange_externals(A,p); TOCK(t5);
+#endif
+  // Initial residual: r = b - A*x, rtrans = r.r
+  TICK(); HPC_sparsemv(A, p, Ap); TOCK(t3);
+  TICK(); waxpby(nrow, 1.0, b, -1.0, Ap, r); TOCK(t2);
+  TICK(); ddot(nrow, r, r, &rtrans, t4); TOCK(t1);
+  normr = sqrt(rtrans);
+
+  if (rank==0) printf("Initial Residual = %g\n", normr);
+
+  // k starts at 1 and stops before max_iter, so at most max_iter-1
+  // iterations are performed.
+  for(int k=1; k<max_iter && normr > tolerance; k++ )
+    {
+      if (k == 1)
+        {
+          // First iteration: copy r to p.
+          TICK(); waxpby(nrow, 1.0, r, 0.0, r, p); TOCK(t2);
+        }
+      else
+        {
+          oldrtrans = rtrans;
+          TICK(); ddot (nrow, r, r, &rtrans, t4); TOCK(t1);// 2*nrow ops
+          double beta = rtrans/oldrtrans;
+          TICK(); waxpby (nrow, 1.0, r, beta, p, p);  TOCK(t2);// 2*nrow ops
+        }
+      normr = sqrt(rtrans);
+      // Only rank 0 prints, every print_freq iterations and on the last
+      // iteration the loop bound allows.
+      if (rank==0 && (k%print_freq == 0 || k+1 == max_iter))
+        printf("Iteration = %i   Residual = %g\n", k, normr);
+
+#ifdef USING_MPI
+      TICK(); exchange_externals(A,p); TOCK(t5);
+#endif
+      TICK(); HPC_sparsemv(A, p, Ap); TOCK(t3); // 2*nnz ops
+      double alpha = 0.0;
+      TICK(); ddot(nrow, p, Ap, &alpha, t4); TOCK(t1); // 2*nrow ops
+      alpha = rtrans/alpha;
+      // The two updates below share a single TICK/TOCK timing section.
+      TICK(); waxpby(nrow, 1.0, x, alpha, p, x);// 2*nrow ops
+      waxpby(nrow, 1.0, r, -alpha, Ap, r);  TOCK(t2);// 2*nrow ops
+      niters = k;
+    }
+
+  // Store times
+  times[1] = t1; // ddot time
+  times[2] = t2; // waxpby time
+  times[3] = t3; // sparsemv time
+  times[4] = t4; // AllReduce time
+#ifdef USING_MPI
+  times[5] = t5; // exchange boundary time
+#endif
+  delete [] p;
+  delete [] Ap;
+  delete [] r;
+  times[0] = mytimer() - t_begin;  // Total time. All done...
+  return(0);
+}
@@ -0,0 +1,59 @@
+
+//@HEADER
+// ************************************************************************
+// 
+//               HPCCG: Simple Conjugate Gradient Benchmark Code
+//                 Copyright (2006) Sandia Corporation
+// 
+// Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
+// license for use of this work by or on behalf of the U.S. Government.
+// 
+// This library is free software; you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as
+// published by the Free Software Foundation; either version 2.1 of the
+// License, or (at your option) any later version.
+//  
+// This library is distributed in the hope that it will be useful, but
+// WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+// Lesser General Public License for more details.
+//  
+// You should have received a copy of the GNU Lesser General Public
+// License along with this library; if not, write to the Free Software
+// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
+// USA
+// Questions? Contact Michael A. Heroux ([email protected]) 
+// 
+// ************************************************************************
+//@HEADER
+
+#ifndef HPCCG_H
+#define HPCCG_H
+#include "HPC_sparsemv.hpp"
+#include "ddot.hpp"
+#include "waxpby.hpp"
+#include "HPC_Sparse_Matrix.hpp"
+
+#ifdef USING_MPI
+#include "exchange_externals.hpp"
+#include <mpi.h> // If this routine is compiled with -DUSING_MPI
+                 // then include mpi.h
+#endif
+int HPCCG(HPC_Sparse_Matrix * A,
+	  const double * const b, double * const x,
+	  const int max_iter, const double tolerance, int & niters, double & normr, double * times);
+
+// this function will compute the Conjugate Gradient...
+// A <=> Matrix
+// b <=> constant (known right hand side vector)
+// xnot <=> initial guess; there is no separate xnot parameter, the
+//          initial guess is passed in through x
+// max_iter <=> how many times we iterate
+// tolerance <=> specifies how "good" of a value we would like
+// x <=> used for return value (overwritten with the approximate solution)
+// normr <=> output, set to the square root of the residual dot product
+// times <=> output array of timings filled in by HPCCG()
+
+// A is known
+// x is unknown vector
+// b is known vector
+// xnot = 0
+// niters is the number of iterations
+#endif
@@ -0,0 +1,70 @@
+
+//@HEADER
+// ************************************************************************
+// 
+//               HPCCG: Simple Conjugate Gradient Benchmark Code
+//                 Copyright (2006) Sandia Corporation
+// 
+// Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
+// license for use of this work by or on behalf of the U.S. Government.
+// 
+// This library is free software; you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as
+// published by the Free Software Foundation; either version 2.1 of the
+// License, or (at your option) any later version.
+//  
+// This library is distributed in the hope that it will be useful, but
+// WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+// Lesser General Public License for more details.
+//  
+// You should have received a copy of the GNU Lesser General Public
+// License along with this library; if not, write to the Free Software
+// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
+// USA
+// Questions? Contact Michael A. Heroux ([email protected]) 
+// 
+// ************************************************************************
+//@HEADER
+
+#ifndef HPC_SPARSE_MATRIX_H
+#define HPC_SPARSE_MATRIX_H
+
+// These constants are upper bounds that might need to be changed for
+// pathological matrices, e.g., those with nearly dense rows/columns.
+
+const int max_external = 100000;
+const int max_num_messages = 500;
+const int max_num_neighbors = max_num_messages;
+
+
+// Sparse matrix description handed to the HPCCG kernels.
+// NOTE(review): the per-field notes marked "presumably" are inferred from
+// the field names only -- confirm against the code that fills the struct.
+struct HPC_Sparse_Matrix_STRUCT {
+  char   *title;
+  int start_row;   // presumably first global row held locally -- confirm
+  int stop_row;    // presumably last global row held locally -- confirm
+  int total_nrow;
+  long long total_nnz;
+  int local_nrow;  // HPCCG() sizes its r and Ap work vectors with this
+  int local_ncol;  // Must be defined in make_local_matrix
+                   // (HPCCG() sizes its p work vector with this)
+  int local_nnz;
+  // Per-row arrays; presumably one entry per local row -- confirm.
+  int  * nnz_in_row;
+  double ** ptr_to_vals_in_row;
+  int ** ptr_to_inds_in_row;
+  double ** ptr_to_diags;
+
+  // The remaining members exist only in builds compiled with USING_MPI.
+#ifdef USING_MPI
+  int num_external;
+  int num_send_neighbors;
+  int *external_index;
+  int *external_local_index;
+  int total_to_be_sent;
+  int *elements_to_send;
+  int *neighbors;
+  int *recv_length;
+  int *send_length;
+  double *send_buffer;
+
+#endif
+};
+typedef struct HPC_Sparse_Matrix_STRUCT HPC_Sparse_Matrix;
+#endif