187 lines
7.0 KiB
Plaintext
187 lines
7.0 KiB
Plaintext
# SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
# SPDX-License-Identifier: Apache-2.0
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
#HEADER
|
|
# -- High Performance Conjugate Gradient Benchmark (HPCG)
|
|
# HPCG - 3.1 - March 28, 2019
|
|
|
|
# Michael A. Heroux
|
|
# Scalable Algorithms Group, Computing Research Division
|
|
# Sandia National Laboratories, Albuquerque, NM
|
|
#
|
|
# Piotr Luszczek
|
|
# Jack Dongarra
|
|
# University of Tennessee, Knoxville
|
|
# Innovative Computing Laboratory
|
|
#
|
|
# (C) Copyright 2013-2019 All Rights Reserved
|
|
#
|
|
#
|
|
# -- Copyright notice and Licensing terms:
|
|
#
|
|
# Redistribution and use in source and binary forms, with or without
|
|
# modification, are permitted provided that the following conditions
|
|
# are met:
|
|
#
|
|
# 1. Redistributions of source code must retain the above copyright
|
|
# notice, this list of conditions and the following disclaimer.
|
|
#
|
|
# 2. Redistributions in binary form must reproduce the above copyright
|
|
# notice, this list of conditions, and the following disclaimer in the
|
|
# documentation and/or other materials provided with the distribution.
|
|
#
|
|
# 3. All advertising materials mentioning features or use of this
|
|
# software must display the following acknowledgement:
|
|
# This product includes software developed at Sandia National
|
|
# Laboratories, Albuquerque, NM and the University of
|
|
# Tennessee, Knoxville, Innovative Computing Laboratory.
|
|
#
|
|
# 4. The name of the University, the name of the Laboratory, or the
|
|
# names of its contributors may not be used to endorse or promote
|
|
# products derived from this software without specific written
|
|
# permission.
|
|
#
|
|
# -- Disclaimer:
|
|
#
|
|
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
# ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
|
|
# OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
# DATA OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
# ######################################################################
|
|
#@HEADER
|
|
# ----------------------------------------------------------------------
|
|
# - shell --------------------------------------------------------------
|
|
# ----------------------------------------------------------------------
|
|
#
|
|
SHELL = /bin/sh
|
|
#
|
|
CD = cd
|
|
CP = cp
|
|
LN_S = ln -s -f
|
|
MKDIR = mkdir -p
|
|
RM = /bin/rm -f
|
|
TOUCH = touch
|
|
#
|
|
# ----------------------------------------------------------------------
|
|
# - HPCG Directory Structure / HPCG library ------------------------------
|
|
# ----------------------------------------------------------------------
|
|
#
|
|
TOPdir = .
|
|
SRCdir = $(TOPdir)/src
|
|
INCdir = $(TOPdir)/src
|
|
BINdir = $(TOPdir)/bin
|
|
#
|
|
# ----------------------------------------------------------------------
|
|
# - Message Passing library (MPI) --------------------------------------
|
|
# ----------------------------------------------------------------------
|
|
# MPinc tells the C compiler where to find the Message Passing library
|
|
# header files, MPlib is defined to be the name of the library to be
|
|
# used. The variable MPdir is only used for defining MPinc and MPlib.
|
|
#
|
|
#MPdir =
|
|
#MPinc =
|
|
#MPlib =
|
|
#
|
|
#
|
|
# ----------------------------------------------------------------------
|
|
# - HPCG includes / libraries / specifics -------------------------------
|
|
# ----------------------------------------------------------------------
|
|
#
|
|
|
|
NVPL_SPARSE_INC=$(NVPL_PATH)/include
|
|
NVPL_SPARSE_LIB=$(NVPL_PATH)/lib
|
|
|
|
HPCG_INCLUDES = -I$(INCdir) -I$(INCdir)/$(arch) -I$(MPdir)/include $(CRAY_CUDATOOLKIT_INCLUDE_OPTS)
|
|
HPCG_LIBS = -L${MPlib} -lmpi
|
|
|
|
HPCG_INCLUDES += -I$(CUDA_HOME)/include -I$(Mathdir)/include
|
|
HPCG_LIBS += -L$(Mathdir)/lib -lcuda -lcusparse -lcublas -lcublasLt -L$(CUDA_HOME)/lib64
|
|
|
|
ifeq ($(USE_NCCL), 1)
|
|
HPCG_INCLUDES += -I$(NCCLdir)/include
|
|
HPCG_LIBS += -L$(NCCLdir)/lib -lnccl
|
|
endif
|
|
|
|
#
|
|
# - Compile time options -----------------------------------------------
|
|
#
|
|
# -DHPCG_NO_MPI Define to disable MPI
|
|
# -DHPCG_NO_OPENMP Define to disable OPENMP
|
|
# -DHPCG_CONTIGUOUS_ARRAYS Define to have sparse matrix arrays long and contiguous
|
|
# -DHPCG_DEBUG Define to enable debugging output
|
|
# -DHPCG_DETAILED_DEBUG Define to enable very detailed debugging output
|
|
# -DUSE_CUDA Define to enable GPU execution
|
|
# -DUSE_NCCL Define to enabele NCCL P2P communication. Use --p2p=4 for NCCL
|
|
# -DUSE_INT64 Define to enable INT64 indexing
|
|
|
|
# By default HPCG will:
|
|
# *) Build with MPI enabled.
|
|
# *) Build with OpenMP enabled.
|
|
# *) Not generate debugging output.
|
|
#
|
|
HPCG_OPTS = -DHPCG_CUBIC_RADICAL_SEARCH -DHPCG_CONTIGUOUS_ARRAYS #-DHPCG_DEBUG #-DHPCG_NO_MPI
|
|
HPCG_OPTS += -DUSE_CUDA
|
|
|
|
ifeq ($(USE_NCCL), 1)
|
|
HPCG_OPTS += -DUSE_NCCL
|
|
endif
|
|
|
|
ifeq ($(HPCG_ENG_VERSION), 1)
|
|
HPCG_OPTS += -DHPCG_ENG_VERSION
|
|
endif
|
|
|
|
ifeq ($(USE_INT64), 1)
|
|
HPCG_OPTS += -DINDEX_64
|
|
endif
|
|
|
|
#If not set, the defualt values in src/hpcg.hpp will be used
|
|
HPCG_OPTS += -Dmake_HPCG_VER_MAJOR=$(HPCG_VER_MAJOR)
|
|
HPCG_OPTS += -Dmake_HPCG_VER_MINOR=$(HPCG_VER_MINOR)
|
|
HPCG_OPTS += -DHPCG_COMMIT_HASH=$(HPCG_COMMIT_HASH)
|
|
#
|
|
# ----------------------------------------------------------------------
|
|
#
|
|
HPCG_DEFS = $(HPCG_OPTS) $(HPCG_INCLUDES)
|
|
#
|
|
# ----------------------------------------------------------------------
|
|
# - Compilers / linkers - Optimization flags ---------------------------
|
|
# ----------------------------------------------------------------------
|
|
#
|
|
CUDA_ARCH = -gencode=arch=compute_80,code=sm_80 -gencode=arch=compute_90,code=sm_90
|
|
ifeq ($(BUILD_B100), 1)
|
|
CUDA_ARCH += --generate-code arch=compute_100,code=sm_100
|
|
endif
|
|
CPU_ARCH ?= native
|
|
|
|
CXX = nvcc
|
|
CXXFLAGS = $(HPCG_DEFS) -O3 -Xcompiler --std=c++17 -Xcompiler -Ofast,-fopenmp,-mcpu=$(CPU_ARCH),-mtune=$(CPU_ARCH),-ftree-vectorize,-funroll-loops $(CUDA_ARCH)
|
|
|
|
#
|
|
LINKER = $(CXX)
|
|
LINKFLAGS = $(CXXFLAGS) $(HPCG_LIBS)
|
|
#
|
|
ARCHIVER = ar
|
|
ARFLAGS = r
|
|
RANLIB = echo
|
|
#
|
|
# ----------------------------------------------------------------------
|