2014-08-05 17:32:28 +08:00
|
|
|
#
|
|
|
|
#//===----------------------------------------------------------------------===//
|
|
|
|
#//
|
|
|
|
#// The LLVM Compiler Infrastructure
|
|
|
|
#//
|
|
|
|
#// This file is dual licensed under the MIT and the University of Illinois Open
|
|
|
|
#// Source Licenses. See LICENSE.txt for details.
|
|
|
|
#//
|
|
|
|
#//===----------------------------------------------------------------------===//
|
|
|
|
#
|
2014-06-02 02:01:33 +08:00
|
|
|
|
2015-06-01 11:05:13 +08:00
|
|
|
# Top-level CMake configuration for libomp.
cmake_minimum_required(VERSION 2.8 FATAL_ERROR)

# Search this project's cmake/ directory first when resolving include() and
# find_package() modules; any previously configured module path is kept after it.
set(CMAKE_MODULE_PATH
  ${CMAKE_CURRENT_SOURCE_DIR}/cmake
  ${CMAKE_MODULE_PATH})
|
|
|
|
|
2015-05-06 04:02:52 +08:00
|
|
|
# Is libomp configured on its own, or as part of a larger (LLVM) tree?
# It counts as standalone when the top-level source directory is either this
# directory or its parent (this directory being <top>/runtime). Only in that
# case does this file declare its own project.
if("${CMAKE_SOURCE_DIR}" STREQUAL "${CMAKE_CURRENT_SOURCE_DIR}" OR
   "${CMAKE_SOURCE_DIR}/runtime" STREQUAL "${CMAKE_CURRENT_SOURCE_DIR}")
  project(libomp C CXX)
  set(LIBOMP_STANDALONE_BUILD TRUE)
else()
  set(LIBOMP_STANDALONE_BUILD FALSE)
endif()
|
|
|
|
|
2015-08-29 02:42:10 +08:00
|
|
|
# libomp version, split into its major and minor components.
set(LIBOMP_VERSION_MAJOR "5")
set(LIBOMP_VERSION_MINOR "0")
|
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Project helper modules. They live in the cmake/ subdirectory and are
# resolved through CMAKE_MODULE_PATH.
include(LibompUtils)
include(LibompGetArchitecture)
include(LibompHandleFlags)
include(LibompDefinitions)
|
2014-08-05 17:32:28 +08:00
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Determine the target architecture (LIBOMP_ARCH) together with the settings
# whose source depends on the kind of build:
#   - standalone: values are user-tunable cache entries with local defaults;
#   - inside LLVM: values are taken from the corresponding LLVM_* variables.
if(${LIBOMP_STANDALONE_BUILD})
  # If adding a new architecture, take a look at cmake/LibompGetArchitecture.cmake
  libomp_get_architecture(LIBOMP_DETECTED_ARCH)
  set(LIBOMP_ARCH ${LIBOMP_DETECTED_ARCH} CACHE STRING
    "The architecture to build for (x86_64/i386/arm/ppc64/ppc64le/aarch64/mic).")
  # Allow user to choose a suffix for the installation directory.
  set(LIBOMP_LIBDIR_SUFFIX "" CACHE STRING
    "suffix of lib installation directory e.g., 64 => lib64")
  # Should assertions be enabled?  They are on by default.
  set(LIBOMP_ENABLE_ASSERTIONS TRUE CACHE BOOL
    "enable assertions?")
  set(LIBOMP_ENABLE_WERROR FALSE CACHE BOOL
    "Enable -Werror flags to turn warnings into errors for supporting compilers.")
  # CMAKE_BUILD_TYPE was not defined, set default to Release
  if(NOT CMAKE_BUILD_TYPE)
    set(CMAKE_BUILD_TYPE Release)
  endif()
else() # Part of LLVM build
  # Determine the native architecture from LLVM.
  string(TOLOWER "${LLVM_TARGET_ARCH}" LIBOMP_NATIVE_ARCH)
  if(LIBOMP_NATIVE_ARCH STREQUAL "host")
    # Take everything before the first '-' of the host triple. The triple is
    # quoted so that an empty value yields an empty match (handled by the
    # fallback below) instead of a malformed string() call.
    string(REGEX MATCH "^[^-]*" LIBOMP_NATIVE_ARCH "${LLVM_HOST_TRIPLE}")
  endif()
  # MATCHES is a regex search (substring match), so the more specific names
  # must be tested before the names they contain: powerpc64le before powerpc,
  # arm64/aarch64 before arm.
  if(LIBOMP_NATIVE_ARCH MATCHES "i[2-6]86")
    set(LIBOMP_ARCH i386)
  elseif(LIBOMP_NATIVE_ARCH STREQUAL "x86")
    set(LIBOMP_ARCH i386)
  elseif(LIBOMP_NATIVE_ARCH STREQUAL "amd64")
    set(LIBOMP_ARCH x86_64)
  elseif(LIBOMP_NATIVE_ARCH STREQUAL "x86_64")
    set(LIBOMP_ARCH x86_64)
  elseif(LIBOMP_NATIVE_ARCH MATCHES "powerpc64le")
    # Little-endian PowerPC must not fall into the generic "powerpc" branch,
    # which selects the big-endian ppc64 configuration.
    set(LIBOMP_ARCH ppc64le)
  elseif(LIBOMP_NATIVE_ARCH MATCHES "powerpc")
    set(LIBOMP_ARCH ppc64)
  elseif(LIBOMP_NATIVE_ARCH MATCHES "aarch64")
    set(LIBOMP_ARCH aarch64)
  elseif(LIBOMP_NATIVE_ARCH MATCHES "arm64")
    set(LIBOMP_ARCH aarch64)
  elseif(LIBOMP_NATIVE_ARCH MATCHES "arm")
    set(LIBOMP_ARCH arm)
  else()
    # last ditch effort
    libomp_get_architecture(LIBOMP_ARCH)
  endif()
  set(LIBOMP_LIBDIR_SUFFIX ${LLVM_LIBDIR_SUFFIX})
  set(LIBOMP_ENABLE_ASSERTIONS ${LLVM_ENABLE_ASSERTIONS})
  set(LIBOMP_ENABLE_WERROR ${LLVM_ENABLE_WERROR})
endif()
|
2015-07-16 00:05:30 +08:00
|
|
|
# Each libomp_check_variable() call passes a variable name followed by the
# values accepted for it. The helper is defined elsewhere; presumably it
# rejects any other value -- confirm in cmake/LibompUtils.cmake.
libomp_check_variable(LIBOMP_ARCH
  32e x86_64 32 i386 arm ppc64 ppc64le aarch64 mic)

# Which flavour of the library to build.
set(LIBOMP_LIB_TYPE normal CACHE STRING
  "Performance,Profiling,Stubs library (normal/profile/stubs)")
libomp_check_variable(LIBOMP_LIB_TYPE
  normal profile stubs)

# Which OpenMP version to build for.
set(LIBOMP_OMP_VERSION 41 CACHE STRING
  "The OpenMP version (41/40/30)")
libomp_check_variable(LIBOMP_OMP_VERSION
  41 40 30)
|
2015-08-29 02:42:10 +08:00
|
|
|
# Set the OpenMP year and month associated with the selected version.
# Start from the oldest value and raise it for every version threshold
# (30, then 40) that LIBOMP_OMP_VERSION reaches.
set(LIBOMP_OMP_YEAR_MONTH 200505)
if(${LIBOMP_OMP_VERSION} GREATER 30 OR ${LIBOMP_OMP_VERSION} EQUAL 30)
  set(LIBOMP_OMP_YEAR_MONTH 201107)
endif()
if(${LIBOMP_OMP_VERSION} GREATER 40 OR ${LIBOMP_OMP_VERSION} EQUAL 40)
  set(LIBOMP_OMP_YEAR_MONTH 201307)
endif()
|
2015-07-16 00:05:30 +08:00
|
|
|
# Intel(R) MIC variant. The value is only checked against knf/knc when the
# selected architecture is "mic".
set(LIBOMP_MIC_ARCH knc CACHE STRING
  "Intel(R) Many Integrated Core Architecture (Intel(R) MIC Architecture) (knf/knc). Ignored if not Intel(R) MIC Architecture build.")
if("${LIBOMP_ARCH}" STREQUAL "mic")
  libomp_check_variable(LIBOMP_MIC_ARCH knf knc)
endif()

# Fortran module files are optional and off by default.
set(LIBOMP_FORTRAN_MODULES FALSE CACHE BOOL
  "Create Fortran module files? (requires fortran compiler)")
|
2014-08-05 17:32:28 +08:00
|
|
|
|
2015-05-30 00:13:56 +08:00
|
|
|
# Universal ("fat") binary builds on Mac.
# LIBOMP_OSX_ARCHITECTURES defaults to CMAKE_OSX_ARCHITECTURES and is then
# written back into CMAKE_OSX_ARCHITECTURES. Having the separate variable lets
# people build this library as a universal library without forcing a
# universal build of the llvm/clang compiler.
set(LIBOMP_OSX_ARCHITECTURES "${CMAKE_OSX_ARCHITECTURES}" CACHE STRING
  "For Mac builds, semicolon separated list of architectures to build for universal fat binary.")
set(CMAKE_OSX_ARCHITECTURES ${LIBOMP_OSX_ARCHITECTURES})
|
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Extra flags supplied by the user, one cache entry per tool. All default to
# empty; per the original note they are appended to the configured flags.
set(LIBOMP_CFLAGS   "" CACHE STRING "Appended user specified C compiler flags.")
set(LIBOMP_CXXFLAGS "" CACHE STRING "Appended user specified C++ compiler flags.")
set(LIBOMP_CPPFLAGS "" CACHE STRING "Appended user specified C preprocessor flags.")
set(LIBOMP_ASMFLAGS "" CACHE STRING "Appended user specified assembler flags.")
set(LIBOMP_LDFLAGS  "" CACHE STRING "Appended user specified linker flags.")
set(LIBOMP_LIBFLAGS "" CACHE STRING "Appended user specified linked libs flags. (e.g., -lm)")
set(LIBOMP_FFLAGS   "" CACHE STRING
  "Appended user specified Fortran compiler flags.  These are only used if LIBOMP_FORTRAN_MODULES==TRUE.")
|
2014-08-05 17:32:28 +08:00
|
|
|
|
2015-06-01 11:05:13 +08:00
|
|
|
# Should the libomp library and generated headers be copied into the original
# source exports/ directory?
# Turning this to FALSE aids parallel builds to not interfere with each other.
# Currently, the testsuite module expects the just built OpenMP library to be
# located inside the exports/ directory.
# TODO: have testsuite run under llvm-lit directly. We can then get rid of
# copying to exports/
#
# Declared as BOOL (not STRING) because it is an on/off switch, matching the
# other boolean options in this file; TRUE/FALSE values passed with -D keep
# working unchanged.
set(LIBOMP_COPY_EXPORTS TRUE CACHE BOOL
  "Should exports be copied into source exports/ directory?")
|
2015-05-14 20:54:08 +08:00
|
|
|
|
2014-08-05 17:32:28 +08:00
|
|
|
# Build number. Obtained through libomp_get_build_number() for this source
# directory (according to the original note it is read from kmp_version.c).
libomp_get_build_number("${CMAKE_CURRENT_SOURCE_DIR}" LIBOMP_VERSION_BUILD)

# Split the build number with integer arithmetic: the quotient by 10000 is
# stored as the year part, the remainder as the month/day part.
math(EXPR LIBOMP_VERSION_BUILD_YEAR      "${LIBOMP_VERSION_BUILD}/10000")
math(EXPR LIBOMP_VERSION_BUILD_MONTH_DAY "${LIBOMP_VERSION_BUILD}%10000")

# No timestamp is recorded at present; a fixed placeholder is used instead.
set(LIBOMP_BUILD_DATE "No_Timestamp")
|
2014-08-05 17:32:28 +08:00
|
|
|
|
|
|
|
# Architecture flags. Every flag starts out FALSE; the branch matching
# LIBOMP_ARCH then raises the flag(s) for that architecture. Both PowerPC
# variants additionally raise the common PPC64 flag.
foreach(libomp_arch_flag IA32 INTEL64 ARM AARCH64 PPC64BE PPC64LE PPC64 MIC)
  set(${libomp_arch_flag} FALSE)
endforeach()

if("${LIBOMP_ARCH}" STREQUAL "i386" OR "${LIBOMP_ARCH}" STREQUAL "32")
  # IA-32 architecture
  set(IA32 TRUE)
elseif("${LIBOMP_ARCH}" STREQUAL "x86_64" OR "${LIBOMP_ARCH}" STREQUAL "32e")
  # Intel(R) 64 architecture
  set(INTEL64 TRUE)
elseif("${LIBOMP_ARCH}" STREQUAL "arm")
  # ARM architecture
  set(ARM TRUE)
elseif("${LIBOMP_ARCH}" STREQUAL "ppc64")
  # PPC64BE architecture
  set(PPC64BE TRUE)
  set(PPC64 TRUE)
elseif("${LIBOMP_ARCH}" STREQUAL "ppc64le")
  # PPC64LE architecture
  set(PPC64LE TRUE)
  set(PPC64 TRUE)
elseif("${LIBOMP_ARCH}" STREQUAL "aarch64")
  # AARCH64 architecture
  set(AARCH64 TRUE)
elseif("${LIBOMP_ARCH}" STREQUAL "mic")
  # Intel(R) Many Integrated Core Architecture
  set(MIC TRUE)
endif()
|
|
|
|
|
|
|
|
# Build-type flags. All four start out FALSE; the one matching
# CMAKE_BUILD_TYPE (compared case-insensitively via a lower-cased copy) is
# then set to TRUE. An unrecognised or empty build type leaves all of them FALSE.
foreach(libomp_build_flag RELEASE_BUILD DEBUG_BUILD RELWITHDEBINFO_BUILD MINSIZEREL_BUILD)
  set(${libomp_build_flag} FALSE)
endforeach()

string(TOLOWER "${CMAKE_BUILD_TYPE}" libomp_build_type_lowercase)
if("${libomp_build_type_lowercase}" STREQUAL "release")
  set(RELEASE_BUILD TRUE)
elseif("${libomp_build_type_lowercase}" STREQUAL "debug")
  set(DEBUG_BUILD TRUE)
elseif("${libomp_build_type_lowercase}" STREQUAL "relwithdebinfo")
  set(RELWITHDEBINFO_BUILD TRUE)
elseif("${libomp_build_type_lowercase}" STREQUAL "minsizerel")
  set(MINSIZEREL_BUILD TRUE)
endif()
|
|
|
|
|
|
|
|
# The itt notify interface is always included for now.
set(LIBOMP_USE_ITT_NOTIFY TRUE)

# Library-type flags (normal, profile, stubs). All start out FALSE; the one
# named by LIBOMP_LIB_TYPE is then set to TRUE.
foreach(libomp_lib_flag NORMAL_LIBRARY STUBS_LIBRARY PROFILE_LIBRARY)
  set(${libomp_lib_flag} FALSE)
endforeach()

if("${LIBOMP_LIB_TYPE}" STREQUAL "normal")
  set(NORMAL_LIBRARY TRUE)
elseif("${LIBOMP_LIB_TYPE}" STREQUAL "profile")
  set(PROFILE_LIBRARY TRUE)
elseif("${LIBOMP_LIB_TYPE}" STREQUAL "stubs")
  set(STUBS_LIBRARY TRUE)
endif()
|
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Directory layout. Source-side paths hang off this directory; the include
# directory is additionally selected by the OpenMP version, and the binary
# directory is this directory's build tree.
set(LIBOMP_BASE_DIR   "${CMAKE_CURRENT_SOURCE_DIR}")
set(LIBOMP_SRC_DIR    "${LIBOMP_BASE_DIR}/src")
set(LIBOMP_TOOLS_DIR  "${LIBOMP_BASE_DIR}/tools")
set(LIBOMP_INC_DIR    "${LIBOMP_SRC_DIR}/include/${LIBOMP_OMP_VERSION}")
set(LIBOMP_BINARY_DIR "${CMAKE_CURRENT_BINARY_DIR}")
|
2014-08-05 17:32:28 +08:00
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Extra languages that are only switched on when a configuration needs them.

# Fortran: only when Fortran module files were requested.
if(${LIBOMP_FORTRAN_MODULES})
  enable_language(Fortran)
endif()

# MASM assembler: Windows only.
if(WIN32)
  enable_language(ASM_MASM)
endif()
|
2014-08-05 17:32:28 +08:00
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Fetch the "legal" type and architecture names through the project helpers;
# the results are stored in LIBOMP_LEGAL_TYPE and LIBOMP_LEGAL_ARCH.
libomp_get_legal_type(LIBOMP_LEGAL_TYPE)
libomp_get_legal_arch(LIBOMP_LEGAL_ARCH)

# Configuration checks (compiler flags, libraries, threading, etc.) are
# performed by the config-ix module.
include(config-ix)
|
I apologise in advance for the size of this check-in. At Intel we do
understand that this is not friendly, and are working to change our
internal code-development to make it easier to make development
features available more frequently and in finer (more functional)
chunks. Unfortunately we haven't got that in place yet, and unpicking
this into multiple separate check-ins would be non-trivial, so please
bear with me on this one. We should be better in the future.
Apologies over, what do we have here?
GCC 4.9 compatibility
--------------------
* We have implemented the new entrypoints used by code compiled by GCC
4.9 to implement the same functionality in gcc 4.8. Therefore code
compiled with gcc 4.9 that used to work will continue to do so.
However, there are some other new entrypoints (associated with task
cancellation) which are not implemented. Therefore user code compiled
by gcc 4.9 that uses these new features will not link against the LLVM
runtime. (It remains unclear how to handle those entrypoints, since
the GCC interface has potentially unpleasant performance implications
for join barriers even when cancellation is not used)
--- new parallel entry points ---
new entry points that aren't OpenMP 4.0 related
These are implemented fully :-
GOMP_parallel_loop_dynamic()
GOMP_parallel_loop_guided()
GOMP_parallel_loop_runtime()
GOMP_parallel_loop_static()
GOMP_parallel_sections()
GOMP_parallel()
--- cancellation entry points ---
Currently, these only give a runtime error if OMP_CANCELLATION is true
because our plain barriers don't check for cancellation while waiting
GOMP_barrier_cancel()
GOMP_cancel()
GOMP_cancellation_point()
GOMP_loop_end_cancel()
GOMP_sections_end_cancel()
--- taskgroup entry points ---
These are implemented fully.
GOMP_taskgroup_start()
GOMP_taskgroup_end()
--- target entry points ---
These are empty (as they are in libgomp)
GOMP_target()
GOMP_target_data()
GOMP_target_end_data()
GOMP_target_update()
GOMP_teams()
Improvements in Barriers and Fork/Join
--------------------------------------
* Barrier and fork/join code is now in its own file (which makes it
easier to understand and modify).
* Wait/release code is now templated and in its own file; suspend/resume code is also templated
* There's a new, hierarchical, barrier, which exploits the
cache-hierarchy of the Intel(r) Xeon Phi(tm) coprocessor to improve
fork/join and barrier performance.
***BEWARE*** the new source files have *not* been added to the legacy
CMake build system. If you want to use that, fixes will be required.
Statistics Collection Code
--------------------------
* New code has been added to collect application statistics (if this
is enabled at library compile time; by default it is not). The
statistics code itself is generally useful, the lightweight timing
code uses the X86 rdtsc instruction, so will require changes for other
architectures.
The intent of this code is not for users to tune their codes but
rather
1) For timing code-paths inside the runtime
2) For gathering general properties of OpenMP codes to focus attention
on which OpenMP features are most used.
Nested Hot Teams
----------------
* The runtime now maintains more state to reduce the overhead of
creating and destroying inner parallel teams. This improves the
performance of code that repeatedly uses nested parallelism with the
same resource allocation. Set the new KMP_HOT_TEAMS_MAX_LEVEL
envirable to a depth to enable this (and, of course, OMP_NESTED=true
to enable nested parallelism at all).
Improved Intel(r) VTune(Tm) Amplifier support
---------------------------------------------
* The runtime provides additional information to Vtune via the
itt_notify interface to allow it to display better OpenMP specific
analyses of load-imbalance.
Support for OpenMP Composite Statements
---------------------------------------
* Implement new entrypoints required by some of the OpenMP 4.1
composite statements.
Improved ifdefs
---------------
* More separation of concepts ("Does this platform do X?") from
platforms ("Are we compiling for platform Y?"), which should simplify
future porting.
ScaleMP* contribution
---------------------
Stack padding to improve the performance in their environment where
cross-node coherency is managed at the page level.
Redesign of wait and release code
---------------------------------
The code is simplified and performance improved.
Bug Fixes
---------
*Fixes for Windows multiple processor groups.
*Fix Fortran module build on Linux: offload attribute added.
*Fix entry names for distribute-parallel-loop construct to be consistent with the compiler codegen.
*Fix an inconsistent error message for KMP_PLACE_THREADS environment variable.
llvm-svn: 219214
2014-10-08 00:25:50 +08:00
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Quad precision: build the 128-bit entry points?
# The option defaults to whatever LIBOMP_HAVE_QUAD_PRECISION reports, and it
# is reported as an error to request the feature when it is not available.
# TODO: Make this a real feature check
set(LIBOMP_USE_QUAD_PRECISION "${LIBOMP_HAVE_QUAD_PRECISION}" CACHE BOOL
  "Should 128-bit precision entry points be built?")
if(LIBOMP_USE_QUAD_PRECISION)
  if(NOT LIBOMP_HAVE_QUAD_PRECISION)
    libomp_error_say("128-bit quad precision functionality requested but not available")
  endif()
endif()
|
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Versioned symbols, which libgomp drop-in compatibility requires.
# The option defaults to LIBOMP_HAVE_VERSION_SYMBOLS; asking for the feature
# when it is not available is reported as an error.
set(LIBOMP_USE_VERSION_SYMBOLS "${LIBOMP_HAVE_VERSION_SYMBOLS}" CACHE BOOL
  "Should version symbols be used? These provide binary compatibility with libgomp.")
if(LIBOMP_USE_VERSION_SYMBOLS)
  if(NOT LIBOMP_HAVE_VERSION_SYMBOLS)
    libomp_error_say("Version symbols functionality requested but not available")
  endif()
endif()
|
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Three independent on/off options, all disabled by default.

# Larger alignment, desired on multinode systems to avoid false sharing.
set(LIBOMP_USE_INTERNODE_ALIGNMENT FALSE CACHE BOOL
  "Should larger alignment (4096 bytes) be used for some locks and data structures?")

# Code that lets the OpenMP library conveniently interface with debuggers.
set(LIBOMP_USE_DEBUGGER FALSE CACHE BOOL
  "Enable debugger interface code?")

# Linking against the C++ library.
set(LIBOMP_USE_STDCPPLIB FALSE CACHE BOOL
  "Should we link to C++ library?")
|
2014-08-05 17:32:28 +08:00
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Adaptive (TSX, x86) locks. They contain __asm code which can be troublesome
# for some compilers, so the option defaults to LIBOMP_HAVE_ADAPTIVE_LOCKS and
# requesting it when unavailable is reported as an error.
# TODO: Make this a real feature check
set(LIBOMP_USE_ADAPTIVE_LOCKS "${LIBOMP_HAVE_ADAPTIVE_LOCKS}" CACHE BOOL
  "Should TSX-based lock be compiled (adaptive lock in kmp_lock.cpp).  These are x86 specific.")
if(LIBOMP_USE_ADAPTIVE_LOCKS)
  if(NOT LIBOMP_HAVE_ADAPTIVE_LOCKS)
    libomp_error_say("Adaptive locks (TSX) functionality requested but not available")
  endif()
endif()
|
|
|
|
|
2015-07-16 00:05:30 +08:00
|
|
|
# Stats-gathering: records OpenMP statistics such as the number of parallel
# regions and the clock ticks spent in particular OpenMP regions.
# TODO: Make this a real feature check
set(LIBOMP_STATS FALSE CACHE BOOL
  "Stats-Gathering functionality?")
if(LIBOMP_STATS)
  if(NOT LIBOMP_HAVE_STATS)
    libomp_error_say("Stats-gathering functionality requested but not available")
  endif()
  # The stats functionality requires the std c++ library
  set(LIBOMP_USE_STDCPPLIB TRUE)
endif()
|
2015-07-16 00:05:30 +08:00
|
|
|
|
|
|
|
# OMPT (OpenMP Tools Interface) options. Support itself is off by default;
# the blame and trace sub-options default to on. Requesting support when
# LIBOMP_HAVE_OMPT_SUPPORT is false is reported as an error.
# TODO: Make this a real feature check
set(LIBOMP_OMPT_SUPPORT FALSE CACHE BOOL "OMPT-support?")
set(LIBOMP_OMPT_BLAME   TRUE  CACHE BOOL "OMPT-blame?")
set(LIBOMP_OMPT_TRACE   TRUE  CACHE BOOL "OMPT-trace?")
if(LIBOMP_OMPT_SUPPORT AND NOT LIBOMP_HAVE_OMPT_SUPPORT)
  libomp_error_say("OpenMP Tools Interface requested but not available")
endif()
|
|
|
|
|
|
|
|
# Final library name. The default base name is "libomp", with "prof" appended
# for the profile library and "stubs" for the stubs library. The base name
# can be overridden through the LIBOMP_LIB_NAME cache entry; the file name is
# the base name plus the platform's shared-library suffix.
set(LIBOMP_DEFAULT_LIB_NAME libomp)
if(${PROFILE_LIBRARY})
  set(LIBOMP_DEFAULT_LIB_NAME "${LIBOMP_DEFAULT_LIB_NAME}prof")
endif()
if(${STUBS_LIBRARY})
  set(LIBOMP_DEFAULT_LIB_NAME "${LIBOMP_DEFAULT_LIB_NAME}stubs")
endif()
set(LIBOMP_LIB_NAME ${LIBOMP_DEFAULT_LIB_NAME} CACHE STRING "Base OMP library name")
set(LIBOMP_LIB_FILE ${LIBOMP_LIB_NAME}${CMAKE_SHARED_LIBRARY_SUFFIX})
|
2014-08-05 17:32:28 +08:00
|
|
|
|
|
|
|
# Report the configuration once every variable has been set. This is only
# done for standalone builds.
if(${LIBOMP_STANDALONE_BUILD})
  libomp_say("Operating System -- ${CMAKE_SYSTEM_NAME}")
  libomp_say("Target Architecture -- ${LIBOMP_ARCH}")
  if(${MIC})
    libomp_say("Intel(R) MIC Architecture -- ${LIBOMP_MIC_ARCH}")
  endif()
  libomp_say("Build Type -- ${CMAKE_BUILD_TYPE}")
  libomp_say("OpenMP Version -- ${LIBOMP_OMP_VERSION}")
  libomp_say("Lib Type -- ${LIBOMP_LIB_TYPE}")
  libomp_say("Fortran Modules -- ${LIBOMP_FORTRAN_MODULES}")

  # The build is reported by its number, except that an all-zero build number
  # is reported as "Development".
  set(LIBOMP_BUILD ${LIBOMP_VERSION_BUILD})
  if(${LIBOMP_VERSION_BUILD} STREQUAL 00000000)
    set(LIBOMP_BUILD Development)
  endif()
  libomp_say("Build -- ${LIBOMP_BUILD}")

  libomp_say("Use Stats-gathering -- ${LIBOMP_STATS}")
  libomp_say("Use Debugger-support -- ${LIBOMP_USE_DEBUGGER}")
  libomp_say("Use OMPT-support -- ${LIBOMP_OMPT_SUPPORT}")
  # The OMPT sub-options are only listed when OMPT support is enabled.
  if(${LIBOMP_OMPT_SUPPORT})
    libomp_say("Use OMPT-blame -- ${LIBOMP_OMPT_BLAME}")
    libomp_say("Use OMPT-trace -- ${LIBOMP_OMPT_TRACE}")
  endif()
  libomp_say("Use Adaptive locks -- ${LIBOMP_USE_ADAPTIVE_LOCKS}")
  libomp_say("Use quad precision -- ${LIBOMP_USE_QUAD_PRECISION}")
endif()
|
|
|
|
|
2015-06-12 01:23:57 +08:00
|
|
|
# Descend into the subdirectories: src/ first, then test/.
add_subdirectory(src)
add_subdirectory(test)
|
2014-06-02 02:01:33 +08:00
|
|
|
|