llama.cpp/ggml/src/ggml-sycl/CMakeLists.txt

if (NOT GGML_SYCL_TARGET MATCHES "^(INTEL|NVIDIA|AMD)$")
    message(FATAL_ERROR "Invalid backend chosen, supported options are INTEL, NVIDIA, or AMD")
endif()

check_cxx_compiler_flag("-fsycl" SUPPORTS_SYCL)

if (DEFINED ENV{ONEAPI_ROOT})
    message(STATUS "Using oneAPI Release SYCL compiler (icpx).")
elseif(SUPPORTS_SYCL)
    message(WARNING "Using open-source SYCL compiler (clang++). Didn't detect ENV {ONEAPI_ROOT}.
        If you expected the oneAPI Release compiler, please install oneAPI & source it, like:
        source /opt/intel/oneapi/setvars.sh")
else()
    message(FATAL_ERROR, "C++ compiler lacks SYCL support.")
endif()
message(STATUS "SYCL found")
#todo: AOT

add_library(ggml-sycl
            ggml-sycl.cpp
            ../../include/ggml-sycl.h)

target_link_libraries(ggml-sycl PRIVATE ggml-base)
target_include_directories(ggml-sycl PRIVATE . ..)

if (GGML_SYCL_F16)
    if (GGML_SYCL_TARGET STREQUAL "AMD")
        message(WARNING "AMD target does not entirely support FP16 in the SYCL backend.")
    endif()
    add_compile_definitions(GGML_SYCL_F16)
endif()

set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-narrowing -fsycl")

if (GGML_SYCL_TARGET STREQUAL "NVIDIA")
    add_compile_definitions(GGML_SYCL_WARP_SIZE=32)
elseif (GGML_SYCL_TARGET STREQUAL "AMD")
    # INFO: Allowed Sub_group_sizes are not consistent through all
    # hip targets. For example, 64 is used for certain models, but the backend
    # does not support it.
    # Target archs tested working: gfx1030, gfx1031, (Only tested sub_group_size = 32)
    add_compile_definitions(GGML_SYCL_WARP_SIZE=32)
else()
    add_compile_definitions(GGML_SYCL_WARP_SIZE=16)
endif()

file(GLOB   GGML_HEADERS_SYCL "*.hpp")
file(GLOB   GGML_SOURCES_SYCL "*.cpp")
target_sources(ggml-sycl PRIVATE ${GGML_HEADERS_SYCL} ${GGML_SOURCES_SYCL})

find_package(DNNL)
message("-- DNNL found:" ${DNNL_FOUND})

if (GGML_SYCL_TARGET STREQUAL "INTEL")
    add_compile_definitions(GGML_SYCL_DNNL=${DNNL_FOUND})
else()
    add_compile_definitions(GGML_SYCL_DNNL=0)
endif()

if (${DNNL_FOUND} AND GGML_SYCL_TARGET STREQUAL "INTEL")
    target_link_libraries(ggml-sycl PRIVATE DNNL::dnnl)
endif()

if (WIN32)
    find_package(IntelSYCL REQUIRED)
    find_package(MKL REQUIRED)
    target_link_libraries(ggml-sycl PRIVATE IntelSYCL::SYCL_CXX MKL::MKL MKL::MKL_SYCL)
else()
    if (GGML_SYCL_TARGET STREQUAL "INTEL")
        target_link_libraries(ggml-sycl PRIVATE sycl OpenCL mkl_core pthread m dl mkl_sycl_blas mkl_intel_ilp64 mkl_tbb_thread)
    elseif (GGML_SYCL_TARGET STREQUAL "NVIDIA")
        set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsycl-targets=nvptx64-nvidia-cuda")
        target_link_libraries(ggml-sycl PRIVATE sycl pthread m dl onemkl)
    elseif (GGML_SYCL_TARGET STREQUAL "AMD")
        if (GGML_SYCL_HIP_TARGET STREQUAL "")
            message(ERROR "Can't enable SYCL hip backend, GGML_SYCL_HIP_TARGET has not been set.")
        endif()
        set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsycl-targets=amdgcn-amd-amdhsa -Xsycl-target-backend --offload-arch=${GGML_SYCL_HIP_TARGET}")
        target_link_libraries(ggml-sycl PRIVATE sycl pthread m dl onemkl)
    endif()
endif()
ggml : build backends as libraries (#10256) * ggml : build backends as libraries --------- Signed-off-by: Xiaodong Ye <xiaodong.ye@mthreads.com> Co-authored-by: Georgi Gerganov <ggerganov@gmail.com> Co-authored-by: R0CKSTAR <xiaodong.ye@mthreads.com> 2024-11-14 18:04:35 +01:00			`if (NOT GGML_SYCL_TARGET MATCHES "^(INTEL\|NVIDIA\|AMD)$")`
			`message(FATAL_ERROR "Invalid backend chosen, supported options are INTEL, NVIDIA, or AMD")`
			`endif()`

			`check_cxx_compiler_flag("-fsycl" SUPPORTS_SYCL)`

			`if (DEFINED ENV{ONEAPI_ROOT})`
			`message(STATUS "Using oneAPI Release SYCL compiler (icpx).")`
			`elseif(SUPPORTS_SYCL)`
			`message(WARNING "Using open-source SYCL compiler (clang++). Didn't detect ENV {ONEAPI_ROOT}.`
			`If you expected the oneAPI Release compiler, please install oneAPI & source it, like:`
			`source /opt/intel/oneapi/setvars.sh")`
			`else()`
			`message(FATAL_ERROR, "C++ compiler lacks SYCL support.")`
			`endif()`
			`message(STATUS "SYCL found")`
			`#todo: AOT`

			`add_library(ggml-sycl`
			`ggml-sycl.cpp`
			`../../include/ggml-sycl.h)`

			`target_link_libraries(ggml-sycl PRIVATE ggml-base)`
			`target_include_directories(ggml-sycl PRIVATE . ..)`

			`if (GGML_SYCL_F16)`
			`if (GGML_SYCL_TARGET STREQUAL "AMD")`
			`message(WARNING "AMD target does not entirely support FP16 in the SYCL backend.")`
			`endif()`
			`add_compile_definitions(GGML_SYCL_F16)`
			`endif()`

			`set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-narrowing -fsycl")`

			`if (GGML_SYCL_TARGET STREQUAL "NVIDIA")`
			`add_compile_definitions(GGML_SYCL_WARP_SIZE=32)`
			`elseif (GGML_SYCL_TARGET STREQUAL "AMD")`
			`# INFO: Allowed Sub_group_sizes are not consistent through all`
			`# hip targets. For example, 64 is used for certain models, but the backend`
			`# does not support it.`
			`# Target archs tested working: gfx1030, gfx1031, (Only tested sub_group_size = 32)`
			`add_compile_definitions(GGML_SYCL_WARP_SIZE=32)`
			`else()`
			`add_compile_definitions(GGML_SYCL_WARP_SIZE=16)`
			`endif()`

			`file(GLOB GGML_HEADERS_SYCL "*.hpp")`
			`file(GLOB GGML_SOURCES_SYCL "*.cpp")`
			`target_sources(ggml-sycl PRIVATE ${GGML_HEADERS_SYCL} ${GGML_SOURCES_SYCL})`

			`find_package(DNNL)`
			`message("-- DNNL found:" ${DNNL_FOUND})`

			`if (GGML_SYCL_TARGET STREQUAL "INTEL")`
			`add_compile_definitions(GGML_SYCL_DNNL=${DNNL_FOUND})`
			`else()`
			`add_compile_definitions(GGML_SYCL_DNNL=0)`
			`endif()`

			`if (${DNNL_FOUND} AND GGML_SYCL_TARGET STREQUAL "INTEL")`
			`target_link_libraries(ggml-sycl PRIVATE DNNL::dnnl)`
			`endif()`

			`if (WIN32)`
			`find_package(IntelSYCL REQUIRED)`
			`find_package(MKL REQUIRED)`
			`target_link_libraries(ggml-sycl PRIVATE IntelSYCL::SYCL_CXX MKL::MKL MKL::MKL_SYCL)`
			`else()`
			`if (GGML_SYCL_TARGET STREQUAL "INTEL")`
			`target_link_libraries(ggml-sycl PRIVATE sycl OpenCL mkl_core pthread m dl mkl_sycl_blas mkl_intel_ilp64 mkl_tbb_thread)`
			`elseif (GGML_SYCL_TARGET STREQUAL "NVIDIA")`
			`set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsycl-targets=nvptx64-nvidia-cuda")`
			`target_link_libraries(ggml-sycl PRIVATE sycl pthread m dl onemkl)`
			`elseif (GGML_SYCL_TARGET STREQUAL "AMD")`
			`if (GGML_SYCL_HIP_TARGET STREQUAL "")`
			`message(ERROR "Can't enable SYCL hip backend, GGML_SYCL_HIP_TARGET has not been set.")`
			`endif()`
			`set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fsycl-targets=amdgcn-amd-amdhsa -Xsycl-target-backend --offload-arch=${GGML_SYCL_HIP_TARGET}")`
			`target_link_libraries(ggml-sycl PRIVATE sycl pthread m dl onemkl)`
			`endif()`
			`endif()`