Skip to content

Commit 0b0d611

Browse files
authored
[Driver][SYCL] Add initial SYCL offload compilation support (#107493)
Introduces the SYCL-based toolchain and initial toolchain construction when using the '-fsycl' option. This option enables SYCL-based offloading, creating a SPIR-V based IR file packaged into the compiled host object. This includes early support for creating the host/device object using the new offloading model. The device object is created using the spir64-unknown-unknown target triple. New/Updated Options: '-fsycl' enables SYCL offloading for host and device; '-fsycl-device-only' enables device-only compilation for SYCL; '-fsycl-host-only' enables host-only compilation for SYCL. RFC Reference: https://discourse.llvm.org/t/rfc-sycl-driver-enhancements/74092
1 parent 58f107f commit 0b0d611

File tree

20 files changed

+532
-26
lines changed

20 files changed

+532
-26
lines changed

clang/include/clang/Driver/Action.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -94,6 +94,7 @@ class Action {
9494
OFK_Cuda = 0x02,
9595
OFK_OpenMP = 0x04,
9696
OFK_HIP = 0x08,
97+
OFK_SYCL = 0x10,
9798
};
9899

99100
static const char *getClassName(ActionClass AC);

clang/include/clang/Driver/Driver.h

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -582,6 +582,10 @@ class Driver {
582582
/// @name Helper Methods
583583
/// @{
584584

585+
/// getSYCLDeviceTriple - Returns the SYCL device triple for the
586+
/// specified target architecture name (TargetArch).
587+
llvm::Triple getSYCLDeviceTriple(StringRef TargetArch = "spir64") const;
588+
585589
/// PrintActions - Print the list of actions.
586590
void PrintActions(const Compilation &C) const;
587591

clang/include/clang/Driver/Options.td

Lines changed: 12 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -182,7 +182,8 @@ def opencl_Group : OptionGroup<"<opencl group>">, Group<f_Group>,
182182
DocName<"OpenCL options">;
183183

184184
def sycl_Group : OptionGroup<"<SYCL group>">, Group<f_Group>,
185-
DocName<"SYCL options">;
185+
DocName<"SYCL options">,
186+
Visibility<[ClangOption, CLOption]>;
186187

187188
def cuda_Group : OptionGroup<"<CUDA group>">, Group<f_Group>,
188189
DocName<"CUDA options">,
@@ -6780,16 +6781,20 @@ defm : FlangIgnoredDiagOpt<"frontend-loop-interchange">;
67806781
defm : FlangIgnoredDiagOpt<"target-lifetime">;
67816782

67826783
// C++ SYCL options
6784+
let Group = sycl_Group in {
67836785
def fsycl : Flag<["-"], "fsycl">,
6784-
Visibility<[ClangOption, CLOption]>,
6785-
Group<sycl_Group>, HelpText<"Enables SYCL kernels compilation for device">;
6786+
HelpText<"Enables SYCL kernels compilation for device">;
67866787
def fno_sycl : Flag<["-"], "fno-sycl">,
6787-
Visibility<[ClangOption, CLOption]>,
6788-
Group<sycl_Group>, HelpText<"Disables SYCL kernels compilation for device">;
6788+
HelpText<"Disables SYCL kernels compilation for device">;
6789+
def fsycl_device_only : Flag<["-"], "fsycl-device-only">,
6790+
Alias<offload_device_only>, HelpText<"Compile SYCL kernels for device only">;
6791+
def fsycl_host_only : Flag<["-"], "fsycl-host-only">,
6792+
Alias<offload_host_only>, HelpText<"Compile SYCL kernels for host only">;
67896793
def sycl_link : Flag<["--"], "sycl-link">, Flags<[HelpHidden]>,
6790-
Visibility<[ClangOption, CLOption]>,
6791-
Group<sycl_Group>, HelpText<"Perform link through clang-sycl-linker via the target "
6794+
HelpText<"Perform link through clang-sycl-linker via the target "
67926795
"offloading toolchain.">;
6796+
} // let Group = sycl_Group
6797+
67936798
// OS-specific options
67946799
let Flags = [TargetSpecific] in {
67956800
defm android_pad_segment : BooleanFFlag<"android-pad-segment">, Group<f_Group>;

clang/include/clang/Driver/ToolChain.h

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -762,6 +762,10 @@ class ToolChain {
762762
virtual void AddHIPIncludeArgs(const llvm::opt::ArgList &DriverArgs,
763763
llvm::opt::ArgStringList &CC1Args) const;
764764

765+
/// Add arguments to use system-specific SYCL includes.
766+
virtual void AddSYCLIncludeArgs(const llvm::opt::ArgList &DriverArgs,
767+
llvm::opt::ArgStringList &CC1Args) const;
768+
765769
/// Add arguments to use MCU GCC toolchain includes.
766770
virtual void AddIAMCUIncludeArgs(const llvm::opt::ArgList &DriverArgs,
767771
llvm::opt::ArgStringList &CC1Args) const;

clang/lib/Driver/Action.cpp

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -111,6 +111,8 @@ std::string Action::getOffloadingKindPrefix() const {
111111
return "device-openmp";
112112
case OFK_HIP:
113113
return "device-hip";
114+
case OFK_SYCL:
115+
return "device-sycl";
114116

115117
// TODO: Add other programming models here.
116118
}
@@ -128,6 +130,8 @@ std::string Action::getOffloadingKindPrefix() const {
128130
Res += "-hip";
129131
if (ActiveOffloadKindMask & OFK_OpenMP)
130132
Res += "-openmp";
133+
if (ActiveOffloadKindMask & OFK_SYCL)
134+
Res += "-sycl";
131135

132136
// TODO: Add other programming models here.
133137

@@ -164,6 +168,8 @@ StringRef Action::GetOffloadKindName(OffloadKind Kind) {
164168
return "openmp";
165169
case OFK_HIP:
166170
return "hip";
171+
case OFK_SYCL:
172+
return "sycl";
167173

168174
// TODO: Add other programming models here.
169175
}
@@ -320,7 +326,7 @@ void OffloadAction::DeviceDependences::add(Action &A, const ToolChain &TC,
320326
DeviceBoundArchs.push_back(BoundArch);
321327

322328
// Add each active offloading kind from a mask.
323-
for (OffloadKind OKind : {OFK_OpenMP, OFK_Cuda, OFK_HIP})
329+
for (OffloadKind OKind : {OFK_OpenMP, OFK_Cuda, OFK_HIP, OFK_SYCL})
324330
if (OKind & OffloadKindMask)
325331
DeviceOffloadKinds.push_back(OKind);
326332
}

clang/lib/Driver/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,7 @@ add_clang_library(clangDriver
7777
ToolChains/RISCVToolchain.cpp
7878
ToolChains/Solaris.cpp
7979
ToolChains/SPIRV.cpp
80+
ToolChains/SYCL.cpp
8081
ToolChains/TCE.cpp
8182
ToolChains/UEFI.cpp
8283
ToolChains/VEToolchain.cpp

clang/lib/Driver/Compilation.cpp

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -217,10 +217,11 @@ static bool ActionFailed(const Action *A,
217217
if (FailingCommands.empty())
218218
return false;
219219

220-
// CUDA/HIP can have the same input source code compiled multiple times so do
221-
// not compiled again if there are already failures. It is OK to abort the
222-
// CUDA pipeline on errors.
223-
if (A->isOffloading(Action::OFK_Cuda) || A->isOffloading(Action::OFK_HIP))
220+
// CUDA/HIP/SYCL can have the same input source code compiled multiple times
221+
// so do not compile again if there are already failures. It is OK to abort
222+
// the CUDA/HIP/SYCL pipeline on errors.
223+
if (A->isOffloading(Action::OFK_Cuda) || A->isOffloading(Action::OFK_HIP) ||
224+
A->isOffloading(Action::OFK_SYCL))
224225
return true;
225226

226227
for (const auto &CI : FailingCommands)

clang/lib/Driver/Driver.cpp

Lines changed: 94 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,7 @@
4343
#include "ToolChains/PS4CPU.h"
4444
#include "ToolChains/RISCVToolchain.h"
4545
#include "ToolChains/SPIRV.h"
46+
#include "ToolChains/SYCL.h"
4647
#include "ToolChains/Solaris.h"
4748
#include "ToolChains/TCE.h"
4849
#include "ToolChains/UEFI.h"
@@ -781,6 +782,27 @@ Driver::OpenMPRuntimeKind Driver::getOpenMPRuntime(const ArgList &Args) const {
781782
return RT;
782783
}
783784

785+
static const char *getDefaultSYCLArch(Compilation &C) {
786+
// If -fsycl is supplied we will assume SPIR-V
787+
if (C.getDefaultToolChain().getTriple().isArch32Bit())
788+
return "spirv32";
789+
return "spirv64";
790+
}
791+
792+
static bool addSYCLDefaultTriple(Compilation &C,
793+
SmallVectorImpl<llvm::Triple> &SYCLTriples) {
794+
for (const auto &SYCLTriple : SYCLTriples) {
795+
if (SYCLTriple.getSubArch() == llvm::Triple::NoSubArch &&
796+
SYCLTriple.isSPIROrSPIRV())
797+
return false;
798+
}
799+
// Add the default triple as it was not found.
800+
llvm::Triple DefaultTriple =
801+
C.getDriver().getSYCLDeviceTriple(getDefaultSYCLArch(C));
802+
SYCLTriples.insert(SYCLTriples.begin(), DefaultTriple);
803+
return true;
804+
}
805+
784806
void Driver::CreateOffloadingDeviceToolChains(Compilation &C,
785807
InputList &Inputs) {
786808

@@ -994,6 +1016,41 @@ void Driver::CreateOffloadingDeviceToolChains(Compilation &C,
9941016
return;
9951017
}
9961018

1019+
//
1020+
// SYCL
1021+
//
1022+
// We need to generate a SYCL toolchain if the user specified -fsycl.
1023+
bool IsSYCL = C.getInputArgs().hasFlag(options::OPT_fsycl,
1024+
options::OPT_fno_sycl, false);
1025+
1026+
auto argSYCLIncompatible = [&](OptSpecifier OptId) {
1027+
if (!IsSYCL)
1028+
return;
1029+
if (Arg *IncompatArg = C.getInputArgs().getLastArg(OptId))
1030+
Diag(clang::diag::err_drv_argument_not_allowed_with)
1031+
<< IncompatArg->getSpelling() << "-fsycl";
1032+
};
1033+
// -static-libstdc++ is not compatible with -fsycl.
1034+
argSYCLIncompatible(options::OPT_static_libstdcxx);
1035+
// -ffreestanding cannot be used with -fsycl
1036+
argSYCLIncompatible(options::OPT_ffreestanding);
1037+
1038+
llvm::SmallVector<llvm::Triple, 4> UniqueSYCLTriplesVec;
1039+
1040+
if (IsSYCL) {
1041+
addSYCLDefaultTriple(C, UniqueSYCLTriplesVec);
1042+
1043+
// We'll need to use the SYCL and host triples as the key into
1044+
// getOffloadingDeviceToolChain, because the device toolchains we're
1045+
// going to create will depend on both.
1046+
const ToolChain *HostTC = C.getSingleOffloadToolChain<Action::OFK_Host>();
1047+
for (const auto &TT : UniqueSYCLTriplesVec) {
1048+
auto SYCLTC = &getOffloadingDeviceToolChain(C.getInputArgs(), TT, *HostTC,
1049+
Action::OFK_SYCL);
1050+
C.addOffloadDeviceToolChain(SYCLTC, Action::OFK_SYCL);
1051+
}
1052+
}
1053+
9971054
//
9981055
// TODO: Add support for other offloading programming models here.
9991056
//
@@ -2027,6 +2084,20 @@ void Driver::PrintHelp(bool ShowHidden) const {
20272084
VisibilityMask);
20282085
}
20292086

2087+
llvm::Triple Driver::getSYCLDeviceTriple(StringRef TargetArch) const {
2088+
SmallVector<StringRef, 5> SYCLAlias = {"spir", "spir64", "spirv32",
2089+
"spirv64"};
2090+
if (std::find(SYCLAlias.begin(), SYCLAlias.end(), TargetArch) !=
2091+
SYCLAlias.end()) {
2092+
llvm::Triple TT;
2093+
TT.setArchName(TargetArch);
2094+
TT.setVendor(llvm::Triple::UnknownVendor);
2095+
TT.setOS(llvm::Triple::UnknownOS);
2096+
return TT;
2097+
}
2098+
return llvm::Triple(TargetArch);
2099+
}
2100+
20302101
void Driver::PrintVersion(const Compilation &C, raw_ostream &OS) const {
20312102
if (IsFlangMode()) {
20322103
OS << getClangToolFullVersion("flang") << '\n';
@@ -4184,6 +4255,7 @@ void Driver::BuildActions(Compilation &C, DerivedArgList &Args,
41844255

41854256
bool UseNewOffloadingDriver =
41864257
C.isOffloadingHostKind(Action::OFK_OpenMP) ||
4258+
C.isOffloadingHostKind(Action::OFK_SYCL) ||
41874259
Args.hasFlag(options::OPT_foffload_via_llvm,
41884260
options::OPT_fno_offload_via_llvm, false) ||
41894261
Args.hasFlag(options::OPT_offload_new_driver,
@@ -4594,6 +4666,8 @@ Driver::getOffloadArchs(Compilation &C, const llvm::opt::DerivedArgList &Args,
45944666
Archs.insert(OffloadArchToString(OffloadArch::HIPDefault));
45954667
else if (Kind == Action::OFK_OpenMP)
45964668
Archs.insert(StringRef());
4669+
else if (Kind == Action::OFK_SYCL)
4670+
Archs.insert(StringRef());
45974671
} else {
45984672
Args.ClaimAllArgs(options::OPT_offload_arch_EQ);
45994673
Args.ClaimAllArgs(options::OPT_no_offload_arch_EQ);
@@ -4618,7 +4692,7 @@ Action *Driver::BuildOffloadingActions(Compilation &C,
46184692
OffloadAction::DeviceDependences DDeps;
46194693

46204694
const Action::OffloadKind OffloadKinds[] = {
4621-
Action::OFK_OpenMP, Action::OFK_Cuda, Action::OFK_HIP};
4695+
Action::OFK_OpenMP, Action::OFK_Cuda, Action::OFK_HIP, Action::OFK_SYCL};
46224696

46234697
for (Action::OffloadKind Kind : OffloadKinds) {
46244698
SmallVector<const ToolChain *, 2> ToolChains;
@@ -4663,6 +4737,11 @@ Action *Driver::BuildOffloadingActions(Compilation &C,
46634737
break;
46644738
}
46654739

4740+
// Assemble actions are not used for the SYCL device side. Both compile
4741+
// and backend actions are used to generate IR and textual IR if needed.
4742+
if (Kind == Action::OFK_SYCL && Phase == phases::Assemble)
4743+
continue;
4744+
46664745
auto TCAndArch = TCAndArchs.begin();
46674746
for (Action *&A : DeviceActions) {
46684747
if (A->getType() == types::TY_Nothing)
@@ -4901,6 +4980,7 @@ Action *Driver::ConstructPhaseAction(
49014980
return C.MakeAction<BackendJobAction>(Input, Output);
49024981
}
49034982
if (Args.hasArg(options::OPT_emit_llvm) ||
4983+
TargetDeviceOffloadKind == Action::OFK_SYCL ||
49044984
(((Input->getOffloadingToolChain() &&
49054985
Input->getOffloadingToolChain()->getTriple().isAMDGPU()) ||
49064986
TargetDeviceOffloadKind == Action::OFK_HIP) &&
@@ -6592,6 +6672,19 @@ const ToolChain &Driver::getOffloadingDeviceToolChain(
65926672
HostTC, Args);
65936673
break;
65946674
}
6675+
case Action::OFK_SYCL:
6676+
switch (Target.getArch()) {
6677+
case llvm::Triple::spir:
6678+
case llvm::Triple::spir64:
6679+
case llvm::Triple::spirv32:
6680+
case llvm::Triple::spirv64:
6681+
TC = std::make_unique<toolchains::SYCLToolChain>(*this, Target, HostTC,
6682+
Args);
6683+
break;
6684+
default:
6685+
break;
6686+
}
6687+
break;
65956688
default:
65966689
break;
65976690
}

clang/lib/Driver/ToolChain.cpp

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1487,6 +1487,9 @@ void ToolChain::AddCudaIncludeArgs(const ArgList &DriverArgs,
14871487
void ToolChain::AddHIPIncludeArgs(const ArgList &DriverArgs,
14881488
ArgStringList &CC1Args) const {}
14891489

1490+
void ToolChain::AddSYCLIncludeArgs(const ArgList &DriverArgs,
1491+
ArgStringList &CC1Args) const {}
1492+
14901493
llvm::SmallVector<ToolChain::BitCodeLibraryInfo, 12>
14911494
ToolChain::getDeviceLibs(const ArgList &DriverArgs) const {
14921495
return {};

0 commit comments

Comments
 (0)