intel
diff --git a/‎clang/lib/CodeGen/BackendUtil.cpp
Lines changed: 16 additions & 54 deletions b/‎clang/lib/CodeGen/BackendUtil.cpp
Lines changed: 16 additions & 54 deletions
diff --git a/‎clang/lib/Driver/ToolChains/MSVC.cpp
Lines changed: 3 additions & 0 deletions b/‎clang/lib/Driver/ToolChains/MSVC.cpp
Lines changed: 3 additions & 0 deletions
diff --git a/‎clang/test/Driver/suppress_LNK4221_intelfpga_sycl-link.cpp
Lines changed: 6 additions & 0 deletions b/‎clang/test/Driver/suppress_LNK4221_intelfpga_sycl-link.cpp
Lines changed: 6 additions & 0 deletions
diff --git a/‎llvm/lib/Target/NVPTX/SYCL/GlobalOffset.cpp
Lines changed: 4 additions & 4 deletions b/‎llvm/lib/Target/NVPTX/SYCL/GlobalOffset.cpp
Lines changed: 4 additions & 4 deletions
diff --git a/‎sycl/include/CL/__spirv/spirv_ops.hpp
Lines changed: 234 additions & 8 deletions b/‎sycl/include/CL/__spirv/spirv_ops.hpp
Lines changed: 234 additions & 8 deletions
@@ -42,7 +42,6 @@
 #include "llvm/Passes/StandardInstrumentations.h"
 #include "llvm/Support/BuryPointer.h"
 #include "llvm/Support/CommandLine.h"
-#include "llvm/Support/Debug.h"
 #include "llvm/Support/MemoryBuffer.h"
 #include "llvm/Support/PrettyStackTrace.h"
 #include "llvm/Support/TargetRegistry.h"
@@ -82,11 +81,6 @@
 #include "llvm/Transforms/Utils/SymbolRewriter.h"
 #include "llvm/Transforms/Utils/UniqueInternalLinkageNames.h"
 #include <memory>
-
-namespace SPIRV {
-  extern llvm::cl::opt<bool> SPIRVNoDerefAttr;
-}
-
 using namespace clang;
 using namespace llvm;
 
@@ -622,54 +616,22 @@ void EmitAssemblyHelper::CreatePasses(legacy::PassManager &MPM,
          CodeGenOpts.PrepareForThinLTO));
   }
 
-  // FIXME: This code is a workaround for a number of problems with optimized
-  // SYCL code for the SPIR target. This change trying to balance between doing
-  // too few and too many optimizations. The current approach is to disable as
-  // much as possible just to keep the compiler functional. Eventually we can
-  // consider allowing -On option to configure the optimization set for the FE
-  // device compiler as well, but before that we must fix all the functional and
-  // performance issues caused by LLVM transformantions.
-  // E.g. LLVM optimizations make use of llvm intrinsics, instructions, data
-  // types, etc., which are not supported by the SPIR-V translator (current
-  // "back-end" for SYCL device compiler).
-  // NOTE: We use "normal" inliner (i.e. from O2/O3), but limit the rest of
-  // optimization pipeline. Inliner is a must for enabling size reduction
-  // optimizations.
-  if (LangOpts.SYCLIsDevice && TargetTriple.isSPIR()) {
-    PMBuilder.OptLevel = 1;
-    PMBuilder.SizeLevel = 2;
-    PMBuilder.SLPVectorize = false;
-    PMBuilder.LoopVectorize = false;
-    PMBuilder.DivergentTarget = true;
-    PMBuilder.DisableGVNLoadPRE = true;
-    PMBuilder.ForgetAllSCEVInLoopUnroll = true;
-
-    PMBuilder.DisableUnrollLoops = true;
-    // Loop interleaving in the loop vectorizer has historically been set to be
-    // enabled when loop unrolling is enabled.
-    PMBuilder.LoopsInterleaved = false;
-    PMBuilder.MergeFunctions = false;
-    PMBuilder.PrepareForThinLTO = false;
-    PMBuilder.PrepareForLTO = false;
-    PMBuilder.RerollLoops = false;
-  } else {
-    PMBuilder.OptLevel = CodeGenOpts.OptimizationLevel;
-    PMBuilder.SizeLevel = CodeGenOpts.OptimizeSize;
-    PMBuilder.SLPVectorize = CodeGenOpts.VectorizeSLP;
-    PMBuilder.LoopVectorize = CodeGenOpts.VectorizeLoop;
-    // Only enable CGProfilePass when using integrated assembler, since
-    // non-integrated assemblers don't recognize .cgprofile section.
-    PMBuilder.CallGraphProfile = !CodeGenOpts.DisableIntegratedAS;
-
-    PMBuilder.DisableUnrollLoops = !CodeGenOpts.UnrollLoops;
-    // Loop interleaving in the loop vectorizer has historically been set to be
-    // enabled when loop unrolling is enabled.
-    PMBuilder.LoopsInterleaved = CodeGenOpts.UnrollLoops;
-    PMBuilder.MergeFunctions = CodeGenOpts.MergeFunctions;
-    PMBuilder.PrepareForThinLTO = CodeGenOpts.PrepareForThinLTO;
-    PMBuilder.PrepareForLTO = CodeGenOpts.PrepareForLTO;
-    PMBuilder.RerollLoops = CodeGenOpts.RerollLoops;
-  }
+  PMBuilder.OptLevel = CodeGenOpts.OptimizationLevel;
+  PMBuilder.SizeLevel = CodeGenOpts.OptimizeSize;
+  PMBuilder.SLPVectorize = CodeGenOpts.VectorizeSLP;
+  PMBuilder.LoopVectorize = CodeGenOpts.VectorizeLoop;
+  // Only enable CGProfilePass when using integrated assembler, since
+  // non-integrated assemblers don't recognize .cgprofile section.
+  PMBuilder.CallGraphProfile = !CodeGenOpts.DisableIntegratedAS;
+
+  PMBuilder.DisableUnrollLoops = !CodeGenOpts.UnrollLoops;
+  // Loop interleaving in the loop vectorizer has historically been set to be
+  // enabled when loop unrolling is enabled.
+  PMBuilder.LoopsInterleaved = CodeGenOpts.UnrollLoops;
+  PMBuilder.MergeFunctions = CodeGenOpts.MergeFunctions;
+  PMBuilder.PrepareForThinLTO = CodeGenOpts.PrepareForThinLTO;
+  PMBuilder.PrepareForLTO = CodeGenOpts.PrepareForLTO;
+  PMBuilder.RerollLoops = CodeGenOpts.RerollLoops;
 
   MPM.add(new TargetLibraryInfoWrapperPass(*TLII));
 
 
@@ -322,6 +322,9 @@ void visualstudio::Linker::constructMSVCLibCommand(Compilation &C,
     }
     CmdArgs.push_back(II.getFilename());
   }
+  if (Args.hasArg(options::OPT_fsycl_link_EQ) &&
+      Args.hasArg(options::OPT_fintelfpga))
+    CmdArgs.push_back("/IGNORE:4221");
   CmdArgs.push_back(
       C.getArgs().MakeArgString(Twine("-OUT:") + Output.getFilename()));
 
 
@@ -0,0 +1,6 @@
+// REQUIRES: system-windows
+// RUN:  %clangxx -target x86_64-pc-windows-msvc -fsycl -fintelfpga -fsycl-link -Xshardware %s -### 2>&1 \
+// RUN:  | FileCheck %s
+// RUN:  %clang_cl -target x86_64-pc-windows-msvc -fsycl -fintelfpga -fsycl-link -Xshardware %s -### 2>&1 \
+// RUN:  | FileCheck %s
+// CHECK: /IGNORE:4221
@@ -259,6 +259,9 @@ class GlobalOffset : public ModulePass {
     Function *NewFunc = Function::Create(NewFuncTy, Func->getLinkage(),
                                          Func->getAddressSpace());
 
+    // Keep original function ordering.
+    M.getFunctionList().insertAfter(Func->getIterator(), NewFunc);
+
     if (KeepOriginal) {
       // TODO: Are there better naming alternatives that allow for unmangling?
       NewFunc->setName(Func->getName() + "_with_offset");
@@ -272,7 +275,7 @@ class GlobalOffset : public ModulePass {
       }
 
       SmallVector<ReturnInst *, 8> Returns;
-      CloneFunctionInto(NewFunc, Func, VMap, /*ModuleLevelChanges=*/false,
+      CloneFunctionInto(NewFunc, Func, VMap, /*ModuleLevelChanges=*/true,
                         Returns);
     } else {
       NewFunc->copyAttributesFrom(Func);
@@ -298,9 +301,6 @@ class GlobalOffset : public ModulePass {
         NewFunc->addMetadata(MD.first, *MD.second);
     }
 
-    // Keep original function ordering.
-    M.getFunctionList().insertAfter(Func->getIterator(), NewFunc);
-
     Value *ImplicitOffset = NewFunc->arg_begin() + (NewFunc->arg_size() - 1);
     // Add bitcast to match the return type of the intrinsic if needed.
     if (ImplicitArgumentType != ImplicitOffsetPtrType) {
 
@@ -205,6 +205,14 @@ __SYCL_CONVERGENT__ extern SYCL_EXTERNAL void
 __spirv_SubgroupBlockWriteINTEL(__attribute__((opencl_global)) uint32_t *Ptr,
                                 dataT Data) noexcept;
 
+template <typename dataT>
+__SYCL_CONVERGENT__ extern SYCL_EXTERNAL dataT __spirv_SubgroupBlockReadINTEL(
+    const __attribute__((opencl_global)) uint64_t *Ptr) noexcept;
+
+template <typename dataT>
+__SYCL_CONVERGENT__ extern SYCL_EXTERNAL void
+__spirv_SubgroupBlockWriteINTEL(__attribute__((opencl_global)) uint64_t *Ptr,
+                                dataT Data) noexcept;
 template <int W, int rW>
 extern SYCL_EXTERNAL ap_int<rW>
 __spirv_FixedSqrtINTEL(ap_int<W> a, bool S, int32_t I, int32_t rI,
@@ -256,14 +264,232 @@ extern SYCL_EXTERNAL ap_int<rW>
 __spirv_FixedExpINTEL(ap_int<W> a, bool S, int32_t I, int32_t rI,
                       int32_t Quantization = 0, int32_t Overflow = 0) noexcept;
 
-template <typename dataT>
-__SYCL_CONVERGENT__ extern SYCL_EXTERNAL dataT __spirv_SubgroupBlockReadINTEL(
-    const __attribute__((opencl_global)) uint64_t *Ptr) noexcept;
-
-template <typename dataT>
-__SYCL_CONVERGENT__ extern SYCL_EXTERNAL void
-__spirv_SubgroupBlockWriteINTEL(__attribute__((opencl_global)) uint64_t *Ptr,
-                                dataT Data) noexcept;
+// In the following built-ins, the width of the arbitrary precision integer
+// type holding a floating point value should equal the sum of its exponent
+// width E, its mantissa width M and 1 for the sign bit, i.e. WA = EA + MA + 1.
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatCastINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatCastFromIntINTEL(
+    ap_int<WA> A, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatCastToIntINTEL(
+    ap_int<WA> A, int32_t MA, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatAddINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatSubINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatMulINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatDivINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+// Comparison built-ins don't use Subnormal Support, Rounding Mode and
+// Rounding Accuracy.
+template <int WA, int WB>
+extern SYCL_EXTERNAL bool
+__spirv_ArbitraryFloatGTINTEL(ap_int<WA> A, int32_t MA, ap_int<WB> B,
+                              int32_t MB) noexcept;
+
+template <int WA, int WB>
+extern SYCL_EXTERNAL bool
+__spirv_ArbitraryFloatGEINTEL(ap_int<WA> A, int32_t MA, ap_int<WB> B,
+                              int32_t MB) noexcept;
+
+template <int WA, int WB>
+extern SYCL_EXTERNAL bool
+__spirv_ArbitraryFloatLTINTEL(ap_int<WA> A, int32_t MA, ap_int<WB> B,
+                              int32_t MB) noexcept;
+
+template <int WA, int WB>
+extern SYCL_EXTERNAL bool
+__spirv_ArbitraryFloatLEINTEL(ap_int<WA> A, int32_t MA, ap_int<WB> B,
+                              int32_t MB) noexcept;
+
+template <int WA, int WB>
+extern SYCL_EXTERNAL bool
+__spirv_ArbitraryFloatEQINTEL(ap_int<WA> A, int32_t MA, ap_int<WB> B,
+                              int32_t MB) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatRecipINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatRSqrtINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatCbrtINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatHypotINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatSqrtINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatLogINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatLog2INTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatLog10INTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatLog1pINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatExpINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatExp2INTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatExp10INTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatExpm1INTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatSinINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatCosINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+// The result contains both the sine and the cosine values, so its size is
+// 2 * Wout, where Wout is equal to (1 + Eout + Mout).
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<2 * Wout> __spirv_ArbitraryFloatSinCosINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatSinPiINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatCosPiINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+// Result value contains both values of sine(A*pi) and cosine(A*pi) and so has
+// the size of 2 * Wout where Wout is equal to (1 + Eout + Mout).
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<2 * Wout> __spirv_ArbitraryFloatSinCosPiINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatASinINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatASinPiINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatACosINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatACosPiINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatATanINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatATanPiINTEL(
+    ap_int<WA> A, int32_t MA, int32_t Mout, int32_t EnableSubnormals = 0,
+    int32_t RoundingMode = 0, int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatATan2INTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatPowINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout> __spirv_ArbitraryFloatPowRINTEL(
+    ap_int<WA> A, int32_t MA, ap_int<WB> B, int32_t MB, int32_t Mout,
+    int32_t EnableSubnormals = 0, int32_t RoundingMode = 0,
+    int32_t RoundingAccuracy = 0) noexcept;
+
+// The PowN built-in calculates `A^B` where `A` is an arbitrary precision
+// floating point number and `B` is an arbitrary precision integer, i.e. the
+// width of `B` doesn't depend on a sum of exponent and mantissa widths.
+template <int WA, int WB, int Wout>
+extern SYCL_EXTERNAL ap_int<Wout>
+__spirv_ArbitraryFloatPowNINTEL(ap_int<WA> A, int32_t MA, ap_int<WB> B,
+                                int32_t Mout, int32_t EnableSubnormals = 0,
+                                int32_t RoundingMode = 0,
+                                int32_t RoundingAccuracy = 0) noexcept;
 
 template <typename dataT>
 extern SYCL_EXTERNAL int32_t __spirv_ReadPipe(RPipeTy<dataT> Pipe, dataT *Data,
Original file line number	Diff line number	Diff line change
`@@ -322,6 +322,9 @@ void visualstudio::Linker::constructMSVCLibCommand(Compilation &C,`
`322`	`322`	`}`
`323`	`323`	`CmdArgs.push_back(II.getFilename());`
`324`	`324`	`}`
	`325`	`+ if (Args.hasArg(options::OPT_fsycl_link_EQ) &&`
	`326`	`+ Args.hasArg(options::OPT_fintelfpga))`
	`327`	`+ CmdArgs.push_back("/IGNORE:4221");`
`325`	`328`	`CmdArgs.push_back(`
`326`	`329`	`C.getArgs().MakeArgString(Twine("-OUT:") + Output.getFilename()));`
`327`	`330`