blob: 86f0c0008eab1507258cae4a46d03b2e1fc24f5c [file] [log] [blame]
Nicolas Capens598f8d82016-09-26 15:09:10 -04001// Copyright 2016 The SwiftShader Authors. All Rights Reserved.
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7// http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
Nicolas Capens598f8d82016-09-26 15:09:10 -040015#include "Reactor.hpp"
Ben Claytoneb50d252019-04-15 13:50:01 -040016#include "Debug.hpp"
Nicolas Capens598f8d82016-09-26 15:09:10 -040017
Nicolas Capens2ae9d742016-11-24 14:43:05 -050018#include "Optimizer.hpp"
Nicolas Capens1a3ce872018-10-10 10:42:36 -040019#include "ExecutableMemory.hpp"
Nicolas Capensa062f322018-09-06 15:34:46 -040020
Nicolas Capens598f8d82016-09-26 15:09:10 -040021#include "src/IceTypes.h"
22#include "src/IceCfg.h"
23#include "src/IceELFStreamer.h"
24#include "src/IceGlobalContext.h"
25#include "src/IceCfgNode.h"
26#include "src/IceELFObjectWriter.h"
Nicolas Capens8dfd9a72016-10-13 17:44:51 -040027#include "src/IceGlobalInits.h"
Nicolas Capens598f8d82016-09-26 15:09:10 -040028
29#include "llvm/Support/FileSystem.h"
30#include "llvm/Support/raw_os_ostream.h"
Nicolas Capens6a990f82018-07-06 15:54:07 -040031#include "llvm/Support/Compiler.h"
32
33#if __has_feature(memory_sanitizer)
34#include <sanitizer/msan_interface.h>
35#endif
Nicolas Capens598f8d82016-09-26 15:09:10 -040036
Nicolas Capensbd65da92017-01-05 16:31:06 -050037#if defined(_WIN32)
Alexis Hetu113e33a2017-01-19 10:49:19 -050038#ifndef WIN32_LEAN_AND_MEAN
Nicolas Capens598f8d82016-09-26 15:09:10 -040039#define WIN32_LEAN_AND_MEAN
Alexis Hetu113e33a2017-01-19 10:49:19 -050040#endif // !WIN32_LEAN_AND_MEAN
41#ifndef NOMINMAX
Nicolas Capens598f8d82016-09-26 15:09:10 -040042#define NOMINMAX
Alexis Hetu113e33a2017-01-19 10:49:19 -050043#endif // !NOMINMAX
Nicolas Capens598f8d82016-09-26 15:09:10 -040044#include <Windows.h>
Nicolas Capensbd65da92017-01-05 16:31:06 -050045#else
46#include <sys/mman.h>
Nicolas Capens411273e2017-01-26 15:13:36 -080047#if !defined(MAP_ANONYMOUS)
48#define MAP_ANONYMOUS MAP_ANON
Nicolas Capens8b275742017-01-20 17:11:41 -050049#endif
Nicolas Capensbd65da92017-01-05 16:31:06 -050050#endif
Nicolas Capens598f8d82016-09-26 15:09:10 -040051
Nicolas Capensc07dc4b2018-08-06 14:20:45 -040052#include <mutex>
Nicolas Capens598f8d82016-09-26 15:09:10 -040053#include <limits>
54#include <iostream>
Nicolas Capens598f8d82016-09-26 15:09:10 -040055
56namespace
57{
58 Ice::GlobalContext *context = nullptr;
59 Ice::Cfg *function = nullptr;
60 Ice::CfgNode *basicBlock = nullptr;
61 Ice::CfgLocalAllocatorScope *allocator = nullptr;
Nicolas Capens48461502018-08-06 14:20:45 -040062 rr::Routine *routine = nullptr;
Nicolas Capens598f8d82016-09-26 15:09:10 -040063
64 std::mutex codegenMutex;
65
66 Ice::ELFFileStreamer *elfFile = nullptr;
67 Ice::Fdstream *out = nullptr;
68}
69
namespace
{
	// Map the MSVC architecture macros onto the GCC/Clang spellings so the
	// rest of this file only has to test one set of names.
	#if defined(_M_IX86) && !defined(__i386__)
	#define __i386__ 1
	#endif

	#if (defined(_M_AMD64) || defined(_M_X64)) && !defined(__x86_64__)
	#define __x86_64__ 1
	#endif

	// Host CPU properties, computed once when the static members below are
	// initialized.
	class CPUID
	{
	public:
		const static bool ARM;      // Result of detectARM().
		const static bool SSE4_1;   // Result of detectSSE4_1().

	private:
		// Executes the CPUID instruction for leaf 'info' and stores
		// EAX, EBX, ECX, EDX in registers[0..3]. On non-x86 builds all four
		// entries are set to zero instead.
		static void cpuid(int registers[4], int info)
		{
			#if defined(__i386__) || defined(__x86_64__)
				#if defined(_WIN32)
					__cpuid(registers, info);
				#else
					__asm volatile("cpuid": "=a" (registers[0]), "=b" (registers[1]), "=c" (registers[2]), "=d" (registers[3]): "a" (info));
				#endif
			#else
				for(int i = 0; i < 4; i++)
				{
					registers[i] = 0;
				}
			#endif
		}

		// Compile-time architecture check; any architecture not listed here
		// is rejected with a build error.
		static bool detectARM()
		{
			#if defined(__arm__) || defined(__aarch64__)
				return true;
			#elif defined(__i386__) || defined(__x86_64__) || defined(__mips__)
				return false;
			#else
				#error "Unknown architecture"
			#endif
		}

		// Tests bit 19 of ECX from CPUID leaf 1; always false on non-x86 builds.
		static bool detectSSE4_1()
		{
			#if defined(__i386__) || defined(__x86_64__)
				int registers[4];
				cpuid(registers, 1);

				const int ecx = registers[2];
				const int sse4_1Bit = 0x00080000;
				return (ecx & sse4_1Bit) != 0;
			#else
				return false;
			#endif
		}
	};

	const bool CPUID::ARM = CPUID::detectARM();
	const bool CPUID::SSE4_1 = CPUID::detectSSE4_1();

	const bool emulateIntrinsics = false;
	const bool emulateMismatchedBitCast = CPUID::ARM;
}
133
Nicolas Capens48461502018-08-06 14:20:45 -0400134namespace rr
Nicolas Capens598f8d82016-09-26 15:09:10 -0400135{
Ben Claytonc7904162019-04-17 17:35:48 -0400136 const Capabilities Caps =
137 {
138 false, // CallSupported
139 };
140
Nicolas Capens23d99a42016-09-30 14:57:16 -0400141 enum EmulatedType
142 {
143 EmulatedShift = 16,
144 EmulatedV2 = 2 << EmulatedShift,
145 EmulatedV4 = 4 << EmulatedShift,
146 EmulatedV8 = 8 << EmulatedShift,
147 EmulatedBits = EmulatedV2 | EmulatedV4 | EmulatedV8,
148
149 Type_v2i32 = Ice::IceType_v4i32 | EmulatedV2,
150 Type_v4i16 = Ice::IceType_v8i16 | EmulatedV4,
151 Type_v2i16 = Ice::IceType_v8i16 | EmulatedV2,
152 Type_v8i8 = Ice::IceType_v16i8 | EmulatedV8,
153 Type_v4i8 = Ice::IceType_v16i8 | EmulatedV4,
Nicolas Capens4cfd4572016-10-20 01:00:19 -0400154 Type_v2f32 = Ice::IceType_v4f32 | EmulatedV2,
Nicolas Capens23d99a42016-09-30 14:57:16 -0400155 };
156
Nicolas Capens15060bb2016-12-05 22:17:19 -0500157 class Value : public Ice::Operand {};
Nicolas Capensb98fe5c2016-11-09 12:24:06 -0500158 class SwitchCases : public Ice::InstSwitch {};
Nicolas Capens598f8d82016-09-26 15:09:10 -0400159 class BasicBlock : public Ice::CfgNode {};
160
161 Ice::Type T(Type *t)
162 {
Alexis Hetu113e33a2017-01-19 10:49:19 -0500163 static_assert(static_cast<unsigned int>(Ice::IceType_NUM) < static_cast<unsigned int>(EmulatedBits), "Ice::Type overlaps with our emulated types!");
Nicolas Capens23d99a42016-09-30 14:57:16 -0400164 return (Ice::Type)(reinterpret_cast<std::intptr_t>(t) & ~EmulatedBits);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400165 }
166
167 Type *T(Ice::Type t)
168 {
169 return reinterpret_cast<Type*>(t);
170 }
171
Nicolas Capens23d99a42016-09-30 14:57:16 -0400172 Type *T(EmulatedType t)
173 {
174 return reinterpret_cast<Type*>(t);
175 }
176
Nicolas Capens15060bb2016-12-05 22:17:19 -0500177 Value *V(Ice::Operand *v)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400178 {
179 return reinterpret_cast<Value*>(v);
180 }
181
Nicolas Capens611642a2016-09-28 16:45:04 -0400182 BasicBlock *B(Ice::CfgNode *b)
183 {
184 return reinterpret_cast<BasicBlock*>(b);
185 }
186
Nicolas Capens584088c2017-01-26 16:05:18 -0800187 static size_t typeSize(Type *type)
188 {
189 if(reinterpret_cast<std::intptr_t>(type) & EmulatedBits)
190 {
191 switch(reinterpret_cast<std::intptr_t>(type))
192 {
193 case Type_v2i32: return 8;
194 case Type_v4i16: return 8;
195 case Type_v2i16: return 4;
196 case Type_v8i8: return 8;
197 case Type_v4i8: return 4;
198 case Type_v2f32: return 8;
Ben Claytoneb50d252019-04-15 13:50:01 -0400199 default: ASSERT(false);
Nicolas Capens584088c2017-01-26 16:05:18 -0800200 }
201 }
202
203 return Ice::typeWidthInBytes(T(type));
204 }
205
Nicolas Capens598f8d82016-09-26 15:09:10 -0400206 Optimization optimization[10] = {InstructionCombining, Disabled};
207
Nicolas Capens66478362016-10-13 15:36:36 -0400208 using ElfHeader = std::conditional<sizeof(void*) == 8, Elf64_Ehdr, Elf32_Ehdr>::type;
209 using SectionHeader = std::conditional<sizeof(void*) == 8, Elf64_Shdr, Elf32_Shdr>::type;
210
211 inline const SectionHeader *sectionHeader(const ElfHeader *elfHeader)
212 {
213 return reinterpret_cast<const SectionHeader*>((intptr_t)elfHeader + elfHeader->e_shoff);
214 }
Nicolas Capens87852e12016-11-24 14:45:06 -0500215
Nicolas Capens66478362016-10-13 15:36:36 -0400216 inline const SectionHeader *elfSection(const ElfHeader *elfHeader, int index)
217 {
218 return &sectionHeader(elfHeader)[index];
219 }
220
221 static void *relocateSymbol(const ElfHeader *elfHeader, const Elf32_Rel &relocation, const SectionHeader &relocationTable)
222 {
223 const SectionHeader *target = elfSection(elfHeader, relocationTable.sh_info);
Nicolas Capens87852e12016-11-24 14:45:06 -0500224
Nicolas Capens66478362016-10-13 15:36:36 -0400225 uint32_t index = relocation.getSymbol();
226 int table = relocationTable.sh_link;
227 void *symbolValue = nullptr;
Nicolas Capens87852e12016-11-24 14:45:06 -0500228
Nicolas Capens66478362016-10-13 15:36:36 -0400229 if(index != SHN_UNDEF)
230 {
231 if(table == SHN_UNDEF) return nullptr;
232 const SectionHeader *symbolTable = elfSection(elfHeader, table);
Nicolas Capens87852e12016-11-24 14:45:06 -0500233
Nicolas Capens66478362016-10-13 15:36:36 -0400234 uint32_t symtab_entries = symbolTable->sh_size / symbolTable->sh_entsize;
235 if(index >= symtab_entries)
236 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400237 ASSERT(index < symtab_entries && "Symbol Index out of range");
Nicolas Capens66478362016-10-13 15:36:36 -0400238 return nullptr;
239 }
Nicolas Capens87852e12016-11-24 14:45:06 -0500240
Nicolas Capens66478362016-10-13 15:36:36 -0400241 intptr_t symbolAddress = (intptr_t)elfHeader + symbolTable->sh_offset;
242 Elf32_Sym &symbol = ((Elf32_Sym*)symbolAddress)[index];
243 uint16_t section = symbol.st_shndx;
244
245 if(section != SHN_UNDEF && section < SHN_LORESERVE)
246 {
247 const SectionHeader *target = elfSection(elfHeader, symbol.st_shndx);
248 symbolValue = reinterpret_cast<void*>((intptr_t)elfHeader + symbol.st_value + target->sh_offset);
249 }
250 else
251 {
252 return nullptr;
253 }
254 }
255
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500256 intptr_t address = (intptr_t)elfHeader + target->sh_offset;
257 unaligned_ptr<int32_t> patchSite = (int32_t*)(address + relocation.r_offset);
258
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400259 if(CPUID::ARM)
260 {
261 switch(relocation.getType())
262 {
263 case R_ARM_NONE:
264 // No relocation
265 break;
266 case R_ARM_MOVW_ABS_NC:
267 {
268 uint32_t thumb = 0; // Calls to Thumb code not supported.
269 uint32_t lo = (uint32_t)(intptr_t)symbolValue | thumb;
270 *patchSite = (*patchSite & 0xFFF0F000) | ((lo & 0xF000) << 4) | (lo & 0x0FFF);
271 }
272 break;
273 case R_ARM_MOVT_ABS:
274 {
275 uint32_t hi = (uint32_t)(intptr_t)(symbolValue) >> 16;
276 *patchSite = (*patchSite & 0xFFF0F000) | ((hi & 0xF000) << 4) | (hi & 0x0FFF);
277 }
278 break;
279 default:
Ben Claytoneb50d252019-04-15 13:50:01 -0400280 ASSERT(false && "Unsupported relocation type");
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400281 return nullptr;
282 }
283 }
284 else
285 {
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400286 switch(relocation.getType())
287 {
288 case R_386_NONE:
289 // No relocation
290 break;
291 case R_386_32:
292 *patchSite = (int32_t)((intptr_t)symbolValue + *patchSite);
293 break;
294 // case R_386_PC32:
295 // *patchSite = (int32_t)((intptr_t)symbolValue + *patchSite - (intptr_t)patchSite);
296 // break;
297 default:
Ben Claytoneb50d252019-04-15 13:50:01 -0400298 ASSERT(false && "Unsupported relocation type");
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400299 return nullptr;
300 }
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400301 }
302
Nicolas Capens66478362016-10-13 15:36:36 -0400303 return symbolValue;
304 }
305
306 static void *relocateSymbol(const ElfHeader *elfHeader, const Elf64_Rela &relocation, const SectionHeader &relocationTable)
307 {
308 const SectionHeader *target = elfSection(elfHeader, relocationTable.sh_info);
Nicolas Capens87852e12016-11-24 14:45:06 -0500309
Nicolas Capens66478362016-10-13 15:36:36 -0400310 uint32_t index = relocation.getSymbol();
311 int table = relocationTable.sh_link;
312 void *symbolValue = nullptr;
313
314 if(index != SHN_UNDEF)
315 {
316 if(table == SHN_UNDEF) return nullptr;
317 const SectionHeader *symbolTable = elfSection(elfHeader, table);
Nicolas Capens87852e12016-11-24 14:45:06 -0500318
Nicolas Capens66478362016-10-13 15:36:36 -0400319 uint32_t symtab_entries = symbolTable->sh_size / symbolTable->sh_entsize;
320 if(index >= symtab_entries)
321 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400322 ASSERT(index < symtab_entries && "Symbol Index out of range");
Nicolas Capens66478362016-10-13 15:36:36 -0400323 return nullptr;
324 }
Nicolas Capens87852e12016-11-24 14:45:06 -0500325
Nicolas Capens66478362016-10-13 15:36:36 -0400326 intptr_t symbolAddress = (intptr_t)elfHeader + symbolTable->sh_offset;
327 Elf64_Sym &symbol = ((Elf64_Sym*)symbolAddress)[index];
328 uint16_t section = symbol.st_shndx;
329
330 if(section != SHN_UNDEF && section < SHN_LORESERVE)
331 {
332 const SectionHeader *target = elfSection(elfHeader, symbol.st_shndx);
333 symbolValue = reinterpret_cast<void*>((intptr_t)elfHeader + symbol.st_value + target->sh_offset);
334 }
335 else
336 {
337 return nullptr;
338 }
339 }
340
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500341 intptr_t address = (intptr_t)elfHeader + target->sh_offset;
342 unaligned_ptr<int32_t> patchSite32 = (int32_t*)(address + relocation.r_offset);
343 unaligned_ptr<int64_t> patchSite64 = (int64_t*)(address + relocation.r_offset);
344
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400345 switch(relocation.getType())
346 {
347 case R_X86_64_NONE:
348 // No relocation
349 break;
350 case R_X86_64_64:
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500351 *patchSite64 = (int64_t)((intptr_t)symbolValue + *patchSite64 + relocation.r_addend);
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400352 break;
353 case R_X86_64_PC32:
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500354 *patchSite32 = (int32_t)((intptr_t)symbolValue + *patchSite32 - (intptr_t)patchSite32 + relocation.r_addend);
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400355 break;
356 case R_X86_64_32S:
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500357 *patchSite32 = (int32_t)((intptr_t)symbolValue + *patchSite32 + relocation.r_addend);
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400358 break;
359 default:
Ben Claytoneb50d252019-04-15 13:50:01 -0400360 ASSERT(false && "Unsupported relocation type");
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400361 return nullptr;
362 }
Nicolas Capens66478362016-10-13 15:36:36 -0400363
364 return symbolValue;
365 }
366
Nicolas Capens1cc44382017-04-25 10:52:16 -0400367 void *loadImage(uint8_t *const elfImage, size_t &codeSize)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400368 {
Nicolas Capens598f8d82016-09-26 15:09:10 -0400369 ElfHeader *elfHeader = (ElfHeader*)elfImage;
370
371 if(!elfHeader->checkMagic())
372 {
373 return nullptr;
374 }
375
Nicolas Capens66478362016-10-13 15:36:36 -0400376 // Expect ELF bitness to match platform
Ben Claytoneb50d252019-04-15 13:50:01 -0400377 ASSERT(sizeof(void*) == 8 ? elfHeader->getFileClass() == ELFCLASS64 : elfHeader->getFileClass() == ELFCLASS32);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400378 #if defined(__i386__)
Ben Claytoneb50d252019-04-15 13:50:01 -0400379 ASSERT(sizeof(void*) == 4 && elfHeader->e_machine == EM_386);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400380 #elif defined(__x86_64__)
Ben Claytoneb50d252019-04-15 13:50:01 -0400381 ASSERT(sizeof(void*) == 8 && elfHeader->e_machine == EM_X86_64);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400382 #elif defined(__arm__)
Ben Claytoneb50d252019-04-15 13:50:01 -0400383 ASSERT(sizeof(void*) == 4 && elfHeader->e_machine == EM_ARM);
Stephen Lanhamfe796492018-09-07 11:59:54 -0700384 #elif defined(__aarch64__)
Ben Claytoneb50d252019-04-15 13:50:01 -0400385 ASSERT(sizeof(void*) == 8 && elfHeader->e_machine == EM_AARCH64);
Gordana Cmiljanovic082dfec2018-10-19 11:36:15 +0200386 #elif defined(__mips__)
Ben Claytoneb50d252019-04-15 13:50:01 -0400387 ASSERT(sizeof(void*) == 4 && elfHeader->e_machine == EM_MIPS);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400388 #else
389 #error "Unsupported platform"
390 #endif
Nicolas Capens66478362016-10-13 15:36:36 -0400391
Nicolas Capens598f8d82016-09-26 15:09:10 -0400392 SectionHeader *sectionHeader = (SectionHeader*)(elfImage + elfHeader->e_shoff);
393 void *entry = nullptr;
394
395 for(int i = 0; i < elfHeader->e_shnum; i++)
396 {
Nicolas Capens66478362016-10-13 15:36:36 -0400397 if(sectionHeader[i].sh_type == SHT_PROGBITS)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400398 {
Nicolas Capens66478362016-10-13 15:36:36 -0400399 if(sectionHeader[i].sh_flags & SHF_EXECINSTR)
400 {
401 entry = elfImage + sectionHeader[i].sh_offset;
Nicolas Capens1cc44382017-04-25 10:52:16 -0400402 codeSize = sectionHeader[i].sh_size;
Nicolas Capens66478362016-10-13 15:36:36 -0400403 }
404 }
405 else if(sectionHeader[i].sh_type == SHT_REL)
406 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400407 ASSERT(sizeof(void*) == 4 && "UNIMPLEMENTED"); // Only expected/implemented for 32-bit code
Nicolas Capens66478362016-10-13 15:36:36 -0400408
Alexis Hetu113e33a2017-01-19 10:49:19 -0500409 for(Elf32_Word index = 0; index < sectionHeader[i].sh_size / sectionHeader[i].sh_entsize; index++)
Nicolas Capens66478362016-10-13 15:36:36 -0400410 {
411 const Elf32_Rel &relocation = ((const Elf32_Rel*)(elfImage + sectionHeader[i].sh_offset))[index];
Alexis Hetu113e33a2017-01-19 10:49:19 -0500412 relocateSymbol(elfHeader, relocation, sectionHeader[i]);
Nicolas Capens66478362016-10-13 15:36:36 -0400413 }
414 }
415 else if(sectionHeader[i].sh_type == SHT_RELA)
416 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400417 ASSERT(sizeof(void*) == 8 && "UNIMPLEMENTED"); // Only expected/implemented for 64-bit code
Nicolas Capens66478362016-10-13 15:36:36 -0400418
Alexis Hetu113e33a2017-01-19 10:49:19 -0500419 for(Elf32_Word index = 0; index < sectionHeader[i].sh_size / sectionHeader[i].sh_entsize; index++)
Nicolas Capens66478362016-10-13 15:36:36 -0400420 {
421 const Elf64_Rela &relocation = ((const Elf64_Rela*)(elfImage + sectionHeader[i].sh_offset))[index];
Alexis Hetu113e33a2017-01-19 10:49:19 -0500422 relocateSymbol(elfHeader, relocation, sectionHeader[i]);
Nicolas Capens66478362016-10-13 15:36:36 -0400423 }
Nicolas Capens598f8d82016-09-26 15:09:10 -0400424 }
425 }
426
427 return entry;
428 }
429
430 template<typename T>
431 struct ExecutableAllocator
432 {
433 ExecutableAllocator() {};
434 template<class U> ExecutableAllocator(const ExecutableAllocator<U> &other) {};
435
436 using value_type = T;
437 using size_type = std::size_t;
438
439 T *allocate(size_type n)
440 {
Nicolas Capensc07dc4b2018-08-06 14:20:45 -0400441 return (T*)allocateExecutable(sizeof(T) * n);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400442 }
443
444 void deallocate(T *p, size_type n)
445 {
Nicolas Capensc07dc4b2018-08-06 14:20:45 -0400446 deallocateExecutable(p, sizeof(T) * n);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400447 }
448 };
449
450 class ELFMemoryStreamer : public Ice::ELFStreamer, public Routine
451 {
452 ELFMemoryStreamer(const ELFMemoryStreamer &) = delete;
453 ELFMemoryStreamer &operator=(const ELFMemoryStreamer &) = delete;
454
455 public:
Nicolas Capens58274b52016-10-19 23:45:19 -0400456 ELFMemoryStreamer() : Routine(), entry(nullptr)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400457 {
458 position = 0;
459 buffer.reserve(0x1000);
460 }
461
Nicolas Capens81aa97b2017-06-27 17:08:08 -0400462 ~ELFMemoryStreamer() override
Nicolas Capens598f8d82016-09-26 15:09:10 -0400463 {
Nicolas Capensbd65da92017-01-05 16:31:06 -0500464 #if defined(_WIN32)
465 if(buffer.size() != 0)
466 {
467 DWORD exeProtection;
468 VirtualProtect(&buffer[0], buffer.size(), oldProtection, &exeProtection);
469 }
470 #endif
Nicolas Capens598f8d82016-09-26 15:09:10 -0400471 }
472
473 void write8(uint8_t Value) override
474 {
475 if(position == (uint64_t)buffer.size())
476 {
477 buffer.push_back(Value);
478 position++;
479 }
480 else if(position < (uint64_t)buffer.size())
481 {
482 buffer[position] = Value;
483 position++;
484 }
Ben Claytoneb50d252019-04-15 13:50:01 -0400485 else ASSERT(false && "UNIMPLEMENTED");
Nicolas Capens598f8d82016-09-26 15:09:10 -0400486 }
487
488 void writeBytes(llvm::StringRef Bytes) override
489 {
490 std::size_t oldSize = buffer.size();
491 buffer.resize(oldSize + Bytes.size());
492 memcpy(&buffer[oldSize], Bytes.begin(), Bytes.size());
493 position += Bytes.size();
494 }
495
496 uint64_t tell() const override { return position; }
497
498 void seek(uint64_t Off) override { position = Off; }
499
500 const void *getEntry() override
501 {
Nicolas Capens58274b52016-10-19 23:45:19 -0400502 if(!entry)
503 {
Nicolas Capensbd65da92017-01-05 16:31:06 -0500504 position = std::numeric_limits<std::size_t>::max(); // Can't stream more data after this
Nicolas Capens598f8d82016-09-26 15:09:10 -0400505
Nicolas Capens1cc44382017-04-25 10:52:16 -0400506 size_t codeSize = 0;
507 entry = loadImage(&buffer[0], codeSize);
508
509 #if defined(_WIN32)
Nicolas Capense745f5a2017-05-29 10:00:32 -0400510 VirtualProtect(&buffer[0], buffer.size(), PAGE_EXECUTE_READ, &oldProtection);
Nicolas Capens1cc44382017-04-25 10:52:16 -0400511 FlushInstructionCache(GetCurrentProcess(), NULL, 0);
512 #else
Nicolas Capense745f5a2017-05-29 10:00:32 -0400513 mprotect(&buffer[0], buffer.size(), PROT_READ | PROT_EXEC);
Nicolas Capens1cc44382017-04-25 10:52:16 -0400514 __builtin___clear_cache((char*)entry, (char*)entry + codeSize);
515 #endif
Nicolas Capens58274b52016-10-19 23:45:19 -0400516 }
517
518 return entry;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400519 }
520
521 private:
Nicolas Capens58274b52016-10-19 23:45:19 -0400522 void *entry;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400523 std::vector<uint8_t, ExecutableAllocator<uint8_t>> buffer;
524 std::size_t position;
Nicolas Capensbd65da92017-01-05 16:31:06 -0500525
526 #if defined(_WIN32)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400527 DWORD oldProtection;
Nicolas Capensbd65da92017-01-05 16:31:06 -0500528 #endif
Nicolas Capens598f8d82016-09-26 15:09:10 -0400529 };
530
531 Nucleus::Nucleus()
532 {
533 ::codegenMutex.lock(); // Reactor is currently not thread safe
534
Nicolas Capens66478362016-10-13 15:36:36 -0400535 Ice::ClFlags &Flags = Ice::ClFlags::Flags;
536 Ice::ClFlags::getParsedClFlags(Flags);
537
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400538 #if defined(__arm__)
539 Flags.setTargetArch(Ice::Target_ARM32);
540 Flags.setTargetInstructionSet(Ice::ARM32InstructionSet_HWDivArm);
Gordana Cmiljanovic082dfec2018-10-19 11:36:15 +0200541 #elif defined(__mips__)
542 Flags.setTargetArch(Ice::Target_MIPS32);
543 Flags.setTargetInstructionSet(Ice::BaseInstructionSet);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400544 #else // x86
545 Flags.setTargetArch(sizeof(void*) == 8 ? Ice::Target_X8664 : Ice::Target_X8632);
546 Flags.setTargetInstructionSet(CPUID::SSE4_1 ? Ice::X86InstructionSet_SSE4_1 : Ice::X86InstructionSet_SSE2);
547 #endif
Nicolas Capens66478362016-10-13 15:36:36 -0400548 Flags.setOutFileType(Ice::FT_Elf);
549 Flags.setOptLevel(Ice::Opt_2);
550 Flags.setApplicationBinaryInterface(Ice::ABI_Platform);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400551 Flags.setVerbose(false ? Ice::IceV_Most : Ice::IceV_None);
552 Flags.setDisableHybridAssembly(true);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400553
Nicolas Capens65047112016-11-07 13:01:07 -0500554 static llvm::raw_os_ostream cout(std::cout);
555 static llvm::raw_os_ostream cerr(std::cerr);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400556
557 if(false) // Write out to a file
558 {
559 std::error_code errorCode;
560 ::out = new Ice::Fdstream("out.o", errorCode, llvm::sys::fs::F_None);
561 ::elfFile = new Ice::ELFFileStreamer(*out);
Nicolas Capens65047112016-11-07 13:01:07 -0500562 ::context = new Ice::GlobalContext(&cout, &cout, &cerr, elfFile);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400563 }
564 else
565 {
566 ELFMemoryStreamer *elfMemory = new ELFMemoryStreamer();
Nicolas Capens65047112016-11-07 13:01:07 -0500567 ::context = new Ice::GlobalContext(&cout, &cout, &cerr, elfMemory);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400568 ::routine = elfMemory;
569 }
570 }
571
572 Nucleus::~Nucleus()
573 {
Nicolas Capens619a8c52017-07-05 14:10:46 -0400574 delete ::routine;
575
Nicolas Capens598f8d82016-09-26 15:09:10 -0400576 delete ::allocator;
577 delete ::function;
578 delete ::context;
579
580 delete ::elfFile;
581 delete ::out;
582
583 ::codegenMutex.unlock();
584 }
585
Chris Forbes878d4b02019-01-21 10:48:35 -0800586 Routine *Nucleus::acquireRoutine(const char *name, bool runOptimizations)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400587 {
588 if(basicBlock->getInsts().empty() || basicBlock->getInsts().back().getKind() != Ice::Inst::Ret)
589 {
590 createRetVoid();
591 }
592
Chris Forbes878d4b02019-01-21 10:48:35 -0800593 ::function->setFunctionName(Ice::GlobalString::createWithString(::context, name));
Nicolas Capens598f8d82016-09-26 15:09:10 -0400594
Nicolas Capens2ae9d742016-11-24 14:43:05 -0500595 optimize();
596
Nicolas Capens598f8d82016-09-26 15:09:10 -0400597 ::function->translate();
Ben Claytoneb50d252019-04-15 13:50:01 -0400598 ASSERT(!::function->hasError());
Nicolas Capensde19f392016-10-19 10:29:49 -0400599
Nicolas Capens83a6bb92017-07-05 15:04:00 -0400600 auto globals = ::function->getGlobalInits();
Nicolas Capens66478362016-10-13 15:36:36 -0400601
602 if(globals && !globals->empty())
603 {
Nicolas Capens83a6bb92017-07-05 15:04:00 -0400604 ::context->getGlobals()->merge(globals.get());
Nicolas Capens66478362016-10-13 15:36:36 -0400605 }
Nicolas Capens598f8d82016-09-26 15:09:10 -0400606
607 ::context->emitFileHeader();
608 ::function->emitIAS();
609 auto assembler = ::function->releaseAssembler();
Nicolas Capens66478362016-10-13 15:36:36 -0400610 auto objectWriter = ::context->getObjectWriter();
611 assembler->alignFunction();
612 objectWriter->writeFunctionCode(::function->getFunctionName(), false, assembler.get());
613 ::context->lowerGlobals("last");
Nicolas Capens73dd7a22016-10-20 13:20:34 -0400614 ::context->lowerConstants();
Nicolas Capensb98fe5c2016-11-09 12:24:06 -0500615 ::context->lowerJumpTables();
Nicolas Capens66478362016-10-13 15:36:36 -0400616 objectWriter->setUndefinedSyms(::context->getConstantExternSyms());
617 objectWriter->writeNonUserSections();
Nicolas Capens598f8d82016-09-26 15:09:10 -0400618
Nicolas Capens619a8c52017-07-05 14:10:46 -0400619 Routine *handoffRoutine = ::routine;
620 ::routine = nullptr;
621
622 return handoffRoutine;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400623 }
624
625 void Nucleus::optimize()
626 {
Nicolas Capens48461502018-08-06 14:20:45 -0400627 rr::optimize(::function);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400628 }
629
630 Value *Nucleus::allocateStackVariable(Type *t, int arraySize)
631 {
632 Ice::Type type = T(t);
Nicolas Capensa8f98632016-10-20 11:25:55 -0400633 int typeSize = Ice::typeWidthInBytes(type);
634 int totalSize = typeSize * (arraySize ? arraySize : 1);
Nicolas Capense12780d2016-09-27 14:18:07 -0400635
Nicolas Capensa8f98632016-10-20 11:25:55 -0400636 auto bytes = Ice::ConstantInteger32::create(::context, type, totalSize);
Nicolas Capense12780d2016-09-27 14:18:07 -0400637 auto address = ::function->makeVariable(T(getPointerType(t)));
Nicolas Capensa8f98632016-10-20 11:25:55 -0400638 auto alloca = Ice::InstAlloca::create(::function, address, bytes, typeSize);
Nicolas Capense12780d2016-09-27 14:18:07 -0400639 ::function->getEntryNode()->getInsts().push_front(alloca);
640
641 return V(address);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400642 }
643
644 BasicBlock *Nucleus::createBasicBlock()
645 {
Nicolas Capens611642a2016-09-28 16:45:04 -0400646 return B(::function->makeNode());
Nicolas Capens598f8d82016-09-26 15:09:10 -0400647 }
648
649 BasicBlock *Nucleus::getInsertBlock()
650 {
Nicolas Capens611642a2016-09-28 16:45:04 -0400651 return B(::basicBlock);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400652 }
653
654 void Nucleus::setInsertBlock(BasicBlock *basicBlock)
655 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400656 // ASSERT(::basicBlock->getInsts().back().getTerminatorEdges().size() >= 0 && "Previous basic block must have a terminator");
Nicolas Capens0192d152019-03-27 14:46:07 -0400657
658 Variable::materializeAll();
659
Nicolas Capens611642a2016-09-28 16:45:04 -0400660 ::basicBlock = basicBlock;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400661 }
662
Nicolas Capens598f8d82016-09-26 15:09:10 -0400663 void Nucleus::createFunction(Type *ReturnType, std::vector<Type*> &Params)
664 {
665 uint32_t sequenceNumber = 0;
666 ::function = Ice::Cfg::create(::context, sequenceNumber).release();
667 ::allocator = new Ice::CfgLocalAllocatorScope(::function);
668
669 for(Type *type : Params)
670 {
671 Ice::Variable *arg = ::function->makeVariable(T(type));
672 ::function->addArg(arg);
673 }
674
675 Ice::CfgNode *node = ::function->makeNode();
676 ::function->setEntryNode(node);
677 ::basicBlock = node;
678 }
679
680 Value *Nucleus::getArgument(unsigned int index)
681 {
682 return V(::function->getArgs()[index]);
683 }
684
685 void Nucleus::createRetVoid()
686 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400687 // Code generated after this point is unreachable, so any variables
688 // being read can safely return an undefined value. We have to avoid
689 // materializing variables after the terminator ret instruction.
690 Variable::killUnmaterialized();
691
Nicolas Capensfdcca2d2016-10-20 11:31:36 -0400692 Ice::InstRet *ret = Ice::InstRet::create(::function);
693 ::basicBlock->appendInst(ret);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400694 }
695
696 void Nucleus::createRet(Value *v)
697 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400698 // Code generated after this point is unreachable, so any variables
699 // being read can safely return an undefined value. We have to avoid
700 // materializing variables after the terminator ret instruction.
701 Variable::killUnmaterialized();
702
Nicolas Capensfdcca2d2016-10-20 11:31:36 -0400703 Ice::InstRet *ret = Ice::InstRet::create(::function, v);
704 ::basicBlock->appendInst(ret);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400705 }
706
707 void Nucleus::createBr(BasicBlock *dest)
708 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400709 Variable::materializeAll();
710
Nicolas Capens611642a2016-09-28 16:45:04 -0400711 auto br = Ice::InstBr::create(::function, dest);
712 ::basicBlock->appendInst(br);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400713 }
714
715 void Nucleus::createCondBr(Value *cond, BasicBlock *ifTrue, BasicBlock *ifFalse)
716 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400717 Variable::materializeAll();
718
Nicolas Capens611642a2016-09-28 16:45:04 -0400719 auto br = Ice::InstBr::create(::function, cond, ifTrue, ifFalse);
720 ::basicBlock->appendInst(br);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400721 }
722
Nicolas Capensf8360ba2017-01-25 11:35:00 -0800723 static bool isCommutative(Ice::InstArithmetic::OpKind op)
724 {
725 switch(op)
726 {
727 case Ice::InstArithmetic::Add:
728 case Ice::InstArithmetic::Fadd:
729 case Ice::InstArithmetic::Mul:
730 case Ice::InstArithmetic::Fmul:
731 case Ice::InstArithmetic::And:
732 case Ice::InstArithmetic::Or:
733 case Ice::InstArithmetic::Xor:
734 return true;
735 default:
736 return false;
737 }
738 }
739
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400740 static Value *createArithmetic(Ice::InstArithmetic::OpKind op, Value *lhs, Value *rhs)
741 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400742 ASSERT(lhs->getType() == rhs->getType() || llvm::isa<Ice::Constant>(rhs));
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400743
Nicolas Capensf8360ba2017-01-25 11:35:00 -0800744 bool swapOperands = llvm::isa<Ice::Constant>(lhs) && isCommutative(op);
745
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400746 Ice::Variable *result = ::function->makeVariable(lhs->getType());
Nicolas Capensf8360ba2017-01-25 11:35:00 -0800747 Ice::InstArithmetic *arithmetic = Ice::InstArithmetic::create(::function, op, result, swapOperands ? rhs : lhs, swapOperands ? lhs : rhs);
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400748 ::basicBlock->appendInst(arithmetic);
749
750 return V(result);
751 }
752
Nicolas Capens598f8d82016-09-26 15:09:10 -0400753 Value *Nucleus::createAdd(Value *lhs, Value *rhs)
754 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400755 return createArithmetic(Ice::InstArithmetic::Add, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400756 }
757
758 Value *Nucleus::createSub(Value *lhs, Value *rhs)
759 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400760 return createArithmetic(Ice::InstArithmetic::Sub, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400761 }
762
763 Value *Nucleus::createMul(Value *lhs, Value *rhs)
764 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400765 return createArithmetic(Ice::InstArithmetic::Mul, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400766 }
767
768 Value *Nucleus::createUDiv(Value *lhs, Value *rhs)
769 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400770 return createArithmetic(Ice::InstArithmetic::Udiv, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400771 }
772
773 Value *Nucleus::createSDiv(Value *lhs, Value *rhs)
774 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400775 return createArithmetic(Ice::InstArithmetic::Sdiv, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400776 }
777
778 Value *Nucleus::createFAdd(Value *lhs, Value *rhs)
779 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400780 return createArithmetic(Ice::InstArithmetic::Fadd, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400781 }
782
783 Value *Nucleus::createFSub(Value *lhs, Value *rhs)
784 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400785 return createArithmetic(Ice::InstArithmetic::Fsub, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400786 }
787
788 Value *Nucleus::createFMul(Value *lhs, Value *rhs)
789 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400790 return createArithmetic(Ice::InstArithmetic::Fmul, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400791 }
792
793 Value *Nucleus::createFDiv(Value *lhs, Value *rhs)
794 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400795 return createArithmetic(Ice::InstArithmetic::Fdiv, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400796 }
797
798 Value *Nucleus::createURem(Value *lhs, Value *rhs)
799 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400800 return createArithmetic(Ice::InstArithmetic::Urem, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400801 }
802
803 Value *Nucleus::createSRem(Value *lhs, Value *rhs)
804 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400805 return createArithmetic(Ice::InstArithmetic::Srem, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400806 }
807
808 Value *Nucleus::createFRem(Value *lhs, Value *rhs)
809 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400810 return createArithmetic(Ice::InstArithmetic::Frem, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400811 }
812
813 Value *Nucleus::createShl(Value *lhs, Value *rhs)
814 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400815 return createArithmetic(Ice::InstArithmetic::Shl, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400816 }
817
818 Value *Nucleus::createLShr(Value *lhs, Value *rhs)
819 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400820 return createArithmetic(Ice::InstArithmetic::Lshr, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400821 }
822
823 Value *Nucleus::createAShr(Value *lhs, Value *rhs)
824 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400825 return createArithmetic(Ice::InstArithmetic::Ashr, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400826 }
827
828 Value *Nucleus::createAnd(Value *lhs, Value *rhs)
829 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400830 return createArithmetic(Ice::InstArithmetic::And, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400831 }
832
833 Value *Nucleus::createOr(Value *lhs, Value *rhs)
834 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400835 return createArithmetic(Ice::InstArithmetic::Or, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400836 }
837
838 Value *Nucleus::createXor(Value *lhs, Value *rhs)
839 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400840 return createArithmetic(Ice::InstArithmetic::Xor, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400841 }
842
843 Value *Nucleus::createNeg(Value *v)
844 {
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500845 return createSub(createNullValue(T(v->getType())), v);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400846 }
847
848 Value *Nucleus::createFNeg(Value *v)
849 {
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500850 double c[4] = {-0.0, -0.0, -0.0, -0.0};
851 Value *negativeZero = Ice::isVectorType(v->getType()) ?
852 createConstantVector(c, T(v->getType())) :
Nicolas Capens15060bb2016-12-05 22:17:19 -0500853 V(::context->getConstantFloat(-0.0f));
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500854
855 return createFSub(negativeZero, v);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400856 }
857
858 Value *Nucleus::createNot(Value *v)
859 {
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500860 if(Ice::isScalarIntegerType(v->getType()))
861 {
Nicolas Capens15060bb2016-12-05 22:17:19 -0500862 return createXor(v, V(::context->getConstantInt(v->getType(), -1)));
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500863 }
864 else // Vector
865 {
Nicolas Capensf34d1ac2017-05-08 17:06:11 -0400866 int64_t c[16] = {-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1};
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500867 return createXor(v, createConstantVector(c, T(v->getType())));
868 }
Nicolas Capens598f8d82016-09-26 15:09:10 -0400869 }
870
Nicolas Capens86509d92019-03-21 13:23:50 -0400871 Value *Nucleus::createLoad(Value *ptr, Type *type, bool isVolatile, unsigned int align, bool atomic, std::memory_order memoryOrder)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400872 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400873 ASSERT(!atomic); // Unimplemented
874 ASSERT(memoryOrder == std::memory_order_relaxed); // Unimplemented
Nicolas Capens86509d92019-03-21 13:23:50 -0400875
Nicolas Capens23d99a42016-09-30 14:57:16 -0400876 int valueType = (int)reinterpret_cast<intptr_t>(type);
877 Ice::Variable *result = ::function->makeVariable(T(type));
878
Nicolas Capensf4c4eca2017-10-03 14:26:07 -0400879 if((valueType & EmulatedBits) && (align != 0)) // Narrow vector not stored on stack.
Nicolas Capens23d99a42016-09-30 14:57:16 -0400880 {
Nicolas Capens070d9f42017-04-26 13:36:33 -0400881 if(emulateIntrinsics)
882 {
883 if(typeSize(type) == 4)
884 {
885 auto pointer = RValue<Pointer<Byte>>(ptr);
Nicolas Capens1894cfa2017-07-27 14:21:46 -0400886 Int x = *Pointer<Int>(pointer);
Nicolas Capens070d9f42017-04-26 13:36:33 -0400887
888 Int4 vector;
889 vector = Insert(vector, x, 0);
890
891 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, result, vector.loadValue());
892 ::basicBlock->appendInst(bitcast);
893 }
894 else if(typeSize(type) == 8)
895 {
896 auto pointer = RValue<Pointer<Byte>>(ptr);
Nicolas Capens1894cfa2017-07-27 14:21:46 -0400897 Int x = *Pointer<Int>(pointer);
Nicolas Capens070d9f42017-04-26 13:36:33 -0400898 Int y = *Pointer<Int>(pointer + 4);
899
900 Int4 vector;
901 vector = Insert(vector, x, 0);
902 vector = Insert(vector, y, 1);
903
904 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, result, vector.loadValue());
905 ::basicBlock->appendInst(bitcast);
906 }
Ben Claytoneb50d252019-04-15 13:50:01 -0400907 else UNREACHABLE("typeSize(type): %d", int(typeSize(type)));
Nicolas Capens070d9f42017-04-26 13:36:33 -0400908 }
909 else
910 {
911 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::LoadSubVector, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
912 auto target = ::context->getConstantUndef(Ice::IceType_i32);
913 auto load = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
914 load->addArg(ptr);
915 load->addArg(::context->getConstantInt32(typeSize(type)));
916 ::basicBlock->appendInst(load);
917 }
Nicolas Capens23d99a42016-09-30 14:57:16 -0400918 }
919 else
920 {
921 auto load = Ice::InstLoad::create(::function, result, ptr, align);
922 ::basicBlock->appendInst(load);
923 }
924
925 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400926 }
927
Nicolas Capens86509d92019-03-21 13:23:50 -0400928 Value *Nucleus::createStore(Value *value, Value *ptr, Type *type, bool isVolatile, unsigned int align, bool atomic, std::memory_order memoryOrder)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400929 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400930 ASSERT(!atomic); // Unimplemented
931 ASSERT(memoryOrder == std::memory_order_relaxed); // Unimplemented
Nicolas Capens86509d92019-03-21 13:23:50 -0400932
Nicolas Capens6a990f82018-07-06 15:54:07 -0400933 #if __has_feature(memory_sanitizer)
934 // Mark all (non-stack) memory writes as initialized by calling __msan_unpoison
935 if(align != 0)
936 {
937 auto call = Ice::InstCall::create(::function, 2, nullptr, ::context->getConstantInt64(reinterpret_cast<intptr_t>(__msan_unpoison)), false);
938 call->addArg(ptr);
939 call->addArg(::context->getConstantInt64(typeSize(type)));
940 ::basicBlock->appendInst(call);
941 }
942 #endif
943
Nicolas Capens23d99a42016-09-30 14:57:16 -0400944 int valueType = (int)reinterpret_cast<intptr_t>(type);
945
Nicolas Capensf4c4eca2017-10-03 14:26:07 -0400946 if((valueType & EmulatedBits) && (align != 0)) // Narrow vector not stored on stack.
Nicolas Capens23d99a42016-09-30 14:57:16 -0400947 {
Nicolas Capens070d9f42017-04-26 13:36:33 -0400948 if(emulateIntrinsics)
949 {
950 if(typeSize(type) == 4)
951 {
952 Ice::Variable *vector = ::function->makeVariable(Ice::IceType_v4i32);
953 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, vector, value);
954 ::basicBlock->appendInst(bitcast);
955
956 RValue<Int4> v(V(vector));
957
958 auto pointer = RValue<Pointer<Byte>>(ptr);
959 Int x = Extract(v, 0);
960 *Pointer<Int>(pointer) = x;
961 }
962 else if(typeSize(type) == 8)
963 {
964 Ice::Variable *vector = ::function->makeVariable(Ice::IceType_v4i32);
965 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, vector, value);
966 ::basicBlock->appendInst(bitcast);
967
968 RValue<Int4> v(V(vector));
969
970 auto pointer = RValue<Pointer<Byte>>(ptr);
971 Int x = Extract(v, 0);
972 *Pointer<Int>(pointer) = x;
973 Int y = Extract(v, 1);
974 *Pointer<Int>(pointer + 4) = y;
975 }
Ben Claytoneb50d252019-04-15 13:50:01 -0400976 else UNREACHABLE("typeSize(type): %d", int(typeSize(type)));
Nicolas Capens070d9f42017-04-26 13:36:33 -0400977 }
978 else
979 {
980 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::StoreSubVector, Ice::Intrinsics::SideEffects_T, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_T};
981 auto target = ::context->getConstantUndef(Ice::IceType_i32);
982 auto store = Ice::InstIntrinsicCall::create(::function, 3, nullptr, target, intrinsic);
983 store->addArg(value);
984 store->addArg(ptr);
985 store->addArg(::context->getConstantInt32(typeSize(type)));
986 ::basicBlock->appendInst(store);
987 }
Nicolas Capens23d99a42016-09-30 14:57:16 -0400988 }
989 else
990 {
Ben Claytoneb50d252019-04-15 13:50:01 -0400991 ASSERT(value->getType() == T(type));
Nicolas Capens23d99a42016-09-30 14:57:16 -0400992
993 auto store = Ice::InstStore::create(::function, value, ptr, align);
994 ::basicBlock->appendInst(store);
995 }
996
Nicolas Capens598f8d82016-09-26 15:09:10 -0400997 return value;
998 }
999
Nicolas Capensd294def2017-01-26 17:44:37 -08001000 Value *Nucleus::createGEP(Value *ptr, Type *type, Value *index, bool unsignedIndex)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001001 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001002 ASSERT(index->getType() == Ice::IceType_i32);
Nicolas Capens8820f642016-09-30 04:42:43 -04001003
Nicolas Capens15060bb2016-12-05 22:17:19 -05001004 if(auto *constant = llvm::dyn_cast<Ice::ConstantInteger32>(index))
1005 {
Nicolas Capens584088c2017-01-26 16:05:18 -08001006 int32_t offset = constant->getValue() * (int)typeSize(type);
Nicolas Capens15060bb2016-12-05 22:17:19 -05001007
1008 if(offset == 0)
1009 {
1010 return ptr;
1011 }
1012
1013 return createAdd(ptr, createConstantInt(offset));
1014 }
1015
Nicolas Capens8820f642016-09-30 04:42:43 -04001016 if(!Ice::isByteSizedType(T(type)))
1017 {
Nicolas Capens584088c2017-01-26 16:05:18 -08001018 index = createMul(index, createConstantInt((int)typeSize(type)));
Nicolas Capens8820f642016-09-30 04:42:43 -04001019 }
1020
1021 if(sizeof(void*) == 8)
1022 {
Nicolas Capensd294def2017-01-26 17:44:37 -08001023 if(unsignedIndex)
1024 {
1025 index = createZExt(index, T(Ice::IceType_i64));
1026 }
1027 else
1028 {
1029 index = createSExt(index, T(Ice::IceType_i64));
1030 }
Nicolas Capens8820f642016-09-30 04:42:43 -04001031 }
1032
1033 return createAdd(ptr, index);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001034 }
1035
Chris Forbes17813932019-04-18 11:45:54 -07001036 Value *Nucleus::createAtomicAdd(Value *ptr, Value *value, std::memory_order memoryOrder)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001037 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001038 UNIMPLEMENTED("createAtomicAdd");
1039 return nullptr;
Nicolas Capens598f8d82016-09-26 15:09:10 -04001040 }
1041
Chris Forbes707ed992019-04-18 18:17:35 -07001042 Value *Nucleus::createAtomicSub(Value *ptr, Value *value, std::memory_order memoryOrder)
1043 {
1044 UNIMPLEMENTED("createAtomicSub");
1045 return nullptr;
1046 }
1047
Chris Forbes17813932019-04-18 11:45:54 -07001048 Value *Nucleus::createAtomicAnd(Value *ptr, Value *value, std::memory_order memoryOrder)
1049 {
1050 UNIMPLEMENTED("createAtomicAnd");
1051 return nullptr;
1052 }
1053
1054 Value *Nucleus::createAtomicOr(Value *ptr, Value *value, std::memory_order memoryOrder)
1055 {
1056 UNIMPLEMENTED("createAtomicOr");
1057 return nullptr;
1058 }
1059
1060 Value *Nucleus::createAtomicXor(Value *ptr, Value *value, std::memory_order memoryOrder)
1061 {
1062 UNIMPLEMENTED("createAtomicXor");
1063 return nullptr;
1064 }
1065
1066 Value *Nucleus::createAtomicMin(Value *ptr, Value *value, std::memory_order memoryOrder)
1067 {
1068 UNIMPLEMENTED("createAtomicMin");
1069 return nullptr;
1070 }
1071
1072 Value *Nucleus::createAtomicMax(Value *ptr, Value *value, std::memory_order memoryOrder)
1073 {
1074 UNIMPLEMENTED("createAtomicMax");
1075 return nullptr;
1076 }
1077
1078 Value *Nucleus::createAtomicExchange(Value *ptr, Value *value, std::memory_order memoryOrder)
1079 {
1080 UNIMPLEMENTED("createAtomicExchange");
1081 return nullptr;
1082 }
1083
Chris Forbesa16238d2019-04-18 16:31:54 -07001084 Value *Nucleus::createAtomicCompareExchange(Value *ptr, Value *value, Value *compare, std::memory_order memoryOrderEqual, std::memory_order memoryOrderUnequal)
1085 {
1086 UNIMPLEMENTED("createAtomicCompareExchange");
1087 return nullptr;
1088 }
1089
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001090 static Value *createCast(Ice::InstCast::OpKind op, Value *v, Type *destType)
1091 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001092 if(v->getType() == T(destType))
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001093 {
1094 return v;
1095 }
1096
1097 Ice::Variable *result = ::function->makeVariable(T(destType));
1098 Ice::InstCast *cast = Ice::InstCast::create(::function, op, result, v);
1099 ::basicBlock->appendInst(cast);
1100
1101 return V(result);
1102 }
1103
Nicolas Capens598f8d82016-09-26 15:09:10 -04001104 Value *Nucleus::createTrunc(Value *v, Type *destType)
1105 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001106 return createCast(Ice::InstCast::Trunc, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001107 }
1108
1109 Value *Nucleus::createZExt(Value *v, Type *destType)
1110 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001111 return createCast(Ice::InstCast::Zext, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001112 }
1113
1114 Value *Nucleus::createSExt(Value *v, Type *destType)
1115 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001116 return createCast(Ice::InstCast::Sext, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001117 }
1118
1119 Value *Nucleus::createFPToSI(Value *v, Type *destType)
1120 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001121 return createCast(Ice::InstCast::Fptosi, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001122 }
1123
Nicolas Capens598f8d82016-09-26 15:09:10 -04001124 Value *Nucleus::createSIToFP(Value *v, Type *destType)
1125 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001126 return createCast(Ice::InstCast::Sitofp, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001127 }
1128
1129 Value *Nucleus::createFPTrunc(Value *v, Type *destType)
1130 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001131 return createCast(Ice::InstCast::Fptrunc, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001132 }
1133
1134 Value *Nucleus::createFPExt(Value *v, Type *destType)
1135 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001136 return createCast(Ice::InstCast::Fpext, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001137 }
1138
1139 Value *Nucleus::createBitCast(Value *v, Type *destType)
1140 {
Nicolas Capens2d8c3702017-07-25 13:56:46 -04001141 // Bitcasts must be between types of the same logical size. But with emulated narrow vectors we need
1142 // support for casting between scalars and wide vectors. For platforms where this is not supported,
1143 // emulate them by writing to the stack and reading back as the destination type.
1144 if(emulateMismatchedBitCast)
1145 {
1146 if(!Ice::isVectorType(v->getType()) && Ice::isVectorType(T(destType)))
1147 {
1148 Value *address = allocateStackVariable(destType);
1149 createStore(v, address, T(v->getType()));
1150 return createLoad(address, destType);
1151 }
1152 else if(Ice::isVectorType(v->getType()) && !Ice::isVectorType(T(destType)))
1153 {
1154 Value *address = allocateStackVariable(T(v->getType()));
1155 createStore(v, address, T(v->getType()));
1156 return createLoad(address, destType);
1157 }
1158 }
1159
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001160 return createCast(Ice::InstCast::Bitcast, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001161 }
1162
Nicolas Capens43dc6292016-10-20 00:01:38 -04001163 static Value *createIntCompare(Ice::InstIcmp::ICond condition, Value *lhs, Value *rhs)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001164 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001165 ASSERT(lhs->getType() == rhs->getType());
Nicolas Capens611642a2016-09-28 16:45:04 -04001166
Nicolas Capens43dc6292016-10-20 00:01:38 -04001167 auto result = ::function->makeVariable(Ice::isScalarIntegerType(lhs->getType()) ? Ice::IceType_i1 : lhs->getType());
1168 auto cmp = Ice::InstIcmp::create(::function, condition, result, lhs, rhs);
Nicolas Capens611642a2016-09-28 16:45:04 -04001169 ::basicBlock->appendInst(cmp);
1170
1171 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001172 }
1173
Nicolas Capens43dc6292016-10-20 00:01:38 -04001174 Value *Nucleus::createICmpEQ(Value *lhs, Value *rhs)
1175 {
1176 return createIntCompare(Ice::InstIcmp::Eq, lhs, rhs);
1177 }
1178
1179 Value *Nucleus::createICmpNE(Value *lhs, Value *rhs)
1180 {
1181 return createIntCompare(Ice::InstIcmp::Ne, lhs, rhs);
1182 }
1183
1184 Value *Nucleus::createICmpUGT(Value *lhs, Value *rhs)
1185 {
1186 return createIntCompare(Ice::InstIcmp::Ugt, lhs, rhs);
1187 }
1188
1189 Value *Nucleus::createICmpUGE(Value *lhs, Value *rhs)
1190 {
1191 return createIntCompare(Ice::InstIcmp::Uge, lhs, rhs);
1192 }
1193
1194 Value *Nucleus::createICmpULT(Value *lhs, Value *rhs)
1195 {
1196 return createIntCompare(Ice::InstIcmp::Ult, lhs, rhs);
1197 }
1198
1199 Value *Nucleus::createICmpULE(Value *lhs, Value *rhs)
1200 {
1201 return createIntCompare(Ice::InstIcmp::Ule, lhs, rhs);
1202 }
1203
1204 Value *Nucleus::createICmpSGT(Value *lhs, Value *rhs)
1205 {
1206 return createIntCompare(Ice::InstIcmp::Sgt, lhs, rhs);
1207 }
1208
1209 Value *Nucleus::createICmpSGE(Value *lhs, Value *rhs)
1210 {
1211 return createIntCompare(Ice::InstIcmp::Sge, lhs, rhs);
1212 }
1213
1214 Value *Nucleus::createICmpSLT(Value *lhs, Value *rhs)
1215 {
1216 return createIntCompare(Ice::InstIcmp::Slt, lhs, rhs);
1217 }
1218
Nicolas Capens598f8d82016-09-26 15:09:10 -04001219 Value *Nucleus::createICmpSLE(Value *lhs, Value *rhs)
1220 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001221 return createIntCompare(Ice::InstIcmp::Sle, lhs, rhs);
1222 }
1223
1224 static Value *createFloatCompare(Ice::InstFcmp::FCond condition, Value *lhs, Value *rhs)
1225 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001226 ASSERT(lhs->getType() == rhs->getType());
1227 ASSERT(Ice::isScalarFloatingType(lhs->getType()) || lhs->getType() == Ice::IceType_v4f32);
Nicolas Capens43dc6292016-10-20 00:01:38 -04001228
1229 auto result = ::function->makeVariable(Ice::isScalarFloatingType(lhs->getType()) ? Ice::IceType_i1 : Ice::IceType_v4i32);
1230 auto cmp = Ice::InstFcmp::create(::function, condition, result, lhs, rhs);
1231 ::basicBlock->appendInst(cmp);
1232
1233 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001234 }
1235
1236 Value *Nucleus::createFCmpOEQ(Value *lhs, Value *rhs)
1237 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001238 return createFloatCompare(Ice::InstFcmp::Oeq, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001239 }
1240
1241 Value *Nucleus::createFCmpOGT(Value *lhs, Value *rhs)
1242 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001243 return createFloatCompare(Ice::InstFcmp::Ogt, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001244 }
1245
1246 Value *Nucleus::createFCmpOGE(Value *lhs, Value *rhs)
1247 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001248 return createFloatCompare(Ice::InstFcmp::Oge, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001249 }
1250
1251 Value *Nucleus::createFCmpOLT(Value *lhs, Value *rhs)
1252 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001253 return createFloatCompare(Ice::InstFcmp::Olt, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001254 }
1255
1256 Value *Nucleus::createFCmpOLE(Value *lhs, Value *rhs)
1257 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001258 return createFloatCompare(Ice::InstFcmp::Ole, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001259 }
1260
1261 Value *Nucleus::createFCmpONE(Value *lhs, Value *rhs)
1262 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001263 return createFloatCompare(Ice::InstFcmp::One, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001264 }
1265
1266 Value *Nucleus::createFCmpORD(Value *lhs, Value *rhs)
1267 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001268 return createFloatCompare(Ice::InstFcmp::Ord, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001269 }
1270
1271 Value *Nucleus::createFCmpUNO(Value *lhs, Value *rhs)
1272 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001273 return createFloatCompare(Ice::InstFcmp::Uno, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001274 }
1275
1276 Value *Nucleus::createFCmpUEQ(Value *lhs, Value *rhs)
1277 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001278 return createFloatCompare(Ice::InstFcmp::Ueq, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001279 }
1280
1281 Value *Nucleus::createFCmpUGT(Value *lhs, Value *rhs)
1282 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001283 return createFloatCompare(Ice::InstFcmp::Ugt, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001284 }
1285
1286 Value *Nucleus::createFCmpUGE(Value *lhs, Value *rhs)
1287 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001288 return createFloatCompare(Ice::InstFcmp::Uge, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001289 }
1290
1291 Value *Nucleus::createFCmpULT(Value *lhs, Value *rhs)
1292 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001293 return createFloatCompare(Ice::InstFcmp::Ult, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001294 }
1295
1296 Value *Nucleus::createFCmpULE(Value *lhs, Value *rhs)
1297 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001298 return createFloatCompare(Ice::InstFcmp::Ule, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001299 }
1300
1301 Value *Nucleus::createFCmpUNE(Value *lhs, Value *rhs)
1302 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001303 return createFloatCompare(Ice::InstFcmp::Une, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001304 }
1305
Nicolas Capense95d5342016-09-30 11:37:28 -04001306 Value *Nucleus::createExtractElement(Value *vector, Type *type, int index)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001307 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04001308 auto result = ::function->makeVariable(T(type));
1309 auto extract = Ice::InstExtractElement::create(::function, result, vector, ::context->getConstantInt32(index));
1310 ::basicBlock->appendInst(extract);
1311
1312 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001313 }
1314
1315 Value *Nucleus::createInsertElement(Value *vector, Value *element, int index)
1316 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04001317 auto result = ::function->makeVariable(vector->getType());
1318 auto insert = Ice::InstInsertElement::create(::function, result, vector, element, ::context->getConstantInt32(index));
1319 ::basicBlock->appendInst(insert);
1320
1321 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001322 }
1323
Nicolas Capense89cd582016-09-30 14:23:47 -04001324 Value *Nucleus::createShuffleVector(Value *V1, Value *V2, const int *select)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001325 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001326 ASSERT(V1->getType() == V2->getType());
Nicolas Capens619c0ab2016-09-30 14:46:24 -04001327
1328 int size = Ice::typeNumElements(V1->getType());
1329 auto result = ::function->makeVariable(V1->getType());
1330 auto shuffle = Ice::InstShuffleVector::create(::function, result, V1, V2);
1331
1332 for(int i = 0; i < size; i++)
1333 {
1334 shuffle->addIndex(llvm::cast<Ice::ConstantInteger32>(::context->getConstantInt32(select[i])));
1335 }
1336
1337 ::basicBlock->appendInst(shuffle);
1338
1339 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001340 }
1341
1342 Value *Nucleus::createSelect(Value *C, Value *ifTrue, Value *ifFalse)
1343 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001344 ASSERT(ifTrue->getType() == ifFalse->getType());
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04001345
1346 auto result = ::function->makeVariable(ifTrue->getType());
1347 auto *select = Ice::InstSelect::create(::function, result, C, ifTrue, ifFalse);
1348 ::basicBlock->appendInst(select);
1349
1350 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001351 }
1352
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001353 SwitchCases *Nucleus::createSwitch(Value *control, BasicBlock *defaultBranch, unsigned numCases)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001354 {
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001355 auto switchInst = Ice::InstSwitch::create(::function, numCases, control, defaultBranch);
1356 ::basicBlock->appendInst(switchInst);
1357
1358 return reinterpret_cast<SwitchCases*>(switchInst);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001359 }
1360
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001361 void Nucleus::addSwitchCase(SwitchCases *switchCases, int label, BasicBlock *branch)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001362 {
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001363 switchCases->addBranch(label, label, branch);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001364 }
1365
1366 void Nucleus::createUnreachable()
1367 {
Nicolas Capensfdcca2d2016-10-20 11:31:36 -04001368 Ice::InstUnreachable *unreachable = Ice::InstUnreachable::create(::function);
1369 ::basicBlock->appendInst(unreachable);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001370 }
1371
Nicolas Capens598f8d82016-09-26 15:09:10 -04001372 Type *Nucleus::getPointerType(Type *ElementType)
1373 {
Nicolas Capense12780d2016-09-27 14:18:07 -04001374 if(sizeof(void*) == 8)
1375 {
1376 return T(Ice::IceType_i64);
1377 }
1378 else
1379 {
1380 return T(Ice::IceType_i32);
1381 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001382 }
1383
Nicolas Capens13ac2322016-10-13 14:52:12 -04001384 Value *Nucleus::createNullValue(Type *Ty)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001385 {
Nicolas Capens73dd7a22016-10-20 13:20:34 -04001386 if(Ice::isVectorType(T(Ty)))
1387 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001388 ASSERT(Ice::typeNumElements(T(Ty)) <= 16);
Nicolas Capens30385f02017-04-18 13:03:47 -04001389 int64_t c[16] = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
Nicolas Capens73dd7a22016-10-20 13:20:34 -04001390 return createConstantVector(c, Ty);
1391 }
1392 else
1393 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001394 return V(::context->getConstantZero(T(Ty)));
Nicolas Capens73dd7a22016-10-20 13:20:34 -04001395 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001396 }
1397
Nicolas Capens13ac2322016-10-13 14:52:12 -04001398 Value *Nucleus::createConstantLong(int64_t i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001399 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001400 return V(::context->getConstantInt64(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001401 }
1402
Nicolas Capens13ac2322016-10-13 14:52:12 -04001403 Value *Nucleus::createConstantInt(int i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001404 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001405 return V(::context->getConstantInt32(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001406 }
1407
Nicolas Capens13ac2322016-10-13 14:52:12 -04001408 Value *Nucleus::createConstantInt(unsigned int i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001409 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001410 return V(::context->getConstantInt32(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001411 }
1412
Nicolas Capens13ac2322016-10-13 14:52:12 -04001413 Value *Nucleus::createConstantBool(bool b)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001414 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001415 return V(::context->getConstantInt1(b));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001416 }
1417
Nicolas Capens13ac2322016-10-13 14:52:12 -04001418 Value *Nucleus::createConstantByte(signed char i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001419 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001420 return V(::context->getConstantInt8(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001421 }
1422
Nicolas Capens13ac2322016-10-13 14:52:12 -04001423 Value *Nucleus::createConstantByte(unsigned char i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001424 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001425 return V(::context->getConstantInt8(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001426 }
1427
Nicolas Capens13ac2322016-10-13 14:52:12 -04001428 Value *Nucleus::createConstantShort(short i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001429 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001430 return V(::context->getConstantInt16(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001431 }
1432
Nicolas Capens13ac2322016-10-13 14:52:12 -04001433 Value *Nucleus::createConstantShort(unsigned short i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001434 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001435 return V(::context->getConstantInt16(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001436 }
1437
Nicolas Capens13ac2322016-10-13 14:52:12 -04001438 Value *Nucleus::createConstantFloat(float x)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001439 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001440 return V(::context->getConstantFloat(x));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001441 }
1442
Nicolas Capens13ac2322016-10-13 14:52:12 -04001443 Value *Nucleus::createNullPointer(Type *Ty)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001444 {
Nicolas Capensa29d6532016-12-05 21:38:09 -05001445 return createNullValue(T(sizeof(void*) == 8 ? Ice::IceType_i64 : Ice::IceType_i32));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001446 }
1447
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001448 Value *Nucleus::createConstantVector(const int64_t *constants, Type *type)
Nicolas Capens13ac2322016-10-13 14:52:12 -04001449 {
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001450 const int vectorSize = 16;
Ben Claytoneb50d252019-04-15 13:50:01 -04001451 ASSERT(Ice::typeWidthInBytes(T(type)) == vectorSize);
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001452 const int alignment = vectorSize;
1453 auto globalPool = ::function->getGlobalPool();
1454
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001455 const int64_t *i = constants;
1456 const double *f = reinterpret_cast<const double*>(constants);
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001457 Ice::VariableDeclaration::DataInitializer *dataInitializer = nullptr;
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001458
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001459 switch((int)reinterpret_cast<intptr_t>(type))
1460 {
1461 case Ice::IceType_v4i32:
Nicolas Capensa4c30b02016-11-08 15:43:17 -05001462 case Ice::IceType_v4i1:
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001463 {
1464 const int initializer[4] = {(int)i[0], (int)i[1], (int)i[2], (int)i[3]};
1465 static_assert(sizeof(initializer) == vectorSize, "!");
1466 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1467 }
1468 break;
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001469 case Ice::IceType_v4f32:
1470 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001471 const float initializer[4] = {(float)f[0], (float)f[1], (float)f[2], (float)f[3]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001472 static_assert(sizeof(initializer) == vectorSize, "!");
1473 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1474 }
1475 break;
1476 case Ice::IceType_v8i16:
Nicolas Capensa4c30b02016-11-08 15:43:17 -05001477 case Ice::IceType_v8i1:
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001478 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001479 const short initializer[8] = {(short)i[0], (short)i[1], (short)i[2], (short)i[3], (short)i[4], (short)i[5], (short)i[6], (short)i[7]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001480 static_assert(sizeof(initializer) == vectorSize, "!");
1481 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1482 }
1483 break;
1484 case Ice::IceType_v16i8:
Nicolas Capensa4c30b02016-11-08 15:43:17 -05001485 case Ice::IceType_v16i1:
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001486 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001487 const char initializer[16] = {(char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[4], (char)i[5], (char)i[6], (char)i[7], (char)i[8], (char)i[9], (char)i[10], (char)i[11], (char)i[12], (char)i[13], (char)i[14], (char)i[15]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001488 static_assert(sizeof(initializer) == vectorSize, "!");
1489 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1490 }
1491 break;
1492 case Type_v2i32:
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001493 {
1494 const int initializer[4] = {(int)i[0], (int)i[1], (int)i[0], (int)i[1]};
1495 static_assert(sizeof(initializer) == vectorSize, "!");
1496 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1497 }
1498 break;
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001499 case Type_v2f32:
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001500 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001501 const float initializer[4] = {(float)f[0], (float)f[1], (float)f[0], (float)f[1]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001502 static_assert(sizeof(initializer) == vectorSize, "!");
1503 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1504 }
1505 break;
1506 case Type_v4i16:
1507 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001508 const short initializer[8] = {(short)i[0], (short)i[1], (short)i[2], (short)i[3], (short)i[0], (short)i[1], (short)i[2], (short)i[3]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001509 static_assert(sizeof(initializer) == vectorSize, "!");
1510 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1511 }
1512 break;
1513 case Type_v8i8:
1514 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001515 const char initializer[16] = {(char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[4], (char)i[5], (char)i[6], (char)i[7], (char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[4], (char)i[5], (char)i[6], (char)i[7]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001516 static_assert(sizeof(initializer) == vectorSize, "!");
1517 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1518 }
1519 break;
1520 case Type_v4i8:
1521 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001522 const char initializer[16] = {(char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[0], (char)i[1], (char)i[2], (char)i[3]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001523 static_assert(sizeof(initializer) == vectorSize, "!");
1524 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1525 }
1526 break;
1527 default:
Ben Claytoneb50d252019-04-15 13:50:01 -04001528 UNREACHABLE("Unknown constant vector type: %d", (int)reinterpret_cast<intptr_t>(type));
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001529 }
1530
1531 auto name = Ice::GlobalString::createWithoutString(::context);
1532 auto *variableDeclaration = Ice::VariableDeclaration::create(globalPool);
1533 variableDeclaration->setName(name);
1534 variableDeclaration->setAlignment(alignment);
1535 variableDeclaration->setIsConstant(true);
1536 variableDeclaration->addInitializer(dataInitializer);
Nicolas Capens87852e12016-11-24 14:45:06 -05001537
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001538 ::function->addGlobal(variableDeclaration);
1539
1540 constexpr int32_t offset = 0;
1541 Ice::Operand *ptr = ::context->getConstantSym(offset, name);
1542
1543 Ice::Variable *result = ::function->makeVariable(T(type));
1544 auto load = Ice::InstLoad::create(::function, result, ptr, alignment);
1545 ::basicBlock->appendInst(load);
1546
1547 return V(result);
Nicolas Capens13ac2322016-10-13 14:52:12 -04001548 }
1549
1550 Value *Nucleus::createConstantVector(const double *constants, Type *type)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001551 {
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001552 return createConstantVector((const int64_t*)constants, type);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001553 }
1554
1555 Type *Void::getType()
1556 {
1557 return T(Ice::IceType_void);
1558 }
1559
Nicolas Capens598f8d82016-09-26 15:09:10 -04001560 Type *Bool::getType()
1561 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001562 return T(Ice::IceType_i1);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001563 }
1564
Nicolas Capens598f8d82016-09-26 15:09:10 -04001565 Type *Byte::getType()
1566 {
Nicolas Capens6d738712016-09-30 04:15:22 -04001567 return T(Ice::IceType_i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001568 }
1569
Nicolas Capens598f8d82016-09-26 15:09:10 -04001570 Type *SByte::getType()
1571 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001572 return T(Ice::IceType_i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001573 }
1574
Nicolas Capens598f8d82016-09-26 15:09:10 -04001575 Type *Short::getType()
1576 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001577 return T(Ice::IceType_i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001578 }
1579
Nicolas Capens598f8d82016-09-26 15:09:10 -04001580 Type *UShort::getType()
1581 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001582 return T(Ice::IceType_i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001583 }
1584
1585 Type *Byte4::getType()
1586 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001587 return T(Type_v4i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001588 }
1589
1590 Type *SByte4::getType()
1591 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001592 return T(Type_v4i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001593 }
1594
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001595 namespace
Nicolas Capens598f8d82016-09-26 15:09:10 -04001596 {
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001597 RValue<Byte> SaturateUnsigned(RValue<Short> x)
1598 {
1599 return Byte(IfThenElse(Int(x) > 0xFF, Int(0xFF), IfThenElse(Int(x) < 0, Int(0), Int(x))));
1600 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001601
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001602 RValue<Byte> Extract(RValue<Byte8> val, int i)
1603 {
1604 return RValue<Byte>(Nucleus::createExtractElement(val.value, Byte::getType(), i));
1605 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001606
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001607 RValue<Byte8> Insert(RValue<Byte8> val, RValue<Byte> element, int i)
1608 {
1609 return RValue<Byte8>(Nucleus::createInsertElement(val.value, element.value, i));
1610 }
Nicolas Capens98436732017-07-25 15:32:12 -04001611 }
1612
Nicolas Capens598f8d82016-09-26 15:09:10 -04001613 RValue<Byte8> AddSat(RValue<Byte8> x, RValue<Byte8> y)
1614 {
Nicolas Capens98436732017-07-25 15:32:12 -04001615 if(emulateIntrinsics)
1616 {
1617 Byte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001618 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 0)) + Int(Extract(y, 0)))), 0);
1619 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 1)) + Int(Extract(y, 1)))), 1);
1620 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 2)) + Int(Extract(y, 2)))), 2);
1621 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 3)) + Int(Extract(y, 3)))), 3);
1622 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 4)) + Int(Extract(y, 4)))), 4);
1623 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 5)) + Int(Extract(y, 5)))), 5);
1624 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 6)) + Int(Extract(y, 6)))), 6);
1625 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 7)) + Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001626
Nicolas Capens98436732017-07-25 15:32:12 -04001627 return result;
1628 }
1629 else
1630 {
1631 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1632 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1633 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1634 auto paddusb = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1635 paddusb->addArg(x.value);
1636 paddusb->addArg(y.value);
1637 ::basicBlock->appendInst(paddusb);
1638
1639 return RValue<Byte8>(V(result));
1640 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001641 }
1642
1643 RValue<Byte8> SubSat(RValue<Byte8> x, RValue<Byte8> y)
1644 {
Nicolas Capens98436732017-07-25 15:32:12 -04001645 if(emulateIntrinsics)
1646 {
1647 Byte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001648 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 0)) - Int(Extract(y, 0)))), 0);
1649 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 1)) - Int(Extract(y, 1)))), 1);
1650 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 2)) - Int(Extract(y, 2)))), 2);
1651 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 3)) - Int(Extract(y, 3)))), 3);
1652 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 4)) - Int(Extract(y, 4)))), 4);
1653 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 5)) - Int(Extract(y, 5)))), 5);
1654 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 6)) - Int(Extract(y, 6)))), 6);
1655 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 7)) - Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001656
Nicolas Capens98436732017-07-25 15:32:12 -04001657 return result;
1658 }
1659 else
1660 {
1661 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1662 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1663 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1664 auto psubusw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1665 psubusw->addArg(x.value);
1666 psubusw->addArg(y.value);
1667 ::basicBlock->appendInst(psubusw);
1668
1669 return RValue<Byte8>(V(result));
1670 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001671 }
1672
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001673 RValue<SByte> Extract(RValue<SByte8> val, int i)
1674 {
1675 return RValue<SByte>(Nucleus::createExtractElement(val.value, SByte::getType(), i));
1676 }
1677
1678 RValue<SByte8> Insert(RValue<SByte8> val, RValue<SByte> element, int i)
1679 {
1680 return RValue<SByte8>(Nucleus::createInsertElement(val.value, element.value, i));
1681 }
1682
1683 RValue<SByte8> operator>>(RValue<SByte8> lhs, unsigned char rhs)
1684 {
1685 if(emulateIntrinsics)
1686 {
1687 SByte8 result;
1688 result = Insert(result, Extract(lhs, 0) >> SByte(rhs), 0);
1689 result = Insert(result, Extract(lhs, 1) >> SByte(rhs), 1);
1690 result = Insert(result, Extract(lhs, 2) >> SByte(rhs), 2);
1691 result = Insert(result, Extract(lhs, 3) >> SByte(rhs), 3);
1692 result = Insert(result, Extract(lhs, 4) >> SByte(rhs), 4);
1693 result = Insert(result, Extract(lhs, 5) >> SByte(rhs), 5);
1694 result = Insert(result, Extract(lhs, 6) >> SByte(rhs), 6);
1695 result = Insert(result, Extract(lhs, 7) >> SByte(rhs), 7);
1696
1697 return result;
1698 }
1699 else
1700 {
1701 #if defined(__i386__) || defined(__x86_64__)
1702 // SSE2 doesn't support byte vector shifts, so shift as shorts and recombine.
Alexis Hetue18c5302017-08-04 11:48:17 -04001703 RValue<Short4> hi = (As<Short4>(lhs) >> rhs) & Short4(0xFF00u);
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001704 RValue<Short4> lo = As<Short4>(As<UShort4>((As<Short4>(lhs) << 8) >> rhs) >> 8);
1705
1706 return As<SByte8>(hi | lo);
1707 #else
1708 return RValue<SByte8>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
1709 #endif
1710 }
1711 }
1712
Nicolas Capens598f8d82016-09-26 15:09:10 -04001713 RValue<Int> SignMask(RValue<Byte8> x)
1714 {
Nicolas Capens091f3502017-10-03 14:56:49 -04001715 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001716 {
1717 Byte8 xx = As<Byte8>(As<SByte8>(x) >> 7) & Byte8(0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80);
1718 return Int(Extract(xx, 0)) | Int(Extract(xx, 1)) | Int(Extract(xx, 2)) | Int(Extract(xx, 3)) | Int(Extract(xx, 4)) | Int(Extract(xx, 5)) | Int(Extract(xx, 6)) | Int(Extract(xx, 7));
1719 }
1720 else
1721 {
1722 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
1723 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1724 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1725 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
1726 movmsk->addArg(x.value);
1727 ::basicBlock->appendInst(movmsk);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001728
Nicolas Capens0f70a7f2017-07-26 13:50:04 -04001729 return RValue<Int>(V(result)) & 0xFF;
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001730 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001731 }
1732
1733// RValue<Byte8> CmpGT(RValue<Byte8> x, RValue<Byte8> y)
1734// {
Nicolas Capens2f970b62016-11-08 14:28:59 -05001735// return RValue<Byte8>(createIntCompare(Ice::InstIcmp::Ugt, x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001736// }
1737
1738 RValue<Byte8> CmpEQ(RValue<Byte8> x, RValue<Byte8> y)
1739 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05001740 return RValue<Byte8>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001741 }
1742
1743 Type *Byte8::getType()
1744 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001745 return T(Type_v8i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001746 }
1747
Nicolas Capens598f8d82016-09-26 15:09:10 -04001748// RValue<SByte8> operator<<(RValue<SByte8> lhs, unsigned char rhs)
1749// {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001750// return RValue<SByte8>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001751// }
1752
1753// RValue<SByte8> operator>>(RValue<SByte8> lhs, unsigned char rhs)
1754// {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001755// return RValue<SByte8>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001756// }
1757
Nicolas Capens33438a62017-09-27 11:47:35 -04001758 RValue<SByte> SaturateSigned(RValue<Short> x)
Nicolas Capens98436732017-07-25 15:32:12 -04001759 {
1760 return SByte(IfThenElse(Int(x) > 0x7F, Int(0x7F), IfThenElse(Int(x) < -0x80, Int(0x80), Int(x))));
1761 }
1762
Nicolas Capens598f8d82016-09-26 15:09:10 -04001763 RValue<SByte8> AddSat(RValue<SByte8> x, RValue<SByte8> y)
1764 {
Nicolas Capens98436732017-07-25 15:32:12 -04001765 if(emulateIntrinsics)
1766 {
1767 SByte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001768 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 0)) + Int(Extract(y, 0)))), 0);
1769 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 1)) + Int(Extract(y, 1)))), 1);
1770 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 2)) + Int(Extract(y, 2)))), 2);
1771 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 3)) + Int(Extract(y, 3)))), 3);
1772 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 4)) + Int(Extract(y, 4)))), 4);
1773 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 5)) + Int(Extract(y, 5)))), 5);
1774 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 6)) + Int(Extract(y, 6)))), 6);
1775 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 7)) + Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001776
Nicolas Capens98436732017-07-25 15:32:12 -04001777 return result;
1778 }
1779 else
1780 {
1781 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1782 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1783 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1784 auto paddsb = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1785 paddsb->addArg(x.value);
1786 paddsb->addArg(y.value);
1787 ::basicBlock->appendInst(paddsb);
1788
1789 return RValue<SByte8>(V(result));
1790 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001791 }
1792
1793 RValue<SByte8> SubSat(RValue<SByte8> x, RValue<SByte8> y)
1794 {
Nicolas Capens98436732017-07-25 15:32:12 -04001795 if(emulateIntrinsics)
1796 {
1797 SByte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001798 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 0)) - Int(Extract(y, 0)))), 0);
1799 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 1)) - Int(Extract(y, 1)))), 1);
1800 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 2)) - Int(Extract(y, 2)))), 2);
1801 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 3)) - Int(Extract(y, 3)))), 3);
1802 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 4)) - Int(Extract(y, 4)))), 4);
1803 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 5)) - Int(Extract(y, 5)))), 5);
1804 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 6)) - Int(Extract(y, 6)))), 6);
1805 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 7)) - Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001806
Nicolas Capens98436732017-07-25 15:32:12 -04001807 return result;
1808 }
1809 else
1810 {
1811 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1812 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1813 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1814 auto psubsb = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1815 psubsb->addArg(x.value);
1816 psubsb->addArg(y.value);
1817 ::basicBlock->appendInst(psubsb);
1818
1819 return RValue<SByte8>(V(result));
1820 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001821 }
1822
Nicolas Capens598f8d82016-09-26 15:09:10 -04001823 RValue<Int> SignMask(RValue<SByte8> x)
1824 {
Nicolas Capens091f3502017-10-03 14:56:49 -04001825 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001826 {
1827 SByte8 xx = (x >> 7) & SByte8(0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80);
1828 return Int(Extract(xx, 0)) | Int(Extract(xx, 1)) | Int(Extract(xx, 2)) | Int(Extract(xx, 3)) | Int(Extract(xx, 4)) | Int(Extract(xx, 5)) | Int(Extract(xx, 6)) | Int(Extract(xx, 7));
1829 }
1830 else
1831 {
1832 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
1833 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1834 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1835 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
1836 movmsk->addArg(x.value);
1837 ::basicBlock->appendInst(movmsk);
Nicolas Capensf2cb9df2016-10-21 17:26:13 -04001838
Nicolas Capens0f70a7f2017-07-26 13:50:04 -04001839 return RValue<Int>(V(result)) & 0xFF;
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001840 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001841 }
1842
1843 RValue<Byte8> CmpGT(RValue<SByte8> x, RValue<SByte8> y)
1844 {
Nicolas Capens2f970b62016-11-08 14:28:59 -05001845 return RValue<Byte8>(createIntCompare(Ice::InstIcmp::Sgt, x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001846 }
1847
1848 RValue<Byte8> CmpEQ(RValue<SByte8> x, RValue<SByte8> y)
1849 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05001850 return RValue<Byte8>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001851 }
1852
1853 Type *SByte8::getType()
1854 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001855 return T(Type_v8i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001856 }
1857
Nicolas Capens598f8d82016-09-26 15:09:10 -04001858 Type *Byte16::getType()
1859 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001860 return T(Ice::IceType_v16i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001861 }
1862
1863 Type *SByte16::getType()
1864 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001865 return T(Ice::IceType_v16i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001866 }
1867
Nicolas Capens16b5f152016-10-13 13:39:01 -04001868 Type *Short2::getType()
1869 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001870 return T(Type_v2i16);
Nicolas Capens16b5f152016-10-13 13:39:01 -04001871 }
1872
Nicolas Capens16b5f152016-10-13 13:39:01 -04001873 Type *UShort2::getType()
1874 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001875 return T(Type_v2i16);
Nicolas Capens16b5f152016-10-13 13:39:01 -04001876 }
1877
Nicolas Capens598f8d82016-09-26 15:09:10 -04001878 Short4::Short4(RValue<Int4> cast)
1879 {
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08001880 int select[8] = {0, 2, 4, 6, 0, 2, 4, 6};
1881 Value *short8 = Nucleus::createBitCast(cast.value, Short8::getType());
1882 Value *packed = Nucleus::createShuffleVector(short8, short8, select);
Nicolas Capensd4227962016-11-09 14:24:25 -05001883
Nicolas Capensbea4dce2017-07-24 16:54:44 -04001884 Value *int2 = RValue<Int2>(Int2(As<Int4>(packed))).value;
Nicolas Capensd4227962016-11-09 14:24:25 -05001885 Value *short4 = Nucleus::createBitCast(int2, Short4::getType());
1886
1887 storeValue(short4);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001888 }
1889
1890// Short4::Short4(RValue<Float> cast)
1891// {
1892// }
1893
1894 Short4::Short4(RValue<Float4> cast)
1895 {
Ben Claytoneb50d252019-04-15 13:50:01 -04001896 UNIMPLEMENTED("Short4::Short4(RValue<Float4> cast)");
Nicolas Capens598f8d82016-09-26 15:09:10 -04001897 }
1898
Nicolas Capens598f8d82016-09-26 15:09:10 -04001899 RValue<Short4> operator<<(RValue<Short4> lhs, unsigned char rhs)
1900 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04001901 if(emulateIntrinsics)
1902 {
1903 Short4 result;
1904 result = Insert(result, Extract(lhs, 0) << Short(rhs), 0);
1905 result = Insert(result, Extract(lhs, 1) << Short(rhs), 1);
1906 result = Insert(result, Extract(lhs, 2) << Short(rhs), 2);
1907 result = Insert(result, Extract(lhs, 3) << Short(rhs), 3);
1908
1909 return result;
1910 }
1911 else
1912 {
1913 return RValue<Short4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
1914 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001915 }
1916
1917 RValue<Short4> operator>>(RValue<Short4> lhs, unsigned char rhs)
1918 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04001919 if(emulateIntrinsics)
1920 {
1921 Short4 result;
1922 result = Insert(result, Extract(lhs, 0) >> Short(rhs), 0);
1923 result = Insert(result, Extract(lhs, 1) >> Short(rhs), 1);
1924 result = Insert(result, Extract(lhs, 2) >> Short(rhs), 2);
1925 result = Insert(result, Extract(lhs, 3) >> Short(rhs), 3);
1926
1927 return result;
1928 }
1929 else
1930 {
1931 return RValue<Short4>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
1932 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001933 }
1934
Nicolas Capens598f8d82016-09-26 15:09:10 -04001935 RValue<Short4> Max(RValue<Short4> x, RValue<Short4> y)
1936 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04001937 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
1938 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sle, condition, x.value, y.value);
1939 ::basicBlock->appendInst(cmp);
1940
1941 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1942 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
1943 ::basicBlock->appendInst(select);
1944
1945 return RValue<Short4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001946 }
1947
1948 RValue<Short4> Min(RValue<Short4> x, RValue<Short4> y)
1949 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04001950 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
1951 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sgt, condition, x.value, y.value);
1952 ::basicBlock->appendInst(cmp);
1953
1954 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1955 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
1956 ::basicBlock->appendInst(select);
1957
1958 return RValue<Short4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001959 }
1960
Nicolas Capens33438a62017-09-27 11:47:35 -04001961 RValue<Short> SaturateSigned(RValue<Int> x)
Nicolas Capens98436732017-07-25 15:32:12 -04001962 {
1963 return Short(IfThenElse(x > 0x7FFF, Int(0x7FFF), IfThenElse(x < -0x8000, Int(0x8000), x)));
1964 }
1965
Nicolas Capens598f8d82016-09-26 15:09:10 -04001966 RValue<Short4> AddSat(RValue<Short4> x, RValue<Short4> y)
1967 {
Nicolas Capens98436732017-07-25 15:32:12 -04001968 if(emulateIntrinsics)
1969 {
1970 Short4 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001971 result = Insert(result, SaturateSigned(Int(Extract(x, 0)) + Int(Extract(y, 0))), 0);
1972 result = Insert(result, SaturateSigned(Int(Extract(x, 1)) + Int(Extract(y, 1))), 1);
1973 result = Insert(result, SaturateSigned(Int(Extract(x, 2)) + Int(Extract(y, 2))), 2);
1974 result = Insert(result, SaturateSigned(Int(Extract(x, 3)) + Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001975
Nicolas Capens98436732017-07-25 15:32:12 -04001976 return result;
1977 }
1978 else
1979 {
1980 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1981 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1982 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1983 auto paddsw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1984 paddsw->addArg(x.value);
1985 paddsw->addArg(y.value);
1986 ::basicBlock->appendInst(paddsw);
1987
1988 return RValue<Short4>(V(result));
1989 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001990 }
1991
1992 RValue<Short4> SubSat(RValue<Short4> x, RValue<Short4> y)
1993 {
Nicolas Capens98436732017-07-25 15:32:12 -04001994 if(emulateIntrinsics)
1995 {
1996 Short4 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001997 result = Insert(result, SaturateSigned(Int(Extract(x, 0)) - Int(Extract(y, 0))), 0);
1998 result = Insert(result, SaturateSigned(Int(Extract(x, 1)) - Int(Extract(y, 1))), 1);
1999 result = Insert(result, SaturateSigned(Int(Extract(x, 2)) - Int(Extract(y, 2))), 2);
2000 result = Insert(result, SaturateSigned(Int(Extract(x, 3)) - Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002001
Nicolas Capens98436732017-07-25 15:32:12 -04002002 return result;
2003 }
2004 else
2005 {
2006 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2007 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2008 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2009 auto psubsw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2010 psubsw->addArg(x.value);
2011 psubsw->addArg(y.value);
2012 ::basicBlock->appendInst(psubsw);
2013
2014 return RValue<Short4>(V(result));
2015 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002016 }
2017
2018 RValue<Short4> MulHigh(RValue<Short4> x, RValue<Short4> y)
2019 {
Nicolas Capens6c157442017-07-25 15:32:12 -04002020 if(emulateIntrinsics)
2021 {
2022 Short4 result;
2023 result = Insert(result, Short((Int(Extract(x, 0)) * Int(Extract(y, 0))) >> 16), 0);
2024 result = Insert(result, Short((Int(Extract(x, 1)) * Int(Extract(y, 1))) >> 16), 1);
2025 result = Insert(result, Short((Int(Extract(x, 2)) * Int(Extract(y, 2))) >> 16), 2);
2026 result = Insert(result, Short((Int(Extract(x, 3)) * Int(Extract(y, 3))) >> 16), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002027
Nicolas Capens6c157442017-07-25 15:32:12 -04002028 return result;
2029 }
2030 else
2031 {
2032 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2033 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::MultiplyHighSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2034 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2035 auto pmulhw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2036 pmulhw->addArg(x.value);
2037 pmulhw->addArg(y.value);
2038 ::basicBlock->appendInst(pmulhw);
2039
2040 return RValue<Short4>(V(result));
2041 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002042 }
2043
2044 RValue<Int2> MulAdd(RValue<Short4> x, RValue<Short4> y)
2045 {
Nicolas Capensafe27e92017-07-25 15:32:12 -04002046 if(emulateIntrinsics)
2047 {
2048 Int2 result;
2049 result = Insert(result, Int(Extract(x, 0)) * Int(Extract(y, 0)) + Int(Extract(x, 1)) * Int(Extract(y, 1)), 0);
2050 result = Insert(result, Int(Extract(x, 2)) * Int(Extract(y, 2)) + Int(Extract(x, 3)) * Int(Extract(y, 3)), 1);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002051
Nicolas Capensafe27e92017-07-25 15:32:12 -04002052 return result;
2053 }
2054 else
2055 {
2056 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2057 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::MultiplyAddPairs, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2058 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2059 auto pmaddwd = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2060 pmaddwd->addArg(x.value);
2061 pmaddwd->addArg(y.value);
2062 ::basicBlock->appendInst(pmaddwd);
2063
2064 return As<Int2>(V(result));
2065 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002066 }
2067
Nicolas Capens33438a62017-09-27 11:47:35 -04002068 RValue<SByte8> PackSigned(RValue<Short4> x, RValue<Short4> y)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002069 {
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002070 if(emulateIntrinsics)
2071 {
2072 SByte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04002073 result = Insert(result, SaturateSigned(Extract(x, 0)), 0);
2074 result = Insert(result, SaturateSigned(Extract(x, 1)), 1);
2075 result = Insert(result, SaturateSigned(Extract(x, 2)), 2);
2076 result = Insert(result, SaturateSigned(Extract(x, 3)), 3);
2077 result = Insert(result, SaturateSigned(Extract(y, 0)), 4);
2078 result = Insert(result, SaturateSigned(Extract(y, 1)), 5);
2079 result = Insert(result, SaturateSigned(Extract(y, 2)), 6);
2080 result = Insert(result, SaturateSigned(Extract(y, 3)), 7);
Nicolas Capensec54a172016-10-25 17:32:37 -04002081
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002082 return result;
2083 }
2084 else
2085 {
2086 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
2087 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2088 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2089 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2090 pack->addArg(x.value);
2091 pack->addArg(y.value);
2092 ::basicBlock->appendInst(pack);
2093
2094 return As<SByte8>(Swizzle(As<Int4>(V(result)), 0x88));
2095 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002096 }
2097
Nicolas Capens33438a62017-09-27 11:47:35 -04002098 RValue<Byte8> PackUnsigned(RValue<Short4> x, RValue<Short4> y)
2099 {
2100 if(emulateIntrinsics)
2101 {
2102 Byte8 result;
2103 result = Insert(result, SaturateUnsigned(Extract(x, 0)), 0);
2104 result = Insert(result, SaturateUnsigned(Extract(x, 1)), 1);
2105 result = Insert(result, SaturateUnsigned(Extract(x, 2)), 2);
2106 result = Insert(result, SaturateUnsigned(Extract(x, 3)), 3);
2107 result = Insert(result, SaturateUnsigned(Extract(y, 0)), 4);
2108 result = Insert(result, SaturateUnsigned(Extract(y, 1)), 5);
2109 result = Insert(result, SaturateUnsigned(Extract(y, 2)), 6);
2110 result = Insert(result, SaturateUnsigned(Extract(y, 3)), 7);
2111
2112 return result;
2113 }
2114 else
2115 {
2116 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
2117 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2118 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2119 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2120 pack->addArg(x.value);
2121 pack->addArg(y.value);
2122 ::basicBlock->appendInst(pack);
2123
2124 return As<Byte8>(Swizzle(As<Int4>(V(result)), 0x88));
2125 }
2126 }
2127
Nicolas Capens598f8d82016-09-26 15:09:10 -04002128 RValue<Short4> CmpGT(RValue<Short4> x, RValue<Short4> y)
2129 {
Nicolas Capens2f970b62016-11-08 14:28:59 -05002130 return RValue<Short4>(createIntCompare(Ice::InstIcmp::Sgt, x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002131 }
2132
2133 RValue<Short4> CmpEQ(RValue<Short4> x, RValue<Short4> y)
2134 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002135 return RValue<Short4>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002136 }
2137
2138 Type *Short4::getType()
2139 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04002140 return T(Type_v4i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002141 }
2142
Nicolas Capens598f8d82016-09-26 15:09:10 -04002143 UShort4::UShort4(RValue<Float4> cast, bool saturate)
2144 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002145 if(saturate)
2146 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05002147 if(CPUID::SSE4_1)
Nicolas Capensd4227962016-11-09 14:24:25 -05002148 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002149 // x86 produces 0x80000000 on 32-bit integer overflow/underflow.
2150 // PackUnsigned takes care of 0x0000 saturation.
2151 Int4 int4(Min(cast, Float4(0xFFFF)));
2152 *this = As<UShort4>(PackUnsigned(int4, int4));
2153 }
2154 else if(CPUID::ARM)
2155 {
2156 // ARM saturates the 32-bit integer result on overflow/undeflow.
2157 Int4 int4(cast);
Nicolas Capens33438a62017-09-27 11:47:35 -04002158 *this = As<UShort4>(PackUnsigned(int4, int4));
Nicolas Capensd4227962016-11-09 14:24:25 -05002159 }
2160 else
2161 {
2162 *this = Short4(Int4(Max(Min(cast, Float4(0xFFFF)), Float4(0x0000))));
2163 }
2164 }
2165 else
2166 {
2167 *this = Short4(Int4(cast));
2168 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002169 }
2170
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002171 RValue<UShort> Extract(RValue<UShort4> val, int i)
2172 {
2173 return RValue<UShort>(Nucleus::createExtractElement(val.value, UShort::getType(), i));
2174 }
2175
2176 RValue<UShort4> Insert(RValue<UShort4> val, RValue<UShort> element, int i)
2177 {
2178 return RValue<UShort4>(Nucleus::createInsertElement(val.value, element.value, i));
2179 }
2180
Nicolas Capens598f8d82016-09-26 15:09:10 -04002181 RValue<UShort4> operator<<(RValue<UShort4> lhs, unsigned char rhs)
2182 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002183 if(emulateIntrinsics)
2184 {
2185 UShort4 result;
2186 result = Insert(result, Extract(lhs, 0) << UShort(rhs), 0);
2187 result = Insert(result, Extract(lhs, 1) << UShort(rhs), 1);
2188 result = Insert(result, Extract(lhs, 2) << UShort(rhs), 2);
2189 result = Insert(result, Extract(lhs, 3) << UShort(rhs), 3);
2190
2191 return result;
2192 }
2193 else
2194 {
2195 return RValue<UShort4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2196 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002197 }
2198
2199 RValue<UShort4> operator>>(RValue<UShort4> lhs, unsigned char rhs)
2200 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002201 if(emulateIntrinsics)
2202 {
2203 UShort4 result;
2204 result = Insert(result, Extract(lhs, 0) >> UShort(rhs), 0);
2205 result = Insert(result, Extract(lhs, 1) >> UShort(rhs), 1);
2206 result = Insert(result, Extract(lhs, 2) >> UShort(rhs), 2);
2207 result = Insert(result, Extract(lhs, 3) >> UShort(rhs), 3);
2208
2209 return result;
2210 }
2211 else
2212 {
2213 return RValue<UShort4>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2214 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002215 }
2216
Nicolas Capens598f8d82016-09-26 15:09:10 -04002217 RValue<UShort4> Max(RValue<UShort4> x, RValue<UShort4> y)
2218 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002219 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
2220 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ule, condition, x.value, y.value);
2221 ::basicBlock->appendInst(cmp);
2222
2223 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2224 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2225 ::basicBlock->appendInst(select);
2226
2227 return RValue<UShort4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002228 }
2229
2230 RValue<UShort4> Min(RValue<UShort4> x, RValue<UShort4> y)
2231 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002232 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
2233 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ugt, condition, x.value, y.value);
2234 ::basicBlock->appendInst(cmp);
2235
2236 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2237 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2238 ::basicBlock->appendInst(select);
2239
2240 return RValue<UShort4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002241 }
2242
Nicolas Capens7f301812017-10-02 17:32:34 -04002243 RValue<UShort> SaturateUnsigned(RValue<Int> x)
Nicolas Capens98436732017-07-25 15:32:12 -04002244 {
2245 return UShort(IfThenElse(x > 0xFFFF, Int(0xFFFF), IfThenElse(x < 0, Int(0), x)));
2246 }
2247
Nicolas Capens598f8d82016-09-26 15:09:10 -04002248 RValue<UShort4> AddSat(RValue<UShort4> x, RValue<UShort4> y)
2249 {
Nicolas Capens98436732017-07-25 15:32:12 -04002250 if(emulateIntrinsics)
2251 {
2252 UShort4 result;
Nicolas Capens7f301812017-10-02 17:32:34 -04002253 result = Insert(result, SaturateUnsigned(Int(Extract(x, 0)) + Int(Extract(y, 0))), 0);
2254 result = Insert(result, SaturateUnsigned(Int(Extract(x, 1)) + Int(Extract(y, 1))), 1);
2255 result = Insert(result, SaturateUnsigned(Int(Extract(x, 2)) + Int(Extract(y, 2))), 2);
2256 result = Insert(result, SaturateUnsigned(Int(Extract(x, 3)) + Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002257
Nicolas Capens98436732017-07-25 15:32:12 -04002258 return result;
2259 }
2260 else
2261 {
2262 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2263 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2264 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2265 auto paddusw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2266 paddusw->addArg(x.value);
2267 paddusw->addArg(y.value);
2268 ::basicBlock->appendInst(paddusw);
2269
2270 return RValue<UShort4>(V(result));
2271 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002272 }
2273
2274 RValue<UShort4> SubSat(RValue<UShort4> x, RValue<UShort4> y)
2275 {
Nicolas Capens98436732017-07-25 15:32:12 -04002276 if(emulateIntrinsics)
2277 {
2278 UShort4 result;
Nicolas Capens7f301812017-10-02 17:32:34 -04002279 result = Insert(result, SaturateUnsigned(Int(Extract(x, 0)) - Int(Extract(y, 0))), 0);
2280 result = Insert(result, SaturateUnsigned(Int(Extract(x, 1)) - Int(Extract(y, 1))), 1);
2281 result = Insert(result, SaturateUnsigned(Int(Extract(x, 2)) - Int(Extract(y, 2))), 2);
2282 result = Insert(result, SaturateUnsigned(Int(Extract(x, 3)) - Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002283
Nicolas Capens98436732017-07-25 15:32:12 -04002284 return result;
2285 }
2286 else
2287 {
2288 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2289 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2290 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2291 auto psubusw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2292 psubusw->addArg(x.value);
2293 psubusw->addArg(y.value);
2294 ::basicBlock->appendInst(psubusw);
2295
2296 return RValue<UShort4>(V(result));
2297 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002298 }
2299
2300 RValue<UShort4> MulHigh(RValue<UShort4> x, RValue<UShort4> y)
2301 {
Nicolas Capens6c157442017-07-25 15:32:12 -04002302 if(emulateIntrinsics)
2303 {
2304 UShort4 result;
2305 result = Insert(result, UShort((UInt(Extract(x, 0)) * UInt(Extract(y, 0))) >> 16), 0);
2306 result = Insert(result, UShort((UInt(Extract(x, 1)) * UInt(Extract(y, 1))) >> 16), 1);
2307 result = Insert(result, UShort((UInt(Extract(x, 2)) * UInt(Extract(y, 2))) >> 16), 2);
2308 result = Insert(result, UShort((UInt(Extract(x, 3)) * UInt(Extract(y, 3))) >> 16), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002309
Nicolas Capens6c157442017-07-25 15:32:12 -04002310 return result;
2311 }
2312 else
2313 {
2314 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2315 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::MultiplyHighUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2316 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2317 auto pmulhuw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2318 pmulhuw->addArg(x.value);
2319 pmulhuw->addArg(y.value);
2320 ::basicBlock->appendInst(pmulhuw);
2321
2322 return RValue<UShort4>(V(result));
2323 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002324 }
2325
Chris Forbesaa8f6992019-03-01 14:18:30 -08002326 RValue<Int4> MulHigh(RValue<Int4> x, RValue<Int4> y)
2327 {
2328 // TODO: For x86, build an intrinsics version of this which uses shuffles + pmuludq.
2329
2330 // Scalarized implementation.
2331 Int4 result;
2332 result = Insert(result, Int((Long(Extract(x, 0)) * Long(Extract(y, 0))) >> Long(Int(32))), 0);
2333 result = Insert(result, Int((Long(Extract(x, 1)) * Long(Extract(y, 1))) >> Long(Int(32))), 1);
2334 result = Insert(result, Int((Long(Extract(x, 2)) * Long(Extract(y, 2))) >> Long(Int(32))), 2);
2335 result = Insert(result, Int((Long(Extract(x, 3)) * Long(Extract(y, 3))) >> Long(Int(32))), 3);
2336
2337 return result;
2338 }
2339
2340 RValue<UInt4> MulHigh(RValue<UInt4> x, RValue<UInt4> y)
2341 {
2342 // TODO: For x86, build an intrinsics version of this which uses shuffles + pmuludq.
2343
2344 if(false) // Partial product based implementation.
2345 {
2346 auto xh = x >> 16;
2347 auto yh = y >> 16;
2348 auto xl = x & UInt4(0x0000FFFF);
2349 auto yl = y & UInt4(0x0000FFFF);
2350 auto xlyh = xl * yh;
2351 auto xhyl = xh * yl;
2352 auto xlyhh = xlyh >> 16;
2353 auto xhylh = xhyl >> 16;
2354 auto xlyhl = xlyh & UInt4(0x0000FFFF);
2355 auto xhyll = xhyl & UInt4(0x0000FFFF);
2356 auto xlylh = (xl * yl) >> 16;
2357 auto oflow = (xlyhl + xhyll + xlylh) >> 16;
2358
2359 return (xh * yh) + (xlyhh + xhylh) + oflow;
2360 }
2361
2362 // Scalarized implementation.
2363 Int4 result;
2364 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 0))) * Long(UInt(Extract(As<Int4>(y), 0)))) >> Long(Int(32))), 0);
2365 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 1))) * Long(UInt(Extract(As<Int4>(y), 1)))) >> Long(Int(32))), 1);
2366 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 2))) * Long(UInt(Extract(As<Int4>(y), 2)))) >> Long(Int(32))), 2);
2367 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 3))) * Long(UInt(Extract(As<Int4>(y), 3)))) >> Long(Int(32))), 3);
2368
2369 return As<UInt4>(result);
2370 }
2371
Nicolas Capens598f8d82016-09-26 15:09:10 -04002372 RValue<UShort4> Average(RValue<UShort4> x, RValue<UShort4> y)
2373 {
Ben Claytoneb50d252019-04-15 13:50:01 -04002374 UNIMPLEMENTED("RValue<UShort4> Average(RValue<UShort4> x, RValue<UShort4> y)");
2375 return UShort4(0);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002376 }
2377
Nicolas Capens598f8d82016-09-26 15:09:10 -04002378 Type *UShort4::getType()
2379 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04002380 return T(Type_v4i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002381 }
2382
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002383 RValue<Short> Extract(RValue<Short8> val, int i)
2384 {
2385 return RValue<Short>(Nucleus::createExtractElement(val.value, Short::getType(), i));
2386 }
2387
2388 RValue<Short8> Insert(RValue<Short8> val, RValue<Short> element, int i)
2389 {
2390 return RValue<Short8>(Nucleus::createInsertElement(val.value, element.value, i));
2391 }
2392
Nicolas Capens598f8d82016-09-26 15:09:10 -04002393 RValue<Short8> operator<<(RValue<Short8> lhs, unsigned char rhs)
2394 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002395 if(emulateIntrinsics)
2396 {
2397 Short8 result;
2398 result = Insert(result, Extract(lhs, 0) << Short(rhs), 0);
2399 result = Insert(result, Extract(lhs, 1) << Short(rhs), 1);
2400 result = Insert(result, Extract(lhs, 2) << Short(rhs), 2);
2401 result = Insert(result, Extract(lhs, 3) << Short(rhs), 3);
2402 result = Insert(result, Extract(lhs, 4) << Short(rhs), 4);
2403 result = Insert(result, Extract(lhs, 5) << Short(rhs), 5);
2404 result = Insert(result, Extract(lhs, 6) << Short(rhs), 6);
2405 result = Insert(result, Extract(lhs, 7) << Short(rhs), 7);
2406
2407 return result;
2408 }
2409 else
2410 {
2411 return RValue<Short8>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2412 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002413 }
2414
2415 RValue<Short8> operator>>(RValue<Short8> lhs, unsigned char rhs)
2416 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002417 if(emulateIntrinsics)
2418 {
2419 Short8 result;
2420 result = Insert(result, Extract(lhs, 0) >> Short(rhs), 0);
2421 result = Insert(result, Extract(lhs, 1) >> Short(rhs), 1);
2422 result = Insert(result, Extract(lhs, 2) >> Short(rhs), 2);
2423 result = Insert(result, Extract(lhs, 3) >> Short(rhs), 3);
2424 result = Insert(result, Extract(lhs, 4) >> Short(rhs), 4);
2425 result = Insert(result, Extract(lhs, 5) >> Short(rhs), 5);
2426 result = Insert(result, Extract(lhs, 6) >> Short(rhs), 6);
2427 result = Insert(result, Extract(lhs, 7) >> Short(rhs), 7);
2428
2429 return result;
2430 }
2431 else
2432 {
2433 return RValue<Short8>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
2434 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002435 }
2436
2437 RValue<Int4> MulAdd(RValue<Short8> x, RValue<Short8> y)
2438 {
Ben Claytoneb50d252019-04-15 13:50:01 -04002439 UNIMPLEMENTED("RValue<Int4> MulAdd(RValue<Short8> x, RValue<Short8> y)");
2440 return Int4(0);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002441 }
2442
Nicolas Capens598f8d82016-09-26 15:09:10 -04002443 RValue<Short8> MulHigh(RValue<Short8> x, RValue<Short8> y)
2444 {
Ben Claytoneb50d252019-04-15 13:50:01 -04002445 UNIMPLEMENTED("RValue<Short8> MulHigh(RValue<Short8> x, RValue<Short8> y)");
2446 return Short8(0);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002447 }
2448
2449 Type *Short8::getType()
2450 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002451 return T(Ice::IceType_v8i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002452 }
2453
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002454 RValue<UShort> Extract(RValue<UShort8> val, int i)
2455 {
2456 return RValue<UShort>(Nucleus::createExtractElement(val.value, UShort::getType(), i));
2457 }
2458
2459 RValue<UShort8> Insert(RValue<UShort8> val, RValue<UShort> element, int i)
2460 {
2461 return RValue<UShort8>(Nucleus::createInsertElement(val.value, element.value, i));
2462 }
2463
Nicolas Capens598f8d82016-09-26 15:09:10 -04002464 RValue<UShort8> operator<<(RValue<UShort8> lhs, unsigned char rhs)
2465 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002466 if(emulateIntrinsics)
2467 {
2468 UShort8 result;
2469 result = Insert(result, Extract(lhs, 0) << UShort(rhs), 0);
2470 result = Insert(result, Extract(lhs, 1) << UShort(rhs), 1);
2471 result = Insert(result, Extract(lhs, 2) << UShort(rhs), 2);
2472 result = Insert(result, Extract(lhs, 3) << UShort(rhs), 3);
2473 result = Insert(result, Extract(lhs, 4) << UShort(rhs), 4);
2474 result = Insert(result, Extract(lhs, 5) << UShort(rhs), 5);
2475 result = Insert(result, Extract(lhs, 6) << UShort(rhs), 6);
2476 result = Insert(result, Extract(lhs, 7) << UShort(rhs), 7);
2477
2478 return result;
2479 }
2480 else
2481 {
2482 return RValue<UShort8>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2483 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002484 }
2485
2486 RValue<UShort8> operator>>(RValue<UShort8> lhs, unsigned char rhs)
2487 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002488 if(emulateIntrinsics)
2489 {
2490 UShort8 result;
2491 result = Insert(result, Extract(lhs, 0) >> UShort(rhs), 0);
2492 result = Insert(result, Extract(lhs, 1) >> UShort(rhs), 1);
2493 result = Insert(result, Extract(lhs, 2) >> UShort(rhs), 2);
2494 result = Insert(result, Extract(lhs, 3) >> UShort(rhs), 3);
2495 result = Insert(result, Extract(lhs, 4) >> UShort(rhs), 4);
2496 result = Insert(result, Extract(lhs, 5) >> UShort(rhs), 5);
2497 result = Insert(result, Extract(lhs, 6) >> UShort(rhs), 6);
2498 result = Insert(result, Extract(lhs, 7) >> UShort(rhs), 7);
2499
2500 return result;
2501 }
2502 else
2503 {
2504 return RValue<UShort8>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2505 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002506 }
2507
Nicolas Capens598f8d82016-09-26 15:09:10 -04002508 RValue<UShort8> Swizzle(RValue<UShort8> x, char select0, char select1, char select2, char select3, char select4, char select5, char select6, char select7)
2509 {
Ben Claytoneb50d252019-04-15 13:50:01 -04002510 UNIMPLEMENTED("RValue<UShort8> Swizzle(RValue<UShort8> x, char select0, char select1, char select2, char select3, char select4, char select5, char select6, char select7)");
2511 return UShort8(0);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002512 }
2513
2514 RValue<UShort8> MulHigh(RValue<UShort8> x, RValue<UShort8> y)
2515 {
Ben Claytoneb50d252019-04-15 13:50:01 -04002516 UNIMPLEMENTED("RValue<UShort8> MulHigh(RValue<UShort8> x, RValue<UShort8> y)");
2517 return UShort8(0);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002518 }
2519
2520 // FIXME: Implement as Shuffle(x, y, Select(i0, ..., i16)) and Shuffle(x, y, SELECT_PACK_REPEAT(element))
2521// RValue<UShort8> PackRepeat(RValue<Byte16> x, RValue<Byte16> y, int element)
2522// {
Ben Claytoneb50d252019-04-15 13:50:01 -04002523// ASSERT(false && "UNIMPLEMENTED"); return RValue<UShort8>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002524// }
2525
2526 Type *UShort8::getType()
2527 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002528 return T(Ice::IceType_v8i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002529 }
2530
Nicolas Capens96d4e092016-11-18 14:22:38 -05002531 RValue<Int> operator++(Int &val, int) // Post-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002532 {
Nicolas Capens5b41ba32016-12-08 14:34:00 -05002533 RValue<Int> res = val;
Nicolas Capensd1229402016-11-07 16:05:22 -05002534 val += 1;
2535 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002536 }
2537
Nicolas Capens96d4e092016-11-18 14:22:38 -05002538 const Int &operator++(Int &val) // Pre-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002539 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002540 val += 1;
2541 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002542 }
2543
Nicolas Capens96d4e092016-11-18 14:22:38 -05002544 RValue<Int> operator--(Int &val, int) // Post-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002545 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002546 RValue<Int> res = val;
2547 val -= 1;
2548 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002549 }
2550
Nicolas Capens96d4e092016-11-18 14:22:38 -05002551 const Int &operator--(Int &val) // Pre-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002552 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002553 val -= 1;
2554 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002555 }
2556
Nicolas Capens598f8d82016-09-26 15:09:10 -04002557 RValue<Int> RoundInt(RValue<Float> cast)
2558 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002559 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensf7b75882017-04-26 09:30:47 -04002560 {
2561 // Push the fractional part off the mantissa. Accurate up to +/-2^22.
2562 return Int((cast + Float(0x00C00000)) - Float(0x00C00000));
2563 }
2564 else
2565 {
2566 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
2567 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Nearbyint, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2568 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2569 auto nearbyint = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
2570 nearbyint->addArg(cast.value);
2571 ::basicBlock->appendInst(nearbyint);
Nicolas Capensa8086512016-11-07 17:32:17 -05002572
Nicolas Capensf7b75882017-04-26 09:30:47 -04002573 return RValue<Int>(V(result));
2574 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002575 }
2576
2577 Type *Int::getType()
2578 {
2579 return T(Ice::IceType_i32);
2580 }
2581
Nicolas Capens598f8d82016-09-26 15:09:10 -04002582 Type *Long::getType()
2583 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002584 return T(Ice::IceType_i64);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002585 }
2586
Nicolas Capens598f8d82016-09-26 15:09:10 -04002587 UInt::UInt(RValue<Float> cast)
2588 {
Nicolas Capensc70a1162016-12-03 00:16:14 -05002589 // Smallest positive value representable in UInt, but not in Int
2590 const unsigned int ustart = 0x80000000u;
2591 const float ustartf = float(ustart);
2592
2593 // If the value is negative, store 0, otherwise store the result of the conversion
2594 storeValue((~(As<Int>(cast) >> 31) &
2595 // Check if the value can be represented as an Int
2596 IfThenElse(cast >= ustartf,
2597 // If the value is too large, subtract ustart and re-add it after conversion.
2598 As<Int>(As<UInt>(Int(cast - Float(ustartf))) + UInt(ustart)),
2599 // Otherwise, just convert normally
2600 Int(cast))).value);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002601 }
2602
Nicolas Capens96d4e092016-11-18 14:22:38 -05002603 RValue<UInt> operator++(UInt &val, int) // Post-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002604 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002605 RValue<UInt> res = val;
2606 val += 1;
2607 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002608 }
2609
Nicolas Capens96d4e092016-11-18 14:22:38 -05002610 const UInt &operator++(UInt &val) // Pre-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002611 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002612 val += 1;
2613 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002614 }
2615
Nicolas Capens96d4e092016-11-18 14:22:38 -05002616 RValue<UInt> operator--(UInt &val, int) // Post-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002617 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002618 RValue<UInt> res = val;
2619 val -= 1;
2620 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002621 }
2622
Nicolas Capens96d4e092016-11-18 14:22:38 -05002623 const UInt &operator--(UInt &val) // Pre-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002624 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002625 val -= 1;
2626 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002627 }
2628
Nicolas Capens598f8d82016-09-26 15:09:10 -04002629// RValue<UInt> RoundUInt(RValue<Float> cast)
2630// {
Ben Claytoneb50d252019-04-15 13:50:01 -04002631// ASSERT(false && "UNIMPLEMENTED"); return RValue<UInt>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002632// }
2633
2634 Type *UInt::getType()
2635 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002636 return T(Ice::IceType_i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002637 }
2638
2639// Int2::Int2(RValue<Int> cast)
2640// {
2641// Value *extend = Nucleus::createZExt(cast.value, Long::getType());
2642// Value *vector = Nucleus::createBitCast(extend, Int2::getType());
2643//
2644// Constant *shuffle[2];
2645// shuffle[0] = Nucleus::createConstantInt(0);
2646// shuffle[1] = Nucleus::createConstantInt(0);
2647//
2648// Value *replicate = Nucleus::createShuffleVector(vector, UndefValue::get(Int2::getType()), Nucleus::createConstantVector(shuffle, 2));
2649//
2650// storeValue(replicate);
2651// }
2652
Nicolas Capens598f8d82016-09-26 15:09:10 -04002653 RValue<Int2> operator<<(RValue<Int2> lhs, unsigned char rhs)
2654 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002655 if(emulateIntrinsics)
2656 {
2657 Int2 result;
2658 result = Insert(result, Extract(lhs, 0) << Int(rhs), 0);
2659 result = Insert(result, Extract(lhs, 1) << Int(rhs), 1);
2660
2661 return result;
2662 }
2663 else
2664 {
2665 return RValue<Int2>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2666 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002667 }
2668
2669 RValue<Int2> operator>>(RValue<Int2> lhs, unsigned char rhs)
2670 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002671 if(emulateIntrinsics)
2672 {
2673 Int2 result;
2674 result = Insert(result, Extract(lhs, 0) >> Int(rhs), 0);
2675 result = Insert(result, Extract(lhs, 1) >> Int(rhs), 1);
2676
2677 return result;
2678 }
2679 else
2680 {
2681 return RValue<Int2>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
2682 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002683 }
2684
Nicolas Capens598f8d82016-09-26 15:09:10 -04002685 Type *Int2::getType()
2686 {
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04002687 return T(Type_v2i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002688 }
2689
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002690 RValue<UInt> Extract(RValue<UInt2> val, int i)
2691 {
2692 return RValue<UInt>(Nucleus::createExtractElement(val.value, UInt::getType(), i));
2693 }
2694
2695 RValue<UInt2> Insert(RValue<UInt2> val, RValue<UInt> element, int i)
2696 {
2697 return RValue<UInt2>(Nucleus::createInsertElement(val.value, element.value, i));
2698 }
2699
Nicolas Capens598f8d82016-09-26 15:09:10 -04002700 RValue<UInt2> operator<<(RValue<UInt2> lhs, unsigned char rhs)
2701 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002702 if(emulateIntrinsics)
2703 {
2704 UInt2 result;
2705 result = Insert(result, Extract(lhs, 0) << UInt(rhs), 0);
2706 result = Insert(result, Extract(lhs, 1) << UInt(rhs), 1);
2707
2708 return result;
2709 }
2710 else
2711 {
2712 return RValue<UInt2>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2713 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002714 }
2715
2716 RValue<UInt2> operator>>(RValue<UInt2> lhs, unsigned char rhs)
2717 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002718 if(emulateIntrinsics)
2719 {
2720 UInt2 result;
2721 result = Insert(result, Extract(lhs, 0) >> UInt(rhs), 0);
2722 result = Insert(result, Extract(lhs, 1) >> UInt(rhs), 1);
2723
2724 return result;
2725 }
2726 else
2727 {
2728 return RValue<UInt2>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2729 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002730 }
2731
Nicolas Capens598f8d82016-09-26 15:09:10 -04002732 Type *UInt2::getType()
2733 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002734 return T(Type_v2i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002735 }
2736
Nicolas Capenscb986762017-01-20 11:34:37 -05002737 Int4::Int4(RValue<Byte4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002738 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002739 Value *x = Nucleus::createBitCast(cast.value, Int::getType());
2740 Value *a = Nucleus::createInsertElement(loadValue(), x, 0);
2741
2742 Value *e;
2743 int swizzle[16] = {0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23};
2744 Value *b = Nucleus::createBitCast(a, Byte16::getType());
2745 Value *c = Nucleus::createShuffleVector(b, V(Nucleus::createNullValue(Byte16::getType())), swizzle);
2746
2747 int swizzle2[8] = {0, 8, 1, 9, 2, 10, 3, 11};
2748 Value *d = Nucleus::createBitCast(c, Short8::getType());
2749 e = Nucleus::createShuffleVector(d, V(Nucleus::createNullValue(Short8::getType())), swizzle2);
2750
2751 Value *f = Nucleus::createBitCast(e, Int4::getType());
2752 storeValue(f);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002753 }
2754
Nicolas Capenscb986762017-01-20 11:34:37 -05002755 Int4::Int4(RValue<SByte4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002756 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002757 Value *x = Nucleus::createBitCast(cast.value, Int::getType());
2758 Value *a = Nucleus::createInsertElement(loadValue(), x, 0);
2759
Nicolas Capensd4227962016-11-09 14:24:25 -05002760 int swizzle[16] = {0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7};
2761 Value *b = Nucleus::createBitCast(a, Byte16::getType());
2762 Value *c = Nucleus::createShuffleVector(b, b, swizzle);
2763
2764 int swizzle2[8] = {0, 0, 1, 1, 2, 2, 3, 3};
2765 Value *d = Nucleus::createBitCast(c, Short8::getType());
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002766 Value *e = Nucleus::createShuffleVector(d, d, swizzle2);
Nicolas Capensd4227962016-11-09 14:24:25 -05002767
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002768 *this = As<Int4>(e) >> 24;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002769 }
2770
Nicolas Capenscb986762017-01-20 11:34:37 -05002771 Int4::Int4(RValue<Short4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002772 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002773 int swizzle[8] = {0, 0, 1, 1, 2, 2, 3, 3};
2774 Value *c = Nucleus::createShuffleVector(cast.value, cast.value, swizzle);
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002775
2776 *this = As<Int4>(c) >> 16;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002777 }
2778
Nicolas Capenscb986762017-01-20 11:34:37 -05002779 Int4::Int4(RValue<UShort4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002780 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002781 int swizzle[8] = {0, 8, 1, 9, 2, 10, 3, 11};
2782 Value *c = Nucleus::createShuffleVector(cast.value, Short8(0, 0, 0, 0, 0, 0, 0, 0).loadValue(), swizzle);
2783 Value *d = Nucleus::createBitCast(c, Int4::getType());
2784 storeValue(d);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002785 }
2786
Nicolas Capenscb986762017-01-20 11:34:37 -05002787 Int4::Int4(RValue<Int> rhs) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002788 {
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08002789 Value *vector = Nucleus::createBitCast(rhs.value, Int4::getType());
Nicolas Capensd4227962016-11-09 14:24:25 -05002790
2791 int swizzle[4] = {0, 0, 0, 0};
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08002792 Value *replicate = Nucleus::createShuffleVector(vector, vector, swizzle);
Nicolas Capensd4227962016-11-09 14:24:25 -05002793
2794 storeValue(replicate);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002795 }
2796
Nicolas Capens598f8d82016-09-26 15:09:10 -04002797 RValue<Int4> operator<<(RValue<Int4> lhs, unsigned char rhs)
2798 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002799 if(emulateIntrinsics)
2800 {
2801 Int4 result;
2802 result = Insert(result, Extract(lhs, 0) << Int(rhs), 0);
2803 result = Insert(result, Extract(lhs, 1) << Int(rhs), 1);
2804 result = Insert(result, Extract(lhs, 2) << Int(rhs), 2);
2805 result = Insert(result, Extract(lhs, 3) << Int(rhs), 3);
2806
2807 return result;
2808 }
2809 else
2810 {
2811 return RValue<Int4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2812 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002813 }
2814
2815 RValue<Int4> operator>>(RValue<Int4> lhs, unsigned char rhs)
2816 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002817 if(emulateIntrinsics)
2818 {
2819 Int4 result;
2820 result = Insert(result, Extract(lhs, 0) >> Int(rhs), 0);
2821 result = Insert(result, Extract(lhs, 1) >> Int(rhs), 1);
2822 result = Insert(result, Extract(lhs, 2) >> Int(rhs), 2);
2823 result = Insert(result, Extract(lhs, 3) >> Int(rhs), 3);
2824
2825 return result;
2826 }
2827 else
2828 {
2829 return RValue<Int4>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
2830 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002831 }
2832
Nicolas Capens598f8d82016-09-26 15:09:10 -04002833 RValue<Int4> CmpEQ(RValue<Int4> x, RValue<Int4> y)
2834 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002835 return RValue<Int4>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002836 }
2837
2838 RValue<Int4> CmpLT(RValue<Int4> x, RValue<Int4> y)
2839 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002840 return RValue<Int4>(Nucleus::createICmpSLT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002841 }
2842
2843 RValue<Int4> CmpLE(RValue<Int4> x, RValue<Int4> y)
2844 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002845 return RValue<Int4>(Nucleus::createICmpSLE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002846 }
2847
2848 RValue<Int4> CmpNEQ(RValue<Int4> x, RValue<Int4> y)
2849 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002850 return RValue<Int4>(Nucleus::createICmpNE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002851 }
2852
2853 RValue<Int4> CmpNLT(RValue<Int4> x, RValue<Int4> y)
2854 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002855 return RValue<Int4>(Nucleus::createICmpSGE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002856 }
2857
2858 RValue<Int4> CmpNLE(RValue<Int4> x, RValue<Int4> y)
2859 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002860 return RValue<Int4>(Nucleus::createICmpSGT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002861 }
2862
2863 RValue<Int4> Max(RValue<Int4> x, RValue<Int4> y)
2864 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002865 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
2866 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sle, condition, x.value, y.value);
2867 ::basicBlock->appendInst(cmp);
2868
2869 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
2870 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2871 ::basicBlock->appendInst(select);
2872
2873 return RValue<Int4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002874 }
2875
2876 RValue<Int4> Min(RValue<Int4> x, RValue<Int4> y)
2877 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002878 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
2879 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sgt, condition, x.value, y.value);
2880 ::basicBlock->appendInst(cmp);
2881
2882 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
2883 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2884 ::basicBlock->appendInst(select);
2885
2886 return RValue<Int4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002887 }
2888
2889 RValue<Int4> RoundInt(RValue<Float4> cast)
2890 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002891 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensf7b75882017-04-26 09:30:47 -04002892 {
2893 // Push the fractional part off the mantissa. Accurate up to +/-2^22.
2894 return Int4((cast + Float4(0x00C00000)) - Float4(0x00C00000));
2895 }
2896 else
2897 {
2898 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
2899 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Nearbyint, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2900 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2901 auto nearbyint = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
2902 nearbyint->addArg(cast.value);
2903 ::basicBlock->appendInst(nearbyint);
Nicolas Capensa8086512016-11-07 17:32:17 -05002904
Nicolas Capensf7b75882017-04-26 09:30:47 -04002905 return RValue<Int4>(V(result));
2906 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002907 }
2908
Nicolas Capens33438a62017-09-27 11:47:35 -04002909 RValue<Short8> PackSigned(RValue<Int4> x, RValue<Int4> y)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002910 {
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002911 if(emulateIntrinsics)
2912 {
2913 Short8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04002914 result = Insert(result, SaturateSigned(Extract(x, 0)), 0);
2915 result = Insert(result, SaturateSigned(Extract(x, 1)), 1);
2916 result = Insert(result, SaturateSigned(Extract(x, 2)), 2);
2917 result = Insert(result, SaturateSigned(Extract(x, 3)), 3);
2918 result = Insert(result, SaturateSigned(Extract(y, 0)), 4);
2919 result = Insert(result, SaturateSigned(Extract(y, 1)), 5);
2920 result = Insert(result, SaturateSigned(Extract(y, 2)), 6);
2921 result = Insert(result, SaturateSigned(Extract(y, 3)), 7);
Nicolas Capensec54a172016-10-25 17:32:37 -04002922
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002923 return result;
2924 }
2925 else
2926 {
2927 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2928 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2929 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2930 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2931 pack->addArg(x.value);
2932 pack->addArg(y.value);
2933 ::basicBlock->appendInst(pack);
2934
2935 return RValue<Short8>(V(result));
2936 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002937 }
2938
Nicolas Capens33438a62017-09-27 11:47:35 -04002939 RValue<UShort8> PackUnsigned(RValue<Int4> x, RValue<Int4> y)
2940 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002941 if(emulateIntrinsics || !(CPUID::SSE4_1 || CPUID::ARM))
2942 {
2943 RValue<Int4> sx = As<Int4>(x);
2944 RValue<Int4> bx = (sx & ~(sx >> 31)) - Int4(0x8000);
2945
2946 RValue<Int4> sy = As<Int4>(y);
2947 RValue<Int4> by = (sy & ~(sy >> 31)) - Int4(0x8000);
2948
2949 return As<UShort8>(PackSigned(bx, by) + Short8(0x8000u));
2950 }
2951 else
Nicolas Capens33438a62017-09-27 11:47:35 -04002952 {
2953 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2954 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2955 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2956 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2957 pack->addArg(x.value);
2958 pack->addArg(y.value);
2959 ::basicBlock->appendInst(pack);
2960
2961 return RValue<UShort8>(V(result));
2962 }
Nicolas Capens33438a62017-09-27 11:47:35 -04002963 }
2964
Nicolas Capens598f8d82016-09-26 15:09:10 -04002965 RValue<Int> SignMask(RValue<Int4> x)
2966 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002967 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04002968 {
2969 Int4 xx = (x >> 31) & Int4(0x00000001, 0x00000002, 0x00000004, 0x00000008);
2970 return Extract(xx, 0) | Extract(xx, 1) | Extract(xx, 2) | Extract(xx, 3);
2971 }
2972 else
2973 {
2974 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
2975 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2976 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2977 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
2978 movmsk->addArg(x.value);
2979 ::basicBlock->appendInst(movmsk);
Nicolas Capensf2cb9df2016-10-21 17:26:13 -04002980
Nicolas Capensd6cacad2017-07-25 15:32:12 -04002981 return RValue<Int>(V(result));
2982 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002983 }
2984
Nicolas Capens598f8d82016-09-26 15:09:10 -04002985 Type *Int4::getType()
2986 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04002987 return T(Ice::IceType_v4i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002988 }
2989
Nicolas Capenscb986762017-01-20 11:34:37 -05002990 UInt4::UInt4(RValue<Float4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002991 {
Nicolas Capensc70a1162016-12-03 00:16:14 -05002992 // Smallest positive value representable in UInt, but not in Int
2993 const unsigned int ustart = 0x80000000u;
2994 const float ustartf = float(ustart);
2995
2996 // Check if the value can be represented as an Int
2997 Int4 uiValue = CmpNLT(cast, Float4(ustartf));
2998 // If the value is too large, subtract ustart and re-add it after conversion.
2999 uiValue = (uiValue & As<Int4>(As<UInt4>(Int4(cast - Float4(ustartf))) + UInt4(ustart))) |
3000 // Otherwise, just convert normally
3001 (~uiValue & Int4(cast));
3002 // If the value is negative, store 0, otherwise store the result of the conversion
3003 storeValue((~(As<Int4>(cast) >> 31) & uiValue).value);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003004 }
3005
Nicolas Capens598f8d82016-09-26 15:09:10 -04003006 RValue<UInt4> operator<<(RValue<UInt4> lhs, unsigned char rhs)
3007 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04003008 if(emulateIntrinsics)
3009 {
3010 UInt4 result;
3011 result = Insert(result, Extract(lhs, 0) << UInt(rhs), 0);
3012 result = Insert(result, Extract(lhs, 1) << UInt(rhs), 1);
3013 result = Insert(result, Extract(lhs, 2) << UInt(rhs), 2);
3014 result = Insert(result, Extract(lhs, 3) << UInt(rhs), 3);
3015
3016 return result;
3017 }
3018 else
3019 {
3020 return RValue<UInt4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
3021 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003022 }
3023
3024 RValue<UInt4> operator>>(RValue<UInt4> lhs, unsigned char rhs)
3025 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04003026 if(emulateIntrinsics)
3027 {
3028 UInt4 result;
3029 result = Insert(result, Extract(lhs, 0) >> UInt(rhs), 0);
3030 result = Insert(result, Extract(lhs, 1) >> UInt(rhs), 1);
3031 result = Insert(result, Extract(lhs, 2) >> UInt(rhs), 2);
3032 result = Insert(result, Extract(lhs, 3) >> UInt(rhs), 3);
3033
3034 return result;
3035 }
3036 else
3037 {
3038 return RValue<UInt4>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
3039 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003040 }
3041
Nicolas Capens598f8d82016-09-26 15:09:10 -04003042 RValue<UInt4> CmpEQ(RValue<UInt4> x, RValue<UInt4> y)
3043 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003044 return RValue<UInt4>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003045 }
3046
3047 RValue<UInt4> CmpLT(RValue<UInt4> x, RValue<UInt4> y)
3048 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003049 return RValue<UInt4>(Nucleus::createICmpULT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003050 }
3051
3052 RValue<UInt4> CmpLE(RValue<UInt4> x, RValue<UInt4> y)
3053 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003054 return RValue<UInt4>(Nucleus::createICmpULE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003055 }
3056
3057 RValue<UInt4> CmpNEQ(RValue<UInt4> x, RValue<UInt4> y)
3058 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003059 return RValue<UInt4>(Nucleus::createICmpNE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003060 }
3061
3062 RValue<UInt4> CmpNLT(RValue<UInt4> x, RValue<UInt4> y)
3063 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003064 return RValue<UInt4>(Nucleus::createICmpUGE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003065 }
3066
3067 RValue<UInt4> CmpNLE(RValue<UInt4> x, RValue<UInt4> y)
3068 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003069 return RValue<UInt4>(Nucleus::createICmpUGT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003070 }
3071
3072 RValue<UInt4> Max(RValue<UInt4> x, RValue<UInt4> y)
3073 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003074 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
3075 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ule, condition, x.value, y.value);
3076 ::basicBlock->appendInst(cmp);
3077
3078 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
3079 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
3080 ::basicBlock->appendInst(select);
3081
3082 return RValue<UInt4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003083 }
3084
3085 RValue<UInt4> Min(RValue<UInt4> x, RValue<UInt4> y)
3086 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003087 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
3088 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ugt, condition, x.value, y.value);
3089 ::basicBlock->appendInst(cmp);
3090
3091 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
3092 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
3093 ::basicBlock->appendInst(select);
3094
3095 return RValue<UInt4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003096 }
3097
Nicolas Capens598f8d82016-09-26 15:09:10 -04003098 Type *UInt4::getType()
3099 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04003100 return T(Ice::IceType_v4i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003101 }
3102
Ben Claytonec1aeb82019-03-04 19:33:27 +00003103 Type *Half::getType()
3104 {
3105 return T(Ice::IceType_i16);
3106 }
Alexis Hetu734e2572018-12-20 14:00:49 -05003107
Nicolas Capens598f8d82016-09-26 15:09:10 -04003108 RValue<Float> Rcp_pp(RValue<Float> x, bool exactAtPow2)
3109 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003110 return 1.0f / x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003111 }
3112
3113 RValue<Float> RcpSqrt_pp(RValue<Float> x)
3114 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003115 return Rcp_pp(Sqrt(x));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003116 }
3117
3118 RValue<Float> Sqrt(RValue<Float> x)
3119 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003120 Ice::Variable *result = ::function->makeVariable(Ice::IceType_f32);
3121 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Sqrt, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3122 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3123 auto sqrt = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
3124 sqrt->addArg(x.value);
3125 ::basicBlock->appendInst(sqrt);
3126
3127 return RValue<Float>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003128 }
3129
3130 RValue<Float> Round(RValue<Float> x)
3131 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003132 return Float4(Round(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003133 }
3134
3135 RValue<Float> Trunc(RValue<Float> x)
3136 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003137 return Float4(Trunc(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003138 }
3139
3140 RValue<Float> Frac(RValue<Float> x)
3141 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003142 return Float4(Frac(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003143 }
3144
3145 RValue<Float> Floor(RValue<Float> x)
3146 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003147 return Float4(Floor(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003148 }
3149
3150 RValue<Float> Ceil(RValue<Float> x)
3151 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003152 return Float4(Ceil(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003153 }
3154
3155 Type *Float::getType()
3156 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04003157 return T(Ice::IceType_f32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003158 }
3159
Nicolas Capens598f8d82016-09-26 15:09:10 -04003160 Type *Float2::getType()
3161 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04003162 return T(Type_v2f32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003163 }
3164
Nicolas Capenscb986762017-01-20 11:34:37 -05003165 Float4::Float4(RValue<Float> rhs) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04003166 {
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08003167 Value *vector = Nucleus::createBitCast(rhs.value, Float4::getType());
Nicolas Capensd4227962016-11-09 14:24:25 -05003168
3169 int swizzle[4] = {0, 0, 0, 0};
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08003170 Value *replicate = Nucleus::createShuffleVector(vector, vector, swizzle);
Nicolas Capensd4227962016-11-09 14:24:25 -05003171
3172 storeValue(replicate);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003173 }
3174
Nicolas Capens598f8d82016-09-26 15:09:10 -04003175 RValue<Float4> Max(RValue<Float4> x, RValue<Float4> y)
3176 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003177 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003178 auto cmp = Ice::InstFcmp::create(::function, Ice::InstFcmp::Ogt, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003179 ::basicBlock->appendInst(cmp);
3180
3181 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003182 auto select = Ice::InstSelect::create(::function, result, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003183 ::basicBlock->appendInst(select);
3184
3185 return RValue<Float4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003186 }
3187
3188 RValue<Float4> Min(RValue<Float4> x, RValue<Float4> y)
3189 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003190 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003191 auto cmp = Ice::InstFcmp::create(::function, Ice::InstFcmp::Olt, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003192 ::basicBlock->appendInst(cmp);
3193
3194 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003195 auto select = Ice::InstSelect::create(::function, result, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003196 ::basicBlock->appendInst(select);
3197
3198 return RValue<Float4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003199 }
3200
3201 RValue<Float4> Rcp_pp(RValue<Float4> x, bool exactAtPow2)
3202 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003203 return Float4(1.0f) / x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003204 }
3205
3206 RValue<Float4> RcpSqrt_pp(RValue<Float4> x)
3207 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003208 return Rcp_pp(Sqrt(x));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003209 }
3210
3211 RValue<Float4> Sqrt(RValue<Float4> x)
3212 {
Nicolas Capens091f3502017-10-03 14:56:49 -04003213 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capens9f737d32017-07-25 17:26:14 -04003214 {
3215 Float4 result;
3216 result.x = Sqrt(Float(Float4(x).x));
3217 result.y = Sqrt(Float(Float4(x).y));
3218 result.z = Sqrt(Float(Float4(x).z));
3219 result.w = Sqrt(Float(Float4(x).w));
Nicolas Capensd52e9362016-10-31 23:23:15 -04003220
Nicolas Capens9f737d32017-07-25 17:26:14 -04003221 return result;
3222 }
3223 else
3224 {
3225 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3226 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Sqrt, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3227 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3228 auto sqrt = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
3229 sqrt->addArg(x.value);
3230 ::basicBlock->appendInst(sqrt);
3231
3232 return RValue<Float4>(V(result));
3233 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003234 }
3235
Nicolas Capens598f8d82016-09-26 15:09:10 -04003236 RValue<Int> SignMask(RValue<Float4> x)
3237 {
Nicolas Capens091f3502017-10-03 14:56:49 -04003238 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04003239 {
3240 Int4 xx = (As<Int4>(x) >> 31) & Int4(0x00000001, 0x00000002, 0x00000004, 0x00000008);
3241 return Extract(xx, 0) | Extract(xx, 1) | Extract(xx, 2) | Extract(xx, 3);
3242 }
3243 else
3244 {
3245 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
3246 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3247 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3248 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
3249 movmsk->addArg(x.value);
3250 ::basicBlock->appendInst(movmsk);
Nicolas Capensf2cb9df2016-10-21 17:26:13 -04003251
Nicolas Capensd6cacad2017-07-25 15:32:12 -04003252 return RValue<Int>(V(result));
3253 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003254 }
3255
3256 RValue<Int4> CmpEQ(RValue<Float4> x, RValue<Float4> y)
3257 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003258 return RValue<Int4>(Nucleus::createFCmpOEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003259 }
3260
3261 RValue<Int4> CmpLT(RValue<Float4> x, RValue<Float4> y)
3262 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003263 return RValue<Int4>(Nucleus::createFCmpOLT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003264 }
3265
3266 RValue<Int4> CmpLE(RValue<Float4> x, RValue<Float4> y)
3267 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003268 return RValue<Int4>(Nucleus::createFCmpOLE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003269 }
3270
3271 RValue<Int4> CmpNEQ(RValue<Float4> x, RValue<Float4> y)
3272 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003273 return RValue<Int4>(Nucleus::createFCmpONE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003274 }
3275
3276 RValue<Int4> CmpNLT(RValue<Float4> x, RValue<Float4> y)
3277 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003278 return RValue<Int4>(Nucleus::createFCmpOGE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003279 }
3280
3281 RValue<Int4> CmpNLE(RValue<Float4> x, RValue<Float4> y)
3282 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003283 return RValue<Int4>(Nucleus::createFCmpOGT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003284 }
3285
Ben Claytonec1aeb82019-03-04 19:33:27 +00003286 RValue<Int4> CmpUEQ(RValue<Float4> x, RValue<Float4> y)
3287 {
3288 return RValue<Int4>(Nucleus::createFCmpUEQ(x.value, y.value));
3289 }
3290
3291 RValue<Int4> CmpULT(RValue<Float4> x, RValue<Float4> y)
3292 {
3293 return RValue<Int4>(Nucleus::createFCmpULT(x.value, y.value));
3294 }
3295
3296 RValue<Int4> CmpULE(RValue<Float4> x, RValue<Float4> y)
3297 {
3298 return RValue<Int4>(Nucleus::createFCmpULE(x.value, y.value));
3299 }
3300
3301 RValue<Int4> CmpUNEQ(RValue<Float4> x, RValue<Float4> y)
3302 {
3303 return RValue<Int4>(Nucleus::createFCmpUNE(x.value, y.value));
3304 }
3305
3306 RValue<Int4> CmpUNLT(RValue<Float4> x, RValue<Float4> y)
3307 {
3308 return RValue<Int4>(Nucleus::createFCmpUGE(x.value, y.value));
3309 }
3310
3311 RValue<Int4> CmpUNLE(RValue<Float4> x, RValue<Float4> y)
3312 {
3313 return RValue<Int4>(Nucleus::createFCmpUGT(x.value, y.value));
3314 }
3315
Nicolas Capens598f8d82016-09-26 15:09:10 -04003316 RValue<Float4> Round(RValue<Float4> x)
3317 {
Nicolas Capens091f3502017-10-03 14:56:49 -04003318 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensf7b75882017-04-26 09:30:47 -04003319 {
3320 // Push the fractional part off the mantissa. Accurate up to +/-2^22.
3321 return (x + Float4(0x00C00000)) - Float4(0x00C00000);
3322 }
3323 else if(CPUID::SSE4_1)
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003324 {
3325 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3326 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3327 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3328 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3329 round->addArg(x.value);
3330 round->addArg(::context->getConstantInt32(0));
3331 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003332
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003333 return RValue<Float4>(V(result));
3334 }
3335 else
3336 {
3337 return Float4(RoundInt(x));
3338 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003339 }
3340
3341 RValue<Float4> Trunc(RValue<Float4> x)
3342 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003343 if(CPUID::SSE4_1)
3344 {
3345 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3346 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3347 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3348 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3349 round->addArg(x.value);
3350 round->addArg(::context->getConstantInt32(3));
3351 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003352
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003353 return RValue<Float4>(V(result));
3354 }
3355 else
3356 {
3357 return Float4(Int4(x));
3358 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003359 }
3360
3361 RValue<Float4> Frac(RValue<Float4> x)
3362 {
Nicolas Capensb9230422017-07-17 10:27:33 -04003363 Float4 frc;
3364
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003365 if(CPUID::SSE4_1)
3366 {
Nicolas Capensb9230422017-07-17 10:27:33 -04003367 frc = x - Floor(x);
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003368 }
3369 else
3370 {
Nicolas Capensb9230422017-07-17 10:27:33 -04003371 frc = x - Float4(Int4(x)); // Signed fractional part.
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003372
Nicolas Capensb9230422017-07-17 10:27:33 -04003373 frc += As<Float4>(As<Int4>(CmpNLE(Float4(0.0f), frc)) & As<Int4>(Float4(1, 1, 1, 1))); // Add 1.0 if negative.
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003374 }
Nicolas Capensb9230422017-07-17 10:27:33 -04003375
3376 // x - floor(x) can be 1.0 for very small negative x.
3377 // Clamp against the value just below 1.0.
3378 return Min(frc, As<Float4>(Int4(0x3F7FFFFF)));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003379 }
3380
3381 RValue<Float4> Floor(RValue<Float4> x)
3382 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003383 if(CPUID::SSE4_1)
3384 {
3385 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3386 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3387 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3388 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3389 round->addArg(x.value);
3390 round->addArg(::context->getConstantInt32(1));
3391 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003392
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003393 return RValue<Float4>(V(result));
3394 }
3395 else
3396 {
3397 return x - Frac(x);
3398 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003399 }
3400
3401 RValue<Float4> Ceil(RValue<Float4> x)
3402 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003403 if(CPUID::SSE4_1)
3404 {
3405 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3406 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3407 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3408 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3409 round->addArg(x.value);
3410 round->addArg(::context->getConstantInt32(2));
3411 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003412
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003413 return RValue<Float4>(V(result));
3414 }
3415 else
3416 {
3417 return -Floor(-x);
3418 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003419 }
3420
3421 Type *Float4::getType()
3422 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04003423 return T(Ice::IceType_v4f32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003424 }
3425
Nicolas Capens598f8d82016-09-26 15:09:10 -04003426 RValue<Long> Ticks()
3427 {
Ben Claytoneb50d252019-04-15 13:50:01 -04003428 UNIMPLEMENTED("RValue<Long> Ticks()");
3429 return Long(Int(0));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003430 }
Ben Clayton147c4912019-04-11 00:17:59 -04003431
Ben Claytond853c122019-04-16 17:51:49 -04003432 RValue<Pointer<Byte>> ConstantPointer(void const * ptr)
3433 {
3434 return RValue<Pointer<Byte>>(V(::context->getConstantInt64(reinterpret_cast<intptr_t>(ptr))));
3435 }
3436
3437 Value* Call(RValue<Pointer<Byte>> fptr, Type* retTy, std::initializer_list<Value*> args, std::initializer_list<Type*> argTys)
3438 {
3439 // FIXME: This does not currently work on Windows.
3440 Ice::Variable *ret = nullptr;
3441 if (retTy != nullptr)
3442 {
3443 ret = ::function->makeVariable(T(retTy));
3444 }
3445 auto call = Ice::InstCall::create(::function, args.size(), ret, V(fptr.value), false);
3446 for (auto arg : args)
3447 {
3448 call->addArg(V(arg));
3449 }
3450 ::basicBlock->appendInst(call);
3451 return V(ret);
3452 }
3453
Ben Clayton147c4912019-04-11 00:17:59 -04003454 // Below are functions currently unimplemented for the Subzero backend.
3455 // They are stubbed to satisfy the linker.
Ben Clayton147c4912019-04-11 00:17:59 -04003456 RValue<Float4> Sin(RValue<Float4> x) { UNIMPLEMENTED("Subzero Sin()"); return Float4(0); }
3457 RValue<Float4> Cos(RValue<Float4> x) { UNIMPLEMENTED("Subzero Cos()"); return Float4(0); }
3458 RValue<Float4> Tan(RValue<Float4> x) { UNIMPLEMENTED("Subzero Tan()"); return Float4(0); }
3459 RValue<Float4> Asin(RValue<Float4> x) { UNIMPLEMENTED("Subzero Asin()"); return Float4(0); }
3460 RValue<Float4> Acos(RValue<Float4> x) { UNIMPLEMENTED("Subzero Acos()"); return Float4(0); }
3461 RValue<Float4> Atan(RValue<Float4> x) { UNIMPLEMENTED("Subzero Atan()"); return Float4(0); }
3462 RValue<Float4> Sinh(RValue<Float4> x) { UNIMPLEMENTED("Subzero Sinh()"); return Float4(0); }
3463 RValue<Float4> Cosh(RValue<Float4> x) { UNIMPLEMENTED("Subzero Cosh()"); return Float4(0); }
3464 RValue<Float4> Tanh(RValue<Float4> x) { UNIMPLEMENTED("Subzero Tanh()"); return Float4(0); }
3465 RValue<Float4> Asinh(RValue<Float4> x) { UNIMPLEMENTED("Subzero Asinh()"); return Float4(0); }
3466 RValue<Float4> Acosh(RValue<Float4> x) { UNIMPLEMENTED("Subzero Acosh()"); return Float4(0); }
3467 RValue<Float4> Atanh(RValue<Float4> x) { UNIMPLEMENTED("Subzero Atanh()"); return Float4(0); }
3468 RValue<Float4> Atan2(RValue<Float4> x, RValue<Float4> y) { UNIMPLEMENTED("Subzero Atan2()"); return Float4(0); }
3469 RValue<Float4> Pow(RValue<Float4> x, RValue<Float4> y) { UNIMPLEMENTED("Subzero Pow()"); return Float4(0); }
3470 RValue<Float4> Exp(RValue<Float4> x) { UNIMPLEMENTED("Subzero Exp()"); return Float4(0); }
3471 RValue<Float4> Log(RValue<Float4> x) { UNIMPLEMENTED("Subzero Log()"); return Float4(0); }
3472 RValue<Float4> Exp2(RValue<Float4> x) { UNIMPLEMENTED("Subzero Exp2()"); return Float4(0); }
3473 RValue<Float4> Log2(RValue<Float4> x) { UNIMPLEMENTED("Subzero Log2()"); return Float4(0); }
3474 RValue<UInt4> Ctlz(RValue<UInt4> x, bool isZeroUndef) { UNIMPLEMENTED("Subzero Ctlz()"); return UInt4(0); }
3475 RValue<UInt4> Cttz(RValue<UInt4> x, bool isZeroUndef) { UNIMPLEMENTED("Subzero Cttz()"); return UInt4(0); }
Ben Claytonac07ed82019-03-26 14:17:41 +00003476
3477 void EmitDebugLocation() {}
3478 void EmitDebugVariable(Value* value) {}
3479 void FlushDebug() {}
Nicolas Capens598f8d82016-09-26 15:09:10 -04003480}