blob: dee4af0ebe709bde9ff381e132b03d5b27ed574e [file] [log] [blame]
// Copyright 2016 The SwiftShader Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//    http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
14
Nicolas Capens598f8d82016-09-26 15:09:10 -040015#include "Reactor.hpp"
Nicolas Capens598f8d82016-09-26 15:09:10 -040016
Nicolas Capens2ae9d742016-11-24 14:43:05 -050017#include "Optimizer.hpp"
Nicolas Capens1a3ce872018-10-10 10:42:36 -040018#include "ExecutableMemory.hpp"
Nicolas Capensa062f322018-09-06 15:34:46 -040019
Nicolas Capens598f8d82016-09-26 15:09:10 -040020#include "src/IceTypes.h"
21#include "src/IceCfg.h"
22#include "src/IceELFStreamer.h"
23#include "src/IceGlobalContext.h"
24#include "src/IceCfgNode.h"
25#include "src/IceELFObjectWriter.h"
Nicolas Capens8dfd9a72016-10-13 17:44:51 -040026#include "src/IceGlobalInits.h"
Nicolas Capens598f8d82016-09-26 15:09:10 -040027
28#include "llvm/Support/FileSystem.h"
29#include "llvm/Support/raw_os_ostream.h"
Nicolas Capens6a990f82018-07-06 15:54:07 -040030#include "llvm/Support/Compiler.h"
31
32#if __has_feature(memory_sanitizer)
33#include <sanitizer/msan_interface.h>
34#endif
Nicolas Capens598f8d82016-09-26 15:09:10 -040035
Nicolas Capensbd65da92017-01-05 16:31:06 -050036#if defined(_WIN32)
Alexis Hetu113e33a2017-01-19 10:49:19 -050037#ifndef WIN32_LEAN_AND_MEAN
Nicolas Capens598f8d82016-09-26 15:09:10 -040038#define WIN32_LEAN_AND_MEAN
Alexis Hetu113e33a2017-01-19 10:49:19 -050039#endif // !WIN32_LEAN_AND_MEAN
40#ifndef NOMINMAX
Nicolas Capens598f8d82016-09-26 15:09:10 -040041#define NOMINMAX
Alexis Hetu113e33a2017-01-19 10:49:19 -050042#endif // !NOMINMAX
Nicolas Capens598f8d82016-09-26 15:09:10 -040043#include <Windows.h>
Nicolas Capensbd65da92017-01-05 16:31:06 -050044#else
45#include <sys/mman.h>
Nicolas Capens411273e2017-01-26 15:13:36 -080046#if !defined(MAP_ANONYMOUS)
47#define MAP_ANONYMOUS MAP_ANON
Nicolas Capens8b275742017-01-20 17:11:41 -050048#endif
Nicolas Capensbd65da92017-01-05 16:31:06 -050049#endif
Nicolas Capens598f8d82016-09-26 15:09:10 -040050
Nicolas Capensc07dc4b2018-08-06 14:20:45 -040051#include <mutex>
Nicolas Capens598f8d82016-09-26 15:09:10 -040052#include <limits>
53#include <iostream>
54#include <cassert>
55
56namespace
57{
58 Ice::GlobalContext *context = nullptr;
59 Ice::Cfg *function = nullptr;
60 Ice::CfgNode *basicBlock = nullptr;
61 Ice::CfgLocalAllocatorScope *allocator = nullptr;
Nicolas Capens48461502018-08-06 14:20:45 -040062 rr::Routine *routine = nullptr;
Nicolas Capens598f8d82016-09-26 15:09:10 -040063
64 std::mutex codegenMutex;
65
66 Ice::ELFFileStreamer *elfFile = nullptr;
67 Ice::Fdstream *out = nullptr;
68}
69
namespace
{
	// MSVC uses its own architecture macros; map them onto the GCC/Clang
	// spellings that the rest of this file tests for.
	#if !defined(__i386__) && defined(_M_IX86)
		#define __i386__ 1
	#endif

	#if !defined(__x86_64__) && (defined(_M_AMD64) || defined (_M_X64))
		#define __x86_64__ 1
	#endif

	// Host CPU feature detection, evaluated once during static initialization.
	class CPUID
	{
	public:
		const static bool ARM;      // True when compiled for 32-bit or 64-bit ARM.
		const static bool SSE4_1;   // True when the x86 host reports SSE4.1 support.

	private:
		// Executes the CPUID instruction for leaf 'info' and stores EAX, EBX,
		// ECX and EDX into registers[0..3]. On non-x86 builds all four
		// entries are zeroed.
		static void cpuid(int registers[4], int info)
		{
			#if defined(__i386__) || defined(__x86_64__)
				#if defined(_WIN32)
					__cpuid(registers, info);
				#else
					// ECX selects the sub-leaf for some CPUID leaves. Pin it to zero
					// instead of leaving it undefined, so the result is deterministic
					// and matches the MSVC __cpuid intrinsic, which clears ECX.
					__asm volatile("cpuid"
					               : "=a" (registers[0]), "=b" (registers[1]), "=c" (registers[2]), "=d" (registers[3])
					               : "a" (info), "c" (0));
				#endif
			#else
				registers[0] = 0;
				registers[1] = 0;
				registers[2] = 0;
				registers[3] = 0;
			#endif
		}

		// Compile-time architecture check; unknown architectures fail the build.
		static bool detectARM()
		{
			#if defined(__arm__) || defined(__aarch64__)
				return true;
			#elif defined(__i386__) || defined(__x86_64__)
				return false;
			#elif defined(__mips__)
				return false;
			#else
				#error "Unknown architecture"
			#endif
		}

		// Tests bit 19 of ECX from CPUID leaf 1 (the SSE4.1 feature flag).
		// Always false on non-x86 builds.
		static bool detectSSE4_1()
		{
			#if defined(__i386__) || defined(__x86_64__)
				int registers[4];
				cpuid(registers, 1);
				return (registers[2] & 0x00080000) != 0;
			#else
				return false;
			#endif
		}
	};

	const bool CPUID::ARM = CPUID::detectARM();
	const bool CPUID::SSE4_1 = CPUID::detectSSE4_1();
	const bool emulateIntrinsics = false;
	const bool emulateMismatchedBitCast = CPUID::ARM;
}
133
Nicolas Capens48461502018-08-06 14:20:45 -0400134namespace rr
Nicolas Capens598f8d82016-09-26 15:09:10 -0400135{
Nicolas Capens23d99a42016-09-30 14:57:16 -0400136 enum EmulatedType
137 {
138 EmulatedShift = 16,
139 EmulatedV2 = 2 << EmulatedShift,
140 EmulatedV4 = 4 << EmulatedShift,
141 EmulatedV8 = 8 << EmulatedShift,
142 EmulatedBits = EmulatedV2 | EmulatedV4 | EmulatedV8,
143
144 Type_v2i32 = Ice::IceType_v4i32 | EmulatedV2,
145 Type_v4i16 = Ice::IceType_v8i16 | EmulatedV4,
146 Type_v2i16 = Ice::IceType_v8i16 | EmulatedV2,
147 Type_v8i8 = Ice::IceType_v16i8 | EmulatedV8,
148 Type_v4i8 = Ice::IceType_v16i8 | EmulatedV4,
Nicolas Capens4cfd4572016-10-20 01:00:19 -0400149 Type_v2f32 = Ice::IceType_v4f32 | EmulatedV2,
Nicolas Capens23d99a42016-09-30 14:57:16 -0400150 };
151
Nicolas Capens15060bb2016-12-05 22:17:19 -0500152 class Value : public Ice::Operand {};
Nicolas Capensb98fe5c2016-11-09 12:24:06 -0500153 class SwitchCases : public Ice::InstSwitch {};
Nicolas Capens598f8d82016-09-26 15:09:10 -0400154 class BasicBlock : public Ice::CfgNode {};
155
156 Ice::Type T(Type *t)
157 {
Alexis Hetu113e33a2017-01-19 10:49:19 -0500158 static_assert(static_cast<unsigned int>(Ice::IceType_NUM) < static_cast<unsigned int>(EmulatedBits), "Ice::Type overlaps with our emulated types!");
Nicolas Capens23d99a42016-09-30 14:57:16 -0400159 return (Ice::Type)(reinterpret_cast<std::intptr_t>(t) & ~EmulatedBits);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400160 }
161
162 Type *T(Ice::Type t)
163 {
164 return reinterpret_cast<Type*>(t);
165 }
166
Nicolas Capens23d99a42016-09-30 14:57:16 -0400167 Type *T(EmulatedType t)
168 {
169 return reinterpret_cast<Type*>(t);
170 }
171
Nicolas Capens15060bb2016-12-05 22:17:19 -0500172 Value *V(Ice::Operand *v)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400173 {
174 return reinterpret_cast<Value*>(v);
175 }
176
Nicolas Capens611642a2016-09-28 16:45:04 -0400177 BasicBlock *B(Ice::CfgNode *b)
178 {
179 return reinterpret_cast<BasicBlock*>(b);
180 }
181
Nicolas Capens584088c2017-01-26 16:05:18 -0800182 static size_t typeSize(Type *type)
183 {
184 if(reinterpret_cast<std::intptr_t>(type) & EmulatedBits)
185 {
186 switch(reinterpret_cast<std::intptr_t>(type))
187 {
188 case Type_v2i32: return 8;
189 case Type_v4i16: return 8;
190 case Type_v2i16: return 4;
191 case Type_v8i8: return 8;
192 case Type_v4i8: return 4;
193 case Type_v2f32: return 8;
194 default: assert(false);
195 }
196 }
197
198 return Ice::typeWidthInBytes(T(type));
199 }
200
Nicolas Capens598f8d82016-09-26 15:09:10 -0400201 Optimization optimization[10] = {InstructionCombining, Disabled};
202
Nicolas Capens66478362016-10-13 15:36:36 -0400203 using ElfHeader = std::conditional<sizeof(void*) == 8, Elf64_Ehdr, Elf32_Ehdr>::type;
204 using SectionHeader = std::conditional<sizeof(void*) == 8, Elf64_Shdr, Elf32_Shdr>::type;
205
206 inline const SectionHeader *sectionHeader(const ElfHeader *elfHeader)
207 {
208 return reinterpret_cast<const SectionHeader*>((intptr_t)elfHeader + elfHeader->e_shoff);
209 }
Nicolas Capens87852e12016-11-24 14:45:06 -0500210
Nicolas Capens66478362016-10-13 15:36:36 -0400211 inline const SectionHeader *elfSection(const ElfHeader *elfHeader, int index)
212 {
213 return &sectionHeader(elfHeader)[index];
214 }
215
216 static void *relocateSymbol(const ElfHeader *elfHeader, const Elf32_Rel &relocation, const SectionHeader &relocationTable)
217 {
218 const SectionHeader *target = elfSection(elfHeader, relocationTable.sh_info);
Nicolas Capens87852e12016-11-24 14:45:06 -0500219
Nicolas Capens66478362016-10-13 15:36:36 -0400220 uint32_t index = relocation.getSymbol();
221 int table = relocationTable.sh_link;
222 void *symbolValue = nullptr;
Nicolas Capens87852e12016-11-24 14:45:06 -0500223
Nicolas Capens66478362016-10-13 15:36:36 -0400224 if(index != SHN_UNDEF)
225 {
226 if(table == SHN_UNDEF) return nullptr;
227 const SectionHeader *symbolTable = elfSection(elfHeader, table);
Nicolas Capens87852e12016-11-24 14:45:06 -0500228
Nicolas Capens66478362016-10-13 15:36:36 -0400229 uint32_t symtab_entries = symbolTable->sh_size / symbolTable->sh_entsize;
230 if(index >= symtab_entries)
231 {
232 assert(index < symtab_entries && "Symbol Index out of range");
233 return nullptr;
234 }
Nicolas Capens87852e12016-11-24 14:45:06 -0500235
Nicolas Capens66478362016-10-13 15:36:36 -0400236 intptr_t symbolAddress = (intptr_t)elfHeader + symbolTable->sh_offset;
237 Elf32_Sym &symbol = ((Elf32_Sym*)symbolAddress)[index];
238 uint16_t section = symbol.st_shndx;
239
240 if(section != SHN_UNDEF && section < SHN_LORESERVE)
241 {
242 const SectionHeader *target = elfSection(elfHeader, symbol.st_shndx);
243 symbolValue = reinterpret_cast<void*>((intptr_t)elfHeader + symbol.st_value + target->sh_offset);
244 }
245 else
246 {
247 return nullptr;
248 }
249 }
250
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500251 intptr_t address = (intptr_t)elfHeader + target->sh_offset;
252 unaligned_ptr<int32_t> patchSite = (int32_t*)(address + relocation.r_offset);
253
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400254 if(CPUID::ARM)
255 {
256 switch(relocation.getType())
257 {
258 case R_ARM_NONE:
259 // No relocation
260 break;
261 case R_ARM_MOVW_ABS_NC:
262 {
263 uint32_t thumb = 0; // Calls to Thumb code not supported.
264 uint32_t lo = (uint32_t)(intptr_t)symbolValue | thumb;
265 *patchSite = (*patchSite & 0xFFF0F000) | ((lo & 0xF000) << 4) | (lo & 0x0FFF);
266 }
267 break;
268 case R_ARM_MOVT_ABS:
269 {
270 uint32_t hi = (uint32_t)(intptr_t)(symbolValue) >> 16;
271 *patchSite = (*patchSite & 0xFFF0F000) | ((hi & 0xF000) << 4) | (hi & 0x0FFF);
272 }
273 break;
274 default:
275 assert(false && "Unsupported relocation type");
276 return nullptr;
277 }
278 }
279 else
280 {
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400281 switch(relocation.getType())
282 {
283 case R_386_NONE:
284 // No relocation
285 break;
286 case R_386_32:
287 *patchSite = (int32_t)((intptr_t)symbolValue + *patchSite);
288 break;
289 // case R_386_PC32:
290 // *patchSite = (int32_t)((intptr_t)symbolValue + *patchSite - (intptr_t)patchSite);
291 // break;
292 default:
293 assert(false && "Unsupported relocation type");
294 return nullptr;
295 }
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400296 }
297
Nicolas Capens66478362016-10-13 15:36:36 -0400298 return symbolValue;
299 }
300
301 static void *relocateSymbol(const ElfHeader *elfHeader, const Elf64_Rela &relocation, const SectionHeader &relocationTable)
302 {
303 const SectionHeader *target = elfSection(elfHeader, relocationTable.sh_info);
Nicolas Capens87852e12016-11-24 14:45:06 -0500304
Nicolas Capens66478362016-10-13 15:36:36 -0400305 uint32_t index = relocation.getSymbol();
306 int table = relocationTable.sh_link;
307 void *symbolValue = nullptr;
308
309 if(index != SHN_UNDEF)
310 {
311 if(table == SHN_UNDEF) return nullptr;
312 const SectionHeader *symbolTable = elfSection(elfHeader, table);
Nicolas Capens87852e12016-11-24 14:45:06 -0500313
Nicolas Capens66478362016-10-13 15:36:36 -0400314 uint32_t symtab_entries = symbolTable->sh_size / symbolTable->sh_entsize;
315 if(index >= symtab_entries)
316 {
317 assert(index < symtab_entries && "Symbol Index out of range");
318 return nullptr;
319 }
Nicolas Capens87852e12016-11-24 14:45:06 -0500320
Nicolas Capens66478362016-10-13 15:36:36 -0400321 intptr_t symbolAddress = (intptr_t)elfHeader + symbolTable->sh_offset;
322 Elf64_Sym &symbol = ((Elf64_Sym*)symbolAddress)[index];
323 uint16_t section = symbol.st_shndx;
324
325 if(section != SHN_UNDEF && section < SHN_LORESERVE)
326 {
327 const SectionHeader *target = elfSection(elfHeader, symbol.st_shndx);
328 symbolValue = reinterpret_cast<void*>((intptr_t)elfHeader + symbol.st_value + target->sh_offset);
329 }
330 else
331 {
332 return nullptr;
333 }
334 }
335
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500336 intptr_t address = (intptr_t)elfHeader + target->sh_offset;
337 unaligned_ptr<int32_t> patchSite32 = (int32_t*)(address + relocation.r_offset);
338 unaligned_ptr<int64_t> patchSite64 = (int64_t*)(address + relocation.r_offset);
339
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400340 switch(relocation.getType())
341 {
342 case R_X86_64_NONE:
343 // No relocation
344 break;
345 case R_X86_64_64:
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500346 *patchSite64 = (int64_t)((intptr_t)symbolValue + *patchSite64 + relocation.r_addend);
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400347 break;
348 case R_X86_64_PC32:
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500349 *patchSite32 = (int32_t)((intptr_t)symbolValue + *patchSite32 - (intptr_t)patchSite32 + relocation.r_addend);
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400350 break;
351 case R_X86_64_32S:
Nicolas Capens8d2cf752018-11-22 11:13:45 -0500352 *patchSite32 = (int32_t)((intptr_t)symbolValue + *patchSite32 + relocation.r_addend);
Nicolas Capensf110e4d2017-05-03 15:33:49 -0400353 break;
354 default:
355 assert(false && "Unsupported relocation type");
356 return nullptr;
357 }
Nicolas Capens66478362016-10-13 15:36:36 -0400358
359 return symbolValue;
360 }
361
Nicolas Capens1cc44382017-04-25 10:52:16 -0400362 void *loadImage(uint8_t *const elfImage, size_t &codeSize)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400363 {
Nicolas Capens598f8d82016-09-26 15:09:10 -0400364 ElfHeader *elfHeader = (ElfHeader*)elfImage;
365
366 if(!elfHeader->checkMagic())
367 {
368 return nullptr;
369 }
370
Nicolas Capens66478362016-10-13 15:36:36 -0400371 // Expect ELF bitness to match platform
Nicolas Capens65047112016-11-07 13:01:07 -0500372 assert(sizeof(void*) == 8 ? elfHeader->getFileClass() == ELFCLASS64 : elfHeader->getFileClass() == ELFCLASS32);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400373 #if defined(__i386__)
374 assert(sizeof(void*) == 4 && elfHeader->e_machine == EM_386);
375 #elif defined(__x86_64__)
376 assert(sizeof(void*) == 8 && elfHeader->e_machine == EM_X86_64);
377 #elif defined(__arm__)
378 assert(sizeof(void*) == 4 && elfHeader->e_machine == EM_ARM);
Stephen Lanhamfe796492018-09-07 11:59:54 -0700379 #elif defined(__aarch64__)
380 assert(sizeof(void*) == 8 && elfHeader->e_machine == EM_AARCH64);
Gordana Cmiljanovic082dfec2018-10-19 11:36:15 +0200381 #elif defined(__mips__)
382 assert(sizeof(void*) == 4 && elfHeader->e_machine == EM_MIPS);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400383 #else
384 #error "Unsupported platform"
385 #endif
Nicolas Capens66478362016-10-13 15:36:36 -0400386
Nicolas Capens598f8d82016-09-26 15:09:10 -0400387 SectionHeader *sectionHeader = (SectionHeader*)(elfImage + elfHeader->e_shoff);
388 void *entry = nullptr;
389
390 for(int i = 0; i < elfHeader->e_shnum; i++)
391 {
Nicolas Capens66478362016-10-13 15:36:36 -0400392 if(sectionHeader[i].sh_type == SHT_PROGBITS)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400393 {
Nicolas Capens66478362016-10-13 15:36:36 -0400394 if(sectionHeader[i].sh_flags & SHF_EXECINSTR)
395 {
396 entry = elfImage + sectionHeader[i].sh_offset;
Nicolas Capens1cc44382017-04-25 10:52:16 -0400397 codeSize = sectionHeader[i].sh_size;
Nicolas Capens66478362016-10-13 15:36:36 -0400398 }
399 }
400 else if(sectionHeader[i].sh_type == SHT_REL)
401 {
402 assert(sizeof(void*) == 4 && "UNIMPLEMENTED"); // Only expected/implemented for 32-bit code
403
Alexis Hetu113e33a2017-01-19 10:49:19 -0500404 for(Elf32_Word index = 0; index < sectionHeader[i].sh_size / sectionHeader[i].sh_entsize; index++)
Nicolas Capens66478362016-10-13 15:36:36 -0400405 {
406 const Elf32_Rel &relocation = ((const Elf32_Rel*)(elfImage + sectionHeader[i].sh_offset))[index];
Alexis Hetu113e33a2017-01-19 10:49:19 -0500407 relocateSymbol(elfHeader, relocation, sectionHeader[i]);
Nicolas Capens66478362016-10-13 15:36:36 -0400408 }
409 }
410 else if(sectionHeader[i].sh_type == SHT_RELA)
411 {
412 assert(sizeof(void*) == 8 && "UNIMPLEMENTED"); // Only expected/implemented for 64-bit code
413
Alexis Hetu113e33a2017-01-19 10:49:19 -0500414 for(Elf32_Word index = 0; index < sectionHeader[i].sh_size / sectionHeader[i].sh_entsize; index++)
Nicolas Capens66478362016-10-13 15:36:36 -0400415 {
416 const Elf64_Rela &relocation = ((const Elf64_Rela*)(elfImage + sectionHeader[i].sh_offset))[index];
Alexis Hetu113e33a2017-01-19 10:49:19 -0500417 relocateSymbol(elfHeader, relocation, sectionHeader[i]);
Nicolas Capens66478362016-10-13 15:36:36 -0400418 }
Nicolas Capens598f8d82016-09-26 15:09:10 -0400419 }
420 }
421
422 return entry;
423 }
424
425 template<typename T>
426 struct ExecutableAllocator
427 {
428 ExecutableAllocator() {};
429 template<class U> ExecutableAllocator(const ExecutableAllocator<U> &other) {};
430
431 using value_type = T;
432 using size_type = std::size_t;
433
434 T *allocate(size_type n)
435 {
Nicolas Capensc07dc4b2018-08-06 14:20:45 -0400436 return (T*)allocateExecutable(sizeof(T) * n);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400437 }
438
439 void deallocate(T *p, size_type n)
440 {
Nicolas Capensc07dc4b2018-08-06 14:20:45 -0400441 deallocateExecutable(p, sizeof(T) * n);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400442 }
443 };
444
445 class ELFMemoryStreamer : public Ice::ELFStreamer, public Routine
446 {
447 ELFMemoryStreamer(const ELFMemoryStreamer &) = delete;
448 ELFMemoryStreamer &operator=(const ELFMemoryStreamer &) = delete;
449
450 public:
Nicolas Capens58274b52016-10-19 23:45:19 -0400451 ELFMemoryStreamer() : Routine(), entry(nullptr)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400452 {
453 position = 0;
454 buffer.reserve(0x1000);
455 }
456
Nicolas Capens81aa97b2017-06-27 17:08:08 -0400457 ~ELFMemoryStreamer() override
Nicolas Capens598f8d82016-09-26 15:09:10 -0400458 {
Nicolas Capensbd65da92017-01-05 16:31:06 -0500459 #if defined(_WIN32)
460 if(buffer.size() != 0)
461 {
462 DWORD exeProtection;
463 VirtualProtect(&buffer[0], buffer.size(), oldProtection, &exeProtection);
464 }
465 #endif
Nicolas Capens598f8d82016-09-26 15:09:10 -0400466 }
467
468 void write8(uint8_t Value) override
469 {
470 if(position == (uint64_t)buffer.size())
471 {
472 buffer.push_back(Value);
473 position++;
474 }
475 else if(position < (uint64_t)buffer.size())
476 {
477 buffer[position] = Value;
478 position++;
479 }
480 else assert(false && "UNIMPLEMENTED");
481 }
482
483 void writeBytes(llvm::StringRef Bytes) override
484 {
485 std::size_t oldSize = buffer.size();
486 buffer.resize(oldSize + Bytes.size());
487 memcpy(&buffer[oldSize], Bytes.begin(), Bytes.size());
488 position += Bytes.size();
489 }
490
491 uint64_t tell() const override { return position; }
492
493 void seek(uint64_t Off) override { position = Off; }
494
495 const void *getEntry() override
496 {
Nicolas Capens58274b52016-10-19 23:45:19 -0400497 if(!entry)
498 {
Nicolas Capensbd65da92017-01-05 16:31:06 -0500499 position = std::numeric_limits<std::size_t>::max(); // Can't stream more data after this
Nicolas Capens598f8d82016-09-26 15:09:10 -0400500
Nicolas Capens1cc44382017-04-25 10:52:16 -0400501 size_t codeSize = 0;
502 entry = loadImage(&buffer[0], codeSize);
503
504 #if defined(_WIN32)
Nicolas Capense745f5a2017-05-29 10:00:32 -0400505 VirtualProtect(&buffer[0], buffer.size(), PAGE_EXECUTE_READ, &oldProtection);
Nicolas Capens1cc44382017-04-25 10:52:16 -0400506 FlushInstructionCache(GetCurrentProcess(), NULL, 0);
507 #else
Nicolas Capense745f5a2017-05-29 10:00:32 -0400508 mprotect(&buffer[0], buffer.size(), PROT_READ | PROT_EXEC);
Nicolas Capens1cc44382017-04-25 10:52:16 -0400509 __builtin___clear_cache((char*)entry, (char*)entry + codeSize);
510 #endif
Nicolas Capens58274b52016-10-19 23:45:19 -0400511 }
512
513 return entry;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400514 }
515
516 private:
Nicolas Capens58274b52016-10-19 23:45:19 -0400517 void *entry;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400518 std::vector<uint8_t, ExecutableAllocator<uint8_t>> buffer;
519 std::size_t position;
Nicolas Capensbd65da92017-01-05 16:31:06 -0500520
521 #if defined(_WIN32)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400522 DWORD oldProtection;
Nicolas Capensbd65da92017-01-05 16:31:06 -0500523 #endif
Nicolas Capens598f8d82016-09-26 15:09:10 -0400524 };
525
526 Nucleus::Nucleus()
527 {
528 ::codegenMutex.lock(); // Reactor is currently not thread safe
529
Nicolas Capens66478362016-10-13 15:36:36 -0400530 Ice::ClFlags &Flags = Ice::ClFlags::Flags;
531 Ice::ClFlags::getParsedClFlags(Flags);
532
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400533 #if defined(__arm__)
534 Flags.setTargetArch(Ice::Target_ARM32);
535 Flags.setTargetInstructionSet(Ice::ARM32InstructionSet_HWDivArm);
Gordana Cmiljanovic082dfec2018-10-19 11:36:15 +0200536 #elif defined(__mips__)
537 Flags.setTargetArch(Ice::Target_MIPS32);
538 Flags.setTargetInstructionSet(Ice::BaseInstructionSet);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400539 #else // x86
540 Flags.setTargetArch(sizeof(void*) == 8 ? Ice::Target_X8664 : Ice::Target_X8632);
541 Flags.setTargetInstructionSet(CPUID::SSE4_1 ? Ice::X86InstructionSet_SSE4_1 : Ice::X86InstructionSet_SSE2);
542 #endif
Nicolas Capens66478362016-10-13 15:36:36 -0400543 Flags.setOutFileType(Ice::FT_Elf);
544 Flags.setOptLevel(Ice::Opt_2);
545 Flags.setApplicationBinaryInterface(Ice::ABI_Platform);
Nicolas Capens30cd7d42017-04-25 15:17:25 -0400546 Flags.setVerbose(false ? Ice::IceV_Most : Ice::IceV_None);
547 Flags.setDisableHybridAssembly(true);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400548
Nicolas Capens65047112016-11-07 13:01:07 -0500549 static llvm::raw_os_ostream cout(std::cout);
550 static llvm::raw_os_ostream cerr(std::cerr);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400551
552 if(false) // Write out to a file
553 {
554 std::error_code errorCode;
555 ::out = new Ice::Fdstream("out.o", errorCode, llvm::sys::fs::F_None);
556 ::elfFile = new Ice::ELFFileStreamer(*out);
Nicolas Capens65047112016-11-07 13:01:07 -0500557 ::context = new Ice::GlobalContext(&cout, &cout, &cerr, elfFile);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400558 }
559 else
560 {
561 ELFMemoryStreamer *elfMemory = new ELFMemoryStreamer();
Nicolas Capens65047112016-11-07 13:01:07 -0500562 ::context = new Ice::GlobalContext(&cout, &cout, &cerr, elfMemory);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400563 ::routine = elfMemory;
564 }
565 }
566
567 Nucleus::~Nucleus()
568 {
Nicolas Capens619a8c52017-07-05 14:10:46 -0400569 delete ::routine;
570
Nicolas Capens598f8d82016-09-26 15:09:10 -0400571 delete ::allocator;
572 delete ::function;
573 delete ::context;
574
575 delete ::elfFile;
576 delete ::out;
577
578 ::codegenMutex.unlock();
579 }
580
Chris Forbes878d4b02019-01-21 10:48:35 -0800581 Routine *Nucleus::acquireRoutine(const char *name, bool runOptimizations)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400582 {
583 if(basicBlock->getInsts().empty() || basicBlock->getInsts().back().getKind() != Ice::Inst::Ret)
584 {
585 createRetVoid();
586 }
587
Chris Forbes878d4b02019-01-21 10:48:35 -0800588 ::function->setFunctionName(Ice::GlobalString::createWithString(::context, name));
Nicolas Capens598f8d82016-09-26 15:09:10 -0400589
Nicolas Capens2ae9d742016-11-24 14:43:05 -0500590 optimize();
591
Nicolas Capens598f8d82016-09-26 15:09:10 -0400592 ::function->translate();
Nicolas Capensde19f392016-10-19 10:29:49 -0400593 assert(!::function->hasError());
594
Nicolas Capens83a6bb92017-07-05 15:04:00 -0400595 auto globals = ::function->getGlobalInits();
Nicolas Capens66478362016-10-13 15:36:36 -0400596
597 if(globals && !globals->empty())
598 {
Nicolas Capens83a6bb92017-07-05 15:04:00 -0400599 ::context->getGlobals()->merge(globals.get());
Nicolas Capens66478362016-10-13 15:36:36 -0400600 }
Nicolas Capens598f8d82016-09-26 15:09:10 -0400601
602 ::context->emitFileHeader();
603 ::function->emitIAS();
604 auto assembler = ::function->releaseAssembler();
Nicolas Capens66478362016-10-13 15:36:36 -0400605 auto objectWriter = ::context->getObjectWriter();
606 assembler->alignFunction();
607 objectWriter->writeFunctionCode(::function->getFunctionName(), false, assembler.get());
608 ::context->lowerGlobals("last");
Nicolas Capens73dd7a22016-10-20 13:20:34 -0400609 ::context->lowerConstants();
Nicolas Capensb98fe5c2016-11-09 12:24:06 -0500610 ::context->lowerJumpTables();
Nicolas Capens66478362016-10-13 15:36:36 -0400611 objectWriter->setUndefinedSyms(::context->getConstantExternSyms());
612 objectWriter->writeNonUserSections();
Nicolas Capens598f8d82016-09-26 15:09:10 -0400613
Nicolas Capens619a8c52017-07-05 14:10:46 -0400614 Routine *handoffRoutine = ::routine;
615 ::routine = nullptr;
616
617 return handoffRoutine;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400618 }
619
620 void Nucleus::optimize()
621 {
Nicolas Capens48461502018-08-06 14:20:45 -0400622 rr::optimize(::function);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400623 }
624
625 Value *Nucleus::allocateStackVariable(Type *t, int arraySize)
626 {
627 Ice::Type type = T(t);
Nicolas Capensa8f98632016-10-20 11:25:55 -0400628 int typeSize = Ice::typeWidthInBytes(type);
629 int totalSize = typeSize * (arraySize ? arraySize : 1);
Nicolas Capense12780d2016-09-27 14:18:07 -0400630
Nicolas Capensa8f98632016-10-20 11:25:55 -0400631 auto bytes = Ice::ConstantInteger32::create(::context, type, totalSize);
Nicolas Capense12780d2016-09-27 14:18:07 -0400632 auto address = ::function->makeVariable(T(getPointerType(t)));
Nicolas Capensa8f98632016-10-20 11:25:55 -0400633 auto alloca = Ice::InstAlloca::create(::function, address, bytes, typeSize);
Nicolas Capense12780d2016-09-27 14:18:07 -0400634 ::function->getEntryNode()->getInsts().push_front(alloca);
635
636 return V(address);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400637 }
638
639 BasicBlock *Nucleus::createBasicBlock()
640 {
Nicolas Capens611642a2016-09-28 16:45:04 -0400641 return B(::function->makeNode());
Nicolas Capens598f8d82016-09-26 15:09:10 -0400642 }
643
644 BasicBlock *Nucleus::getInsertBlock()
645 {
Nicolas Capens611642a2016-09-28 16:45:04 -0400646 return B(::basicBlock);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400647 }
648
649 void Nucleus::setInsertBlock(BasicBlock *basicBlock)
650 {
Nicolas Capens9ed1a182016-10-24 09:52:23 -0400651 // assert(::basicBlock->getInsts().back().getTerminatorEdges().size() >= 0 && "Previous basic block must have a terminator");
Nicolas Capens0192d152019-03-27 14:46:07 -0400652
653 Variable::materializeAll();
654
Nicolas Capens611642a2016-09-28 16:45:04 -0400655 ::basicBlock = basicBlock;
Nicolas Capens598f8d82016-09-26 15:09:10 -0400656 }
657
Nicolas Capens598f8d82016-09-26 15:09:10 -0400658 void Nucleus::createFunction(Type *ReturnType, std::vector<Type*> &Params)
659 {
660 uint32_t sequenceNumber = 0;
661 ::function = Ice::Cfg::create(::context, sequenceNumber).release();
662 ::allocator = new Ice::CfgLocalAllocatorScope(::function);
663
664 for(Type *type : Params)
665 {
666 Ice::Variable *arg = ::function->makeVariable(T(type));
667 ::function->addArg(arg);
668 }
669
670 Ice::CfgNode *node = ::function->makeNode();
671 ::function->setEntryNode(node);
672 ::basicBlock = node;
673 }
674
675 Value *Nucleus::getArgument(unsigned int index)
676 {
677 return V(::function->getArgs()[index]);
678 }
679
680 void Nucleus::createRetVoid()
681 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400682 // Code generated after this point is unreachable, so any variables
683 // being read can safely return an undefined value. We have to avoid
684 // materializing variables after the terminator ret instruction.
685 Variable::killUnmaterialized();
686
Nicolas Capensfdcca2d2016-10-20 11:31:36 -0400687 Ice::InstRet *ret = Ice::InstRet::create(::function);
688 ::basicBlock->appendInst(ret);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400689 }
690
691 void Nucleus::createRet(Value *v)
692 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400693 // Code generated after this point is unreachable, so any variables
694 // being read can safely return an undefined value. We have to avoid
695 // materializing variables after the terminator ret instruction.
696 Variable::killUnmaterialized();
697
Nicolas Capensfdcca2d2016-10-20 11:31:36 -0400698 Ice::InstRet *ret = Ice::InstRet::create(::function, v);
699 ::basicBlock->appendInst(ret);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400700 }
701
702 void Nucleus::createBr(BasicBlock *dest)
703 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400704 Variable::materializeAll();
705
Nicolas Capens611642a2016-09-28 16:45:04 -0400706 auto br = Ice::InstBr::create(::function, dest);
707 ::basicBlock->appendInst(br);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400708 }
709
710 void Nucleus::createCondBr(Value *cond, BasicBlock *ifTrue, BasicBlock *ifFalse)
711 {
Nicolas Capens0192d152019-03-27 14:46:07 -0400712 Variable::materializeAll();
713
Nicolas Capens611642a2016-09-28 16:45:04 -0400714 auto br = Ice::InstBr::create(::function, cond, ifTrue, ifFalse);
715 ::basicBlock->appendInst(br);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400716 }
717
Nicolas Capensf8360ba2017-01-25 11:35:00 -0800718 static bool isCommutative(Ice::InstArithmetic::OpKind op)
719 {
720 switch(op)
721 {
722 case Ice::InstArithmetic::Add:
723 case Ice::InstArithmetic::Fadd:
724 case Ice::InstArithmetic::Mul:
725 case Ice::InstArithmetic::Fmul:
726 case Ice::InstArithmetic::And:
727 case Ice::InstArithmetic::Or:
728 case Ice::InstArithmetic::Xor:
729 return true;
730 default:
731 return false;
732 }
733 }
734
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400735 static Value *createArithmetic(Ice::InstArithmetic::OpKind op, Value *lhs, Value *rhs)
736 {
Nicolas Capensb64e0ce2018-01-26 01:24:57 +0000737 assert(lhs->getType() == rhs->getType() || llvm::isa<Ice::Constant>(rhs));
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400738
Nicolas Capensf8360ba2017-01-25 11:35:00 -0800739 bool swapOperands = llvm::isa<Ice::Constant>(lhs) && isCommutative(op);
740
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400741 Ice::Variable *result = ::function->makeVariable(lhs->getType());
Nicolas Capensf8360ba2017-01-25 11:35:00 -0800742 Ice::InstArithmetic *arithmetic = Ice::InstArithmetic::create(::function, op, result, swapOperands ? rhs : lhs, swapOperands ? lhs : rhs);
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400743 ::basicBlock->appendInst(arithmetic);
744
745 return V(result);
746 }
747
Nicolas Capens598f8d82016-09-26 15:09:10 -0400748 Value *Nucleus::createAdd(Value *lhs, Value *rhs)
749 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400750 return createArithmetic(Ice::InstArithmetic::Add, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400751 }
752
753 Value *Nucleus::createSub(Value *lhs, Value *rhs)
754 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400755 return createArithmetic(Ice::InstArithmetic::Sub, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400756 }
757
758 Value *Nucleus::createMul(Value *lhs, Value *rhs)
759 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400760 return createArithmetic(Ice::InstArithmetic::Mul, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400761 }
762
763 Value *Nucleus::createUDiv(Value *lhs, Value *rhs)
764 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400765 return createArithmetic(Ice::InstArithmetic::Udiv, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400766 }
767
768 Value *Nucleus::createSDiv(Value *lhs, Value *rhs)
769 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400770 return createArithmetic(Ice::InstArithmetic::Sdiv, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400771 }
772
773 Value *Nucleus::createFAdd(Value *lhs, Value *rhs)
774 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400775 return createArithmetic(Ice::InstArithmetic::Fadd, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400776 }
777
778 Value *Nucleus::createFSub(Value *lhs, Value *rhs)
779 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400780 return createArithmetic(Ice::InstArithmetic::Fsub, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400781 }
782
783 Value *Nucleus::createFMul(Value *lhs, Value *rhs)
784 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400785 return createArithmetic(Ice::InstArithmetic::Fmul, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400786 }
787
788 Value *Nucleus::createFDiv(Value *lhs, Value *rhs)
789 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400790 return createArithmetic(Ice::InstArithmetic::Fdiv, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400791 }
792
793 Value *Nucleus::createURem(Value *lhs, Value *rhs)
794 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400795 return createArithmetic(Ice::InstArithmetic::Urem, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400796 }
797
798 Value *Nucleus::createSRem(Value *lhs, Value *rhs)
799 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400800 return createArithmetic(Ice::InstArithmetic::Srem, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400801 }
802
803 Value *Nucleus::createFRem(Value *lhs, Value *rhs)
804 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400805 return createArithmetic(Ice::InstArithmetic::Frem, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400806 }
807
808 Value *Nucleus::createShl(Value *lhs, Value *rhs)
809 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400810 return createArithmetic(Ice::InstArithmetic::Shl, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400811 }
812
813 Value *Nucleus::createLShr(Value *lhs, Value *rhs)
814 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400815 return createArithmetic(Ice::InstArithmetic::Lshr, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400816 }
817
818 Value *Nucleus::createAShr(Value *lhs, Value *rhs)
819 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400820 return createArithmetic(Ice::InstArithmetic::Ashr, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400821 }
822
823 Value *Nucleus::createAnd(Value *lhs, Value *rhs)
824 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400825 return createArithmetic(Ice::InstArithmetic::And, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400826 }
827
828 Value *Nucleus::createOr(Value *lhs, Value *rhs)
829 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400830 return createArithmetic(Ice::InstArithmetic::Or, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400831 }
832
833 Value *Nucleus::createXor(Value *lhs, Value *rhs)
834 {
Nicolas Capens7d9f76d2016-09-29 13:39:44 -0400835 return createArithmetic(Ice::InstArithmetic::Xor, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400836 }
837
838 Value *Nucleus::createNeg(Value *v)
839 {
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500840 return createSub(createNullValue(T(v->getType())), v);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400841 }
842
843 Value *Nucleus::createFNeg(Value *v)
844 {
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500845 double c[4] = {-0.0, -0.0, -0.0, -0.0};
846 Value *negativeZero = Ice::isVectorType(v->getType()) ?
847 createConstantVector(c, T(v->getType())) :
Nicolas Capens15060bb2016-12-05 22:17:19 -0500848 V(::context->getConstantFloat(-0.0f));
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500849
850 return createFSub(negativeZero, v);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400851 }
852
853 Value *Nucleus::createNot(Value *v)
854 {
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500855 if(Ice::isScalarIntegerType(v->getType()))
856 {
Nicolas Capens15060bb2016-12-05 22:17:19 -0500857 return createXor(v, V(::context->getConstantInt(v->getType(), -1)));
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500858 }
859 else // Vector
860 {
Nicolas Capensf34d1ac2017-05-08 17:06:11 -0400861 int64_t c[16] = {-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1};
Nicolas Capensc5c0c332016-11-08 11:37:01 -0500862 return createXor(v, createConstantVector(c, T(v->getType())));
863 }
Nicolas Capens598f8d82016-09-26 15:09:10 -0400864 }
865
Nicolas Capens86509d92019-03-21 13:23:50 -0400866 Value *Nucleus::createLoad(Value *ptr, Type *type, bool isVolatile, unsigned int align, bool atomic, std::memory_order memoryOrder)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400867 {
Nicolas Capens86509d92019-03-21 13:23:50 -0400868 assert(!atomic); // Unimplemented
869 assert(memoryOrder == std::memory_order_relaxed); // Unimplemented
870
Nicolas Capens23d99a42016-09-30 14:57:16 -0400871 int valueType = (int)reinterpret_cast<intptr_t>(type);
872 Ice::Variable *result = ::function->makeVariable(T(type));
873
Nicolas Capensf4c4eca2017-10-03 14:26:07 -0400874 if((valueType & EmulatedBits) && (align != 0)) // Narrow vector not stored on stack.
Nicolas Capens23d99a42016-09-30 14:57:16 -0400875 {
Nicolas Capens070d9f42017-04-26 13:36:33 -0400876 if(emulateIntrinsics)
877 {
878 if(typeSize(type) == 4)
879 {
880 auto pointer = RValue<Pointer<Byte>>(ptr);
Nicolas Capens1894cfa2017-07-27 14:21:46 -0400881 Int x = *Pointer<Int>(pointer);
Nicolas Capens070d9f42017-04-26 13:36:33 -0400882
883 Int4 vector;
884 vector = Insert(vector, x, 0);
885
886 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, result, vector.loadValue());
887 ::basicBlock->appendInst(bitcast);
888 }
889 else if(typeSize(type) == 8)
890 {
891 auto pointer = RValue<Pointer<Byte>>(ptr);
Nicolas Capens1894cfa2017-07-27 14:21:46 -0400892 Int x = *Pointer<Int>(pointer);
Nicolas Capens070d9f42017-04-26 13:36:33 -0400893 Int y = *Pointer<Int>(pointer + 4);
894
895 Int4 vector;
896 vector = Insert(vector, x, 0);
897 vector = Insert(vector, y, 1);
898
899 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, result, vector.loadValue());
900 ::basicBlock->appendInst(bitcast);
901 }
902 else assert(false);
903 }
904 else
905 {
906 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::LoadSubVector, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
907 auto target = ::context->getConstantUndef(Ice::IceType_i32);
908 auto load = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
909 load->addArg(ptr);
910 load->addArg(::context->getConstantInt32(typeSize(type)));
911 ::basicBlock->appendInst(load);
912 }
Nicolas Capens23d99a42016-09-30 14:57:16 -0400913 }
914 else
915 {
916 auto load = Ice::InstLoad::create(::function, result, ptr, align);
917 ::basicBlock->appendInst(load);
918 }
919
920 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -0400921 }
922
Nicolas Capens86509d92019-03-21 13:23:50 -0400923 Value *Nucleus::createStore(Value *value, Value *ptr, Type *type, bool isVolatile, unsigned int align, bool atomic, std::memory_order memoryOrder)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400924 {
Nicolas Capens86509d92019-03-21 13:23:50 -0400925 assert(!atomic); // Unimplemented
926 assert(memoryOrder == std::memory_order_relaxed); // Unimplemented
927
Nicolas Capens6a990f82018-07-06 15:54:07 -0400928 #if __has_feature(memory_sanitizer)
929 // Mark all (non-stack) memory writes as initialized by calling __msan_unpoison
930 if(align != 0)
931 {
932 auto call = Ice::InstCall::create(::function, 2, nullptr, ::context->getConstantInt64(reinterpret_cast<intptr_t>(__msan_unpoison)), false);
933 call->addArg(ptr);
934 call->addArg(::context->getConstantInt64(typeSize(type)));
935 ::basicBlock->appendInst(call);
936 }
937 #endif
938
Nicolas Capens23d99a42016-09-30 14:57:16 -0400939 int valueType = (int)reinterpret_cast<intptr_t>(type);
940
Nicolas Capensf4c4eca2017-10-03 14:26:07 -0400941 if((valueType & EmulatedBits) && (align != 0)) // Narrow vector not stored on stack.
Nicolas Capens23d99a42016-09-30 14:57:16 -0400942 {
Nicolas Capens070d9f42017-04-26 13:36:33 -0400943 if(emulateIntrinsics)
944 {
945 if(typeSize(type) == 4)
946 {
947 Ice::Variable *vector = ::function->makeVariable(Ice::IceType_v4i32);
948 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, vector, value);
949 ::basicBlock->appendInst(bitcast);
950
951 RValue<Int4> v(V(vector));
952
953 auto pointer = RValue<Pointer<Byte>>(ptr);
954 Int x = Extract(v, 0);
955 *Pointer<Int>(pointer) = x;
956 }
957 else if(typeSize(type) == 8)
958 {
959 Ice::Variable *vector = ::function->makeVariable(Ice::IceType_v4i32);
960 auto bitcast = Ice::InstCast::create(::function, Ice::InstCast::Bitcast, vector, value);
961 ::basicBlock->appendInst(bitcast);
962
963 RValue<Int4> v(V(vector));
964
965 auto pointer = RValue<Pointer<Byte>>(ptr);
966 Int x = Extract(v, 0);
967 *Pointer<Int>(pointer) = x;
968 Int y = Extract(v, 1);
969 *Pointer<Int>(pointer + 4) = y;
970 }
971 else assert(false);
972 }
973 else
974 {
975 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::StoreSubVector, Ice::Intrinsics::SideEffects_T, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_T};
976 auto target = ::context->getConstantUndef(Ice::IceType_i32);
977 auto store = Ice::InstIntrinsicCall::create(::function, 3, nullptr, target, intrinsic);
978 store->addArg(value);
979 store->addArg(ptr);
980 store->addArg(::context->getConstantInt32(typeSize(type)));
981 ::basicBlock->appendInst(store);
982 }
Nicolas Capens23d99a42016-09-30 14:57:16 -0400983 }
984 else
985 {
Nicolas Capensf4c4eca2017-10-03 14:26:07 -0400986 assert(value->getType() == T(type));
Nicolas Capens23d99a42016-09-30 14:57:16 -0400987
988 auto store = Ice::InstStore::create(::function, value, ptr, align);
989 ::basicBlock->appendInst(store);
990 }
991
Nicolas Capens598f8d82016-09-26 15:09:10 -0400992 return value;
993 }
994
Nicolas Capensd294def2017-01-26 17:44:37 -0800995 Value *Nucleus::createGEP(Value *ptr, Type *type, Value *index, bool unsignedIndex)
Nicolas Capens598f8d82016-09-26 15:09:10 -0400996 {
Nicolas Capens8820f642016-09-30 04:42:43 -0400997 assert(index->getType() == Ice::IceType_i32);
998
Nicolas Capens15060bb2016-12-05 22:17:19 -0500999 if(auto *constant = llvm::dyn_cast<Ice::ConstantInteger32>(index))
1000 {
Nicolas Capens584088c2017-01-26 16:05:18 -08001001 int32_t offset = constant->getValue() * (int)typeSize(type);
Nicolas Capens15060bb2016-12-05 22:17:19 -05001002
1003 if(offset == 0)
1004 {
1005 return ptr;
1006 }
1007
1008 return createAdd(ptr, createConstantInt(offset));
1009 }
1010
Nicolas Capens8820f642016-09-30 04:42:43 -04001011 if(!Ice::isByteSizedType(T(type)))
1012 {
Nicolas Capens584088c2017-01-26 16:05:18 -08001013 index = createMul(index, createConstantInt((int)typeSize(type)));
Nicolas Capens8820f642016-09-30 04:42:43 -04001014 }
1015
1016 if(sizeof(void*) == 8)
1017 {
Nicolas Capensd294def2017-01-26 17:44:37 -08001018 if(unsignedIndex)
1019 {
1020 index = createZExt(index, T(Ice::IceType_i64));
1021 }
1022 else
1023 {
1024 index = createSExt(index, T(Ice::IceType_i64));
1025 }
Nicolas Capens8820f642016-09-30 04:42:43 -04001026 }
1027
1028 return createAdd(ptr, index);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001029 }
1030
1031 Value *Nucleus::createAtomicAdd(Value *ptr, Value *value)
1032 {
1033 assert(false && "UNIMPLEMENTED"); return nullptr;
1034 }
1035
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001036 static Value *createCast(Ice::InstCast::OpKind op, Value *v, Type *destType)
1037 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001038 if(v->getType() == T(destType))
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001039 {
1040 return v;
1041 }
1042
1043 Ice::Variable *result = ::function->makeVariable(T(destType));
1044 Ice::InstCast *cast = Ice::InstCast::create(::function, op, result, v);
1045 ::basicBlock->appendInst(cast);
1046
1047 return V(result);
1048 }
1049
Nicolas Capens598f8d82016-09-26 15:09:10 -04001050 Value *Nucleus::createTrunc(Value *v, Type *destType)
1051 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001052 return createCast(Ice::InstCast::Trunc, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001053 }
1054
1055 Value *Nucleus::createZExt(Value *v, Type *destType)
1056 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001057 return createCast(Ice::InstCast::Zext, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001058 }
1059
1060 Value *Nucleus::createSExt(Value *v, Type *destType)
1061 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001062 return createCast(Ice::InstCast::Sext, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001063 }
1064
1065 Value *Nucleus::createFPToSI(Value *v, Type *destType)
1066 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001067 return createCast(Ice::InstCast::Fptosi, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001068 }
1069
Nicolas Capens598f8d82016-09-26 15:09:10 -04001070 Value *Nucleus::createSIToFP(Value *v, Type *destType)
1071 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001072 return createCast(Ice::InstCast::Sitofp, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001073 }
1074
1075 Value *Nucleus::createFPTrunc(Value *v, Type *destType)
1076 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001077 return createCast(Ice::InstCast::Fptrunc, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001078 }
1079
1080 Value *Nucleus::createFPExt(Value *v, Type *destType)
1081 {
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001082 return createCast(Ice::InstCast::Fpext, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001083 }
1084
1085 Value *Nucleus::createBitCast(Value *v, Type *destType)
1086 {
Nicolas Capens2d8c3702017-07-25 13:56:46 -04001087 // Bitcasts must be between types of the same logical size. But with emulated narrow vectors we need
1088 // support for casting between scalars and wide vectors. For platforms where this is not supported,
1089 // emulate them by writing to the stack and reading back as the destination type.
1090 if(emulateMismatchedBitCast)
1091 {
1092 if(!Ice::isVectorType(v->getType()) && Ice::isVectorType(T(destType)))
1093 {
1094 Value *address = allocateStackVariable(destType);
1095 createStore(v, address, T(v->getType()));
1096 return createLoad(address, destType);
1097 }
1098 else if(Ice::isVectorType(v->getType()) && !Ice::isVectorType(T(destType)))
1099 {
1100 Value *address = allocateStackVariable(T(v->getType()));
1101 createStore(v, address, T(v->getType()));
1102 return createLoad(address, destType);
1103 }
1104 }
1105
Nicolas Capensa0c2fc52016-09-30 05:04:21 -04001106 return createCast(Ice::InstCast::Bitcast, v, destType);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001107 }
1108
Nicolas Capens43dc6292016-10-20 00:01:38 -04001109 static Value *createIntCompare(Ice::InstIcmp::ICond condition, Value *lhs, Value *rhs)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001110 {
Nicolas Capens611642a2016-09-28 16:45:04 -04001111 assert(lhs->getType() == rhs->getType());
1112
Nicolas Capens43dc6292016-10-20 00:01:38 -04001113 auto result = ::function->makeVariable(Ice::isScalarIntegerType(lhs->getType()) ? Ice::IceType_i1 : lhs->getType());
1114 auto cmp = Ice::InstIcmp::create(::function, condition, result, lhs, rhs);
Nicolas Capens611642a2016-09-28 16:45:04 -04001115 ::basicBlock->appendInst(cmp);
1116
1117 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001118 }
1119
Nicolas Capens43dc6292016-10-20 00:01:38 -04001120 Value *Nucleus::createICmpEQ(Value *lhs, Value *rhs)
1121 {
1122 return createIntCompare(Ice::InstIcmp::Eq, lhs, rhs);
1123 }
1124
1125 Value *Nucleus::createICmpNE(Value *lhs, Value *rhs)
1126 {
1127 return createIntCompare(Ice::InstIcmp::Ne, lhs, rhs);
1128 }
1129
1130 Value *Nucleus::createICmpUGT(Value *lhs, Value *rhs)
1131 {
1132 return createIntCompare(Ice::InstIcmp::Ugt, lhs, rhs);
1133 }
1134
1135 Value *Nucleus::createICmpUGE(Value *lhs, Value *rhs)
1136 {
1137 return createIntCompare(Ice::InstIcmp::Uge, lhs, rhs);
1138 }
1139
1140 Value *Nucleus::createICmpULT(Value *lhs, Value *rhs)
1141 {
1142 return createIntCompare(Ice::InstIcmp::Ult, lhs, rhs);
1143 }
1144
1145 Value *Nucleus::createICmpULE(Value *lhs, Value *rhs)
1146 {
1147 return createIntCompare(Ice::InstIcmp::Ule, lhs, rhs);
1148 }
1149
1150 Value *Nucleus::createICmpSGT(Value *lhs, Value *rhs)
1151 {
1152 return createIntCompare(Ice::InstIcmp::Sgt, lhs, rhs);
1153 }
1154
1155 Value *Nucleus::createICmpSGE(Value *lhs, Value *rhs)
1156 {
1157 return createIntCompare(Ice::InstIcmp::Sge, lhs, rhs);
1158 }
1159
1160 Value *Nucleus::createICmpSLT(Value *lhs, Value *rhs)
1161 {
1162 return createIntCompare(Ice::InstIcmp::Slt, lhs, rhs);
1163 }
1164
Nicolas Capens598f8d82016-09-26 15:09:10 -04001165 Value *Nucleus::createICmpSLE(Value *lhs, Value *rhs)
1166 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001167 return createIntCompare(Ice::InstIcmp::Sle, lhs, rhs);
1168 }
1169
1170 static Value *createFloatCompare(Ice::InstFcmp::FCond condition, Value *lhs, Value *rhs)
1171 {
1172 assert(lhs->getType() == rhs->getType());
1173 assert(Ice::isScalarFloatingType(lhs->getType()) || lhs->getType() == Ice::IceType_v4f32);
1174
1175 auto result = ::function->makeVariable(Ice::isScalarFloatingType(lhs->getType()) ? Ice::IceType_i1 : Ice::IceType_v4i32);
1176 auto cmp = Ice::InstFcmp::create(::function, condition, result, lhs, rhs);
1177 ::basicBlock->appendInst(cmp);
1178
1179 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001180 }
1181
1182 Value *Nucleus::createFCmpOEQ(Value *lhs, Value *rhs)
1183 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001184 return createFloatCompare(Ice::InstFcmp::Oeq, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001185 }
1186
1187 Value *Nucleus::createFCmpOGT(Value *lhs, Value *rhs)
1188 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001189 return createFloatCompare(Ice::InstFcmp::Ogt, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001190 }
1191
1192 Value *Nucleus::createFCmpOGE(Value *lhs, Value *rhs)
1193 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001194 return createFloatCompare(Ice::InstFcmp::Oge, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001195 }
1196
1197 Value *Nucleus::createFCmpOLT(Value *lhs, Value *rhs)
1198 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001199 return createFloatCompare(Ice::InstFcmp::Olt, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001200 }
1201
1202 Value *Nucleus::createFCmpOLE(Value *lhs, Value *rhs)
1203 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001204 return createFloatCompare(Ice::InstFcmp::Ole, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001205 }
1206
1207 Value *Nucleus::createFCmpONE(Value *lhs, Value *rhs)
1208 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001209 return createFloatCompare(Ice::InstFcmp::One, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001210 }
1211
1212 Value *Nucleus::createFCmpORD(Value *lhs, Value *rhs)
1213 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001214 return createFloatCompare(Ice::InstFcmp::Ord, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001215 }
1216
1217 Value *Nucleus::createFCmpUNO(Value *lhs, Value *rhs)
1218 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001219 return createFloatCompare(Ice::InstFcmp::Uno, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001220 }
1221
1222 Value *Nucleus::createFCmpUEQ(Value *lhs, Value *rhs)
1223 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001224 return createFloatCompare(Ice::InstFcmp::Ueq, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001225 }
1226
1227 Value *Nucleus::createFCmpUGT(Value *lhs, Value *rhs)
1228 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001229 return createFloatCompare(Ice::InstFcmp::Ugt, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001230 }
1231
1232 Value *Nucleus::createFCmpUGE(Value *lhs, Value *rhs)
1233 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001234 return createFloatCompare(Ice::InstFcmp::Uge, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001235 }
1236
1237 Value *Nucleus::createFCmpULT(Value *lhs, Value *rhs)
1238 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001239 return createFloatCompare(Ice::InstFcmp::Ult, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001240 }
1241
1242 Value *Nucleus::createFCmpULE(Value *lhs, Value *rhs)
1243 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001244 return createFloatCompare(Ice::InstFcmp::Ule, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001245 }
1246
1247 Value *Nucleus::createFCmpUNE(Value *lhs, Value *rhs)
1248 {
Nicolas Capens43dc6292016-10-20 00:01:38 -04001249 return createFloatCompare(Ice::InstFcmp::Une, lhs, rhs);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001250 }
1251
Nicolas Capense95d5342016-09-30 11:37:28 -04001252 Value *Nucleus::createExtractElement(Value *vector, Type *type, int index)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001253 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04001254 auto result = ::function->makeVariable(T(type));
1255 auto extract = Ice::InstExtractElement::create(::function, result, vector, ::context->getConstantInt32(index));
1256 ::basicBlock->appendInst(extract);
1257
1258 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001259 }
1260
1261 Value *Nucleus::createInsertElement(Value *vector, Value *element, int index)
1262 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04001263 auto result = ::function->makeVariable(vector->getType());
1264 auto insert = Ice::InstInsertElement::create(::function, result, vector, element, ::context->getConstantInt32(index));
1265 ::basicBlock->appendInst(insert);
1266
1267 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001268 }
1269
Nicolas Capense89cd582016-09-30 14:23:47 -04001270 Value *Nucleus::createShuffleVector(Value *V1, Value *V2, const int *select)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001271 {
Nicolas Capens619c0ab2016-09-30 14:46:24 -04001272 assert(V1->getType() == V2->getType());
1273
1274 int size = Ice::typeNumElements(V1->getType());
1275 auto result = ::function->makeVariable(V1->getType());
1276 auto shuffle = Ice::InstShuffleVector::create(::function, result, V1, V2);
1277
1278 for(int i = 0; i < size; i++)
1279 {
1280 shuffle->addIndex(llvm::cast<Ice::ConstantInteger32>(::context->getConstantInt32(select[i])));
1281 }
1282
1283 ::basicBlock->appendInst(shuffle);
1284
1285 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001286 }
1287
1288 Value *Nucleus::createSelect(Value *C, Value *ifTrue, Value *ifFalse)
1289 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04001290 assert(ifTrue->getType() == ifFalse->getType());
1291
1292 auto result = ::function->makeVariable(ifTrue->getType());
1293 auto *select = Ice::InstSelect::create(::function, result, C, ifTrue, ifFalse);
1294 ::basicBlock->appendInst(select);
1295
1296 return V(result);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001297 }
1298
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001299 SwitchCases *Nucleus::createSwitch(Value *control, BasicBlock *defaultBranch, unsigned numCases)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001300 {
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001301 auto switchInst = Ice::InstSwitch::create(::function, numCases, control, defaultBranch);
1302 ::basicBlock->appendInst(switchInst);
1303
1304 return reinterpret_cast<SwitchCases*>(switchInst);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001305 }
1306
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001307 void Nucleus::addSwitchCase(SwitchCases *switchCases, int label, BasicBlock *branch)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001308 {
Nicolas Capensb98fe5c2016-11-09 12:24:06 -05001309 switchCases->addBranch(label, label, branch);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001310 }
1311
1312 void Nucleus::createUnreachable()
1313 {
Nicolas Capensfdcca2d2016-10-20 11:31:36 -04001314 Ice::InstUnreachable *unreachable = Ice::InstUnreachable::create(::function);
1315 ::basicBlock->appendInst(unreachable);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001316 }
1317
Nicolas Capens598f8d82016-09-26 15:09:10 -04001318 Type *Nucleus::getPointerType(Type *ElementType)
1319 {
Nicolas Capense12780d2016-09-27 14:18:07 -04001320 if(sizeof(void*) == 8)
1321 {
1322 return T(Ice::IceType_i64);
1323 }
1324 else
1325 {
1326 return T(Ice::IceType_i32);
1327 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001328 }
1329
Nicolas Capens13ac2322016-10-13 14:52:12 -04001330 Value *Nucleus::createNullValue(Type *Ty)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001331 {
Nicolas Capens73dd7a22016-10-20 13:20:34 -04001332 if(Ice::isVectorType(T(Ty)))
1333 {
Nicolas Capens30385f02017-04-18 13:03:47 -04001334 assert(Ice::typeNumElements(T(Ty)) <= 16);
1335 int64_t c[16] = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
Nicolas Capens73dd7a22016-10-20 13:20:34 -04001336 return createConstantVector(c, Ty);
1337 }
1338 else
1339 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001340 return V(::context->getConstantZero(T(Ty)));
Nicolas Capens73dd7a22016-10-20 13:20:34 -04001341 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001342 }
1343
Nicolas Capens13ac2322016-10-13 14:52:12 -04001344 Value *Nucleus::createConstantLong(int64_t i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001345 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001346 return V(::context->getConstantInt64(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001347 }
1348
Nicolas Capens13ac2322016-10-13 14:52:12 -04001349 Value *Nucleus::createConstantInt(int i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001350 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001351 return V(::context->getConstantInt32(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001352 }
1353
Nicolas Capens13ac2322016-10-13 14:52:12 -04001354 Value *Nucleus::createConstantInt(unsigned int i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001355 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001356 return V(::context->getConstantInt32(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001357 }
1358
Nicolas Capens13ac2322016-10-13 14:52:12 -04001359 Value *Nucleus::createConstantBool(bool b)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001360 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001361 return V(::context->getConstantInt1(b));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001362 }
1363
Nicolas Capens13ac2322016-10-13 14:52:12 -04001364 Value *Nucleus::createConstantByte(signed char i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001365 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001366 return V(::context->getConstantInt8(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001367 }
1368
Nicolas Capens13ac2322016-10-13 14:52:12 -04001369 Value *Nucleus::createConstantByte(unsigned char i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001370 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001371 return V(::context->getConstantInt8(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001372 }
1373
Nicolas Capens13ac2322016-10-13 14:52:12 -04001374 Value *Nucleus::createConstantShort(short i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001375 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001376 return V(::context->getConstantInt16(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001377 }
1378
Nicolas Capens13ac2322016-10-13 14:52:12 -04001379 Value *Nucleus::createConstantShort(unsigned short i)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001380 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001381 return V(::context->getConstantInt16(i));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001382 }
1383
Nicolas Capens13ac2322016-10-13 14:52:12 -04001384 Value *Nucleus::createConstantFloat(float x)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001385 {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001386 return V(::context->getConstantFloat(x));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001387 }
1388
Nicolas Capens13ac2322016-10-13 14:52:12 -04001389 Value *Nucleus::createNullPointer(Type *Ty)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001390 {
Nicolas Capensa29d6532016-12-05 21:38:09 -05001391 return createNullValue(T(sizeof(void*) == 8 ? Ice::IceType_i64 : Ice::IceType_i32));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001392 }
1393
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001394 Value *Nucleus::createConstantVector(const int64_t *constants, Type *type)
Nicolas Capens13ac2322016-10-13 14:52:12 -04001395 {
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001396 const int vectorSize = 16;
1397 assert(Ice::typeWidthInBytes(T(type)) == vectorSize);
1398 const int alignment = vectorSize;
1399 auto globalPool = ::function->getGlobalPool();
1400
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001401 const int64_t *i = constants;
1402 const double *f = reinterpret_cast<const double*>(constants);
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001403 Ice::VariableDeclaration::DataInitializer *dataInitializer = nullptr;
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001404
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001405 switch((int)reinterpret_cast<intptr_t>(type))
1406 {
1407 case Ice::IceType_v4i32:
Nicolas Capensa4c30b02016-11-08 15:43:17 -05001408 case Ice::IceType_v4i1:
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001409 {
1410 const int initializer[4] = {(int)i[0], (int)i[1], (int)i[2], (int)i[3]};
1411 static_assert(sizeof(initializer) == vectorSize, "!");
1412 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1413 }
1414 break;
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001415 case Ice::IceType_v4f32:
1416 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001417 const float initializer[4] = {(float)f[0], (float)f[1], (float)f[2], (float)f[3]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001418 static_assert(sizeof(initializer) == vectorSize, "!");
1419 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1420 }
1421 break;
1422 case Ice::IceType_v8i16:
Nicolas Capensa4c30b02016-11-08 15:43:17 -05001423 case Ice::IceType_v8i1:
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001424 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001425 const short initializer[8] = {(short)i[0], (short)i[1], (short)i[2], (short)i[3], (short)i[4], (short)i[5], (short)i[6], (short)i[7]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001426 static_assert(sizeof(initializer) == vectorSize, "!");
1427 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1428 }
1429 break;
1430 case Ice::IceType_v16i8:
Nicolas Capensa4c30b02016-11-08 15:43:17 -05001431 case Ice::IceType_v16i1:
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001432 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001433 const char initializer[16] = {(char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[4], (char)i[5], (char)i[6], (char)i[7], (char)i[8], (char)i[9], (char)i[10], (char)i[11], (char)i[12], (char)i[13], (char)i[14], (char)i[15]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001434 static_assert(sizeof(initializer) == vectorSize, "!");
1435 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1436 }
1437 break;
1438 case Type_v2i32:
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001439 {
1440 const int initializer[4] = {(int)i[0], (int)i[1], (int)i[0], (int)i[1]};
1441 static_assert(sizeof(initializer) == vectorSize, "!");
1442 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1443 }
1444 break;
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001445 case Type_v2f32:
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001446 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001447 const float initializer[4] = {(float)f[0], (float)f[1], (float)f[0], (float)f[1]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001448 static_assert(sizeof(initializer) == vectorSize, "!");
1449 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1450 }
1451 break;
1452 case Type_v4i16:
1453 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001454 const short initializer[8] = {(short)i[0], (short)i[1], (short)i[2], (short)i[3], (short)i[0], (short)i[1], (short)i[2], (short)i[3]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001455 static_assert(sizeof(initializer) == vectorSize, "!");
1456 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1457 }
1458 break;
1459 case Type_v8i8:
1460 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001461 const char initializer[16] = {(char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[4], (char)i[5], (char)i[6], (char)i[7], (char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[4], (char)i[5], (char)i[6], (char)i[7]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001462 static_assert(sizeof(initializer) == vectorSize, "!");
1463 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1464 }
1465 break;
1466 case Type_v4i8:
1467 {
Nicolas Capens7f3f69c2016-10-20 01:29:33 -04001468 const char initializer[16] = {(char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[0], (char)i[1], (char)i[2], (char)i[3], (char)i[0], (char)i[1], (char)i[2], (char)i[3]};
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001469 static_assert(sizeof(initializer) == vectorSize, "!");
1470 dataInitializer = Ice::VariableDeclaration::DataInitializer::create(globalPool, (const char*)initializer, vectorSize);
1471 }
1472 break;
1473 default:
1474 assert(false && "Unknown constant vector type" && type);
1475 }
1476
1477 auto name = Ice::GlobalString::createWithoutString(::context);
1478 auto *variableDeclaration = Ice::VariableDeclaration::create(globalPool);
1479 variableDeclaration->setName(name);
1480 variableDeclaration->setAlignment(alignment);
1481 variableDeclaration->setIsConstant(true);
1482 variableDeclaration->addInitializer(dataInitializer);
Nicolas Capens87852e12016-11-24 14:45:06 -05001483
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001484 ::function->addGlobal(variableDeclaration);
1485
1486 constexpr int32_t offset = 0;
1487 Ice::Operand *ptr = ::context->getConstantSym(offset, name);
1488
1489 Ice::Variable *result = ::function->makeVariable(T(type));
1490 auto load = Ice::InstLoad::create(::function, result, ptr, alignment);
1491 ::basicBlock->appendInst(load);
1492
1493 return V(result);
Nicolas Capens13ac2322016-10-13 14:52:12 -04001494 }
1495
1496 Value *Nucleus::createConstantVector(const double *constants, Type *type)
Nicolas Capens598f8d82016-09-26 15:09:10 -04001497 {
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04001498 return createConstantVector((const int64_t*)constants, type);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001499 }
1500
1501 Type *Void::getType()
1502 {
1503 return T(Ice::IceType_void);
1504 }
1505
Nicolas Capens598f8d82016-09-26 15:09:10 -04001506 Type *Bool::getType()
1507 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001508 return T(Ice::IceType_i1);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001509 }
1510
Nicolas Capens598f8d82016-09-26 15:09:10 -04001511 Type *Byte::getType()
1512 {
Nicolas Capens6d738712016-09-30 04:15:22 -04001513 return T(Ice::IceType_i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001514 }
1515
Nicolas Capens598f8d82016-09-26 15:09:10 -04001516 Type *SByte::getType()
1517 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001518 return T(Ice::IceType_i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001519 }
1520
Nicolas Capens598f8d82016-09-26 15:09:10 -04001521 Type *Short::getType()
1522 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001523 return T(Ice::IceType_i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001524 }
1525
Nicolas Capens598f8d82016-09-26 15:09:10 -04001526 Type *UShort::getType()
1527 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001528 return T(Ice::IceType_i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001529 }
1530
1531 Type *Byte4::getType()
1532 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001533 return T(Type_v4i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001534 }
1535
1536 Type *SByte4::getType()
1537 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001538 return T(Type_v4i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001539 }
1540
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001541 namespace
Nicolas Capens598f8d82016-09-26 15:09:10 -04001542 {
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001543 RValue<Byte> SaturateUnsigned(RValue<Short> x)
1544 {
1545 return Byte(IfThenElse(Int(x) > 0xFF, Int(0xFF), IfThenElse(Int(x) < 0, Int(0), Int(x))));
1546 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001547
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001548 RValue<Byte> Extract(RValue<Byte8> val, int i)
1549 {
1550 return RValue<Byte>(Nucleus::createExtractElement(val.value, Byte::getType(), i));
1551 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001552
Nicolas Capensb6d4ce32019-03-12 23:00:24 -04001553 RValue<Byte8> Insert(RValue<Byte8> val, RValue<Byte> element, int i)
1554 {
1555 return RValue<Byte8>(Nucleus::createInsertElement(val.value, element.value, i));
1556 }
Nicolas Capens98436732017-07-25 15:32:12 -04001557 }
1558
Nicolas Capens598f8d82016-09-26 15:09:10 -04001559 RValue<Byte8> AddSat(RValue<Byte8> x, RValue<Byte8> y)
1560 {
Nicolas Capens98436732017-07-25 15:32:12 -04001561 if(emulateIntrinsics)
1562 {
1563 Byte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001564 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 0)) + Int(Extract(y, 0)))), 0);
1565 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 1)) + Int(Extract(y, 1)))), 1);
1566 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 2)) + Int(Extract(y, 2)))), 2);
1567 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 3)) + Int(Extract(y, 3)))), 3);
1568 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 4)) + Int(Extract(y, 4)))), 4);
1569 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 5)) + Int(Extract(y, 5)))), 5);
1570 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 6)) + Int(Extract(y, 6)))), 6);
1571 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 7)) + Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001572
Nicolas Capens98436732017-07-25 15:32:12 -04001573 return result;
1574 }
1575 else
1576 {
1577 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1578 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1579 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1580 auto paddusb = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1581 paddusb->addArg(x.value);
1582 paddusb->addArg(y.value);
1583 ::basicBlock->appendInst(paddusb);
1584
1585 return RValue<Byte8>(V(result));
1586 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001587 }
1588
1589 RValue<Byte8> SubSat(RValue<Byte8> x, RValue<Byte8> y)
1590 {
Nicolas Capens98436732017-07-25 15:32:12 -04001591 if(emulateIntrinsics)
1592 {
1593 Byte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001594 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 0)) - Int(Extract(y, 0)))), 0);
1595 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 1)) - Int(Extract(y, 1)))), 1);
1596 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 2)) - Int(Extract(y, 2)))), 2);
1597 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 3)) - Int(Extract(y, 3)))), 3);
1598 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 4)) - Int(Extract(y, 4)))), 4);
1599 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 5)) - Int(Extract(y, 5)))), 5);
1600 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 6)) - Int(Extract(y, 6)))), 6);
1601 result = Insert(result, SaturateUnsigned(Short(Int(Extract(x, 7)) - Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001602
Nicolas Capens98436732017-07-25 15:32:12 -04001603 return result;
1604 }
1605 else
1606 {
1607 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1608 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1609 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1610 auto psubusw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1611 psubusw->addArg(x.value);
1612 psubusw->addArg(y.value);
1613 ::basicBlock->appendInst(psubusw);
1614
1615 return RValue<Byte8>(V(result));
1616 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001617 }
1618
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001619 RValue<SByte> Extract(RValue<SByte8> val, int i)
1620 {
1621 return RValue<SByte>(Nucleus::createExtractElement(val.value, SByte::getType(), i));
1622 }
1623
1624 RValue<SByte8> Insert(RValue<SByte8> val, RValue<SByte> element, int i)
1625 {
1626 return RValue<SByte8>(Nucleus::createInsertElement(val.value, element.value, i));
1627 }
1628
1629 RValue<SByte8> operator>>(RValue<SByte8> lhs, unsigned char rhs)
1630 {
1631 if(emulateIntrinsics)
1632 {
1633 SByte8 result;
1634 result = Insert(result, Extract(lhs, 0) >> SByte(rhs), 0);
1635 result = Insert(result, Extract(lhs, 1) >> SByte(rhs), 1);
1636 result = Insert(result, Extract(lhs, 2) >> SByte(rhs), 2);
1637 result = Insert(result, Extract(lhs, 3) >> SByte(rhs), 3);
1638 result = Insert(result, Extract(lhs, 4) >> SByte(rhs), 4);
1639 result = Insert(result, Extract(lhs, 5) >> SByte(rhs), 5);
1640 result = Insert(result, Extract(lhs, 6) >> SByte(rhs), 6);
1641 result = Insert(result, Extract(lhs, 7) >> SByte(rhs), 7);
1642
1643 return result;
1644 }
1645 else
1646 {
1647 #if defined(__i386__) || defined(__x86_64__)
1648 // SSE2 doesn't support byte vector shifts, so shift as shorts and recombine.
Alexis Hetue18c5302017-08-04 11:48:17 -04001649 RValue<Short4> hi = (As<Short4>(lhs) >> rhs) & Short4(0xFF00u);
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001650 RValue<Short4> lo = As<Short4>(As<UShort4>((As<Short4>(lhs) << 8) >> rhs) >> 8);
1651
1652 return As<SByte8>(hi | lo);
1653 #else
1654 return RValue<SByte8>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
1655 #endif
1656 }
1657 }
1658
Nicolas Capens598f8d82016-09-26 15:09:10 -04001659 RValue<Int> SignMask(RValue<Byte8> x)
1660 {
Nicolas Capens091f3502017-10-03 14:56:49 -04001661 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001662 {
1663 Byte8 xx = As<Byte8>(As<SByte8>(x) >> 7) & Byte8(0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80);
1664 return Int(Extract(xx, 0)) | Int(Extract(xx, 1)) | Int(Extract(xx, 2)) | Int(Extract(xx, 3)) | Int(Extract(xx, 4)) | Int(Extract(xx, 5)) | Int(Extract(xx, 6)) | Int(Extract(xx, 7));
1665 }
1666 else
1667 {
1668 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
1669 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1670 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1671 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
1672 movmsk->addArg(x.value);
1673 ::basicBlock->appendInst(movmsk);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001674
Nicolas Capens0f70a7f2017-07-26 13:50:04 -04001675 return RValue<Int>(V(result)) & 0xFF;
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001676 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001677 }
1678
1679// RValue<Byte8> CmpGT(RValue<Byte8> x, RValue<Byte8> y)
1680// {
Nicolas Capens2f970b62016-11-08 14:28:59 -05001681// return RValue<Byte8>(createIntCompare(Ice::InstIcmp::Ugt, x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001682// }
1683
1684 RValue<Byte8> CmpEQ(RValue<Byte8> x, RValue<Byte8> y)
1685 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05001686 return RValue<Byte8>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001687 }
1688
1689 Type *Byte8::getType()
1690 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001691 return T(Type_v8i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001692 }
1693
Nicolas Capens598f8d82016-09-26 15:09:10 -04001694// RValue<SByte8> operator<<(RValue<SByte8> lhs, unsigned char rhs)
1695// {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001696// return RValue<SByte8>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001697// }
1698
1699// RValue<SByte8> operator>>(RValue<SByte8> lhs, unsigned char rhs)
1700// {
Nicolas Capens15060bb2016-12-05 22:17:19 -05001701// return RValue<SByte8>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001702// }
1703
Nicolas Capens33438a62017-09-27 11:47:35 -04001704 RValue<SByte> SaturateSigned(RValue<Short> x)
Nicolas Capens98436732017-07-25 15:32:12 -04001705 {
1706 return SByte(IfThenElse(Int(x) > 0x7F, Int(0x7F), IfThenElse(Int(x) < -0x80, Int(0x80), Int(x))));
1707 }
1708
Nicolas Capens598f8d82016-09-26 15:09:10 -04001709 RValue<SByte8> AddSat(RValue<SByte8> x, RValue<SByte8> y)
1710 {
Nicolas Capens98436732017-07-25 15:32:12 -04001711 if(emulateIntrinsics)
1712 {
1713 SByte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001714 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 0)) + Int(Extract(y, 0)))), 0);
1715 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 1)) + Int(Extract(y, 1)))), 1);
1716 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 2)) + Int(Extract(y, 2)))), 2);
1717 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 3)) + Int(Extract(y, 3)))), 3);
1718 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 4)) + Int(Extract(y, 4)))), 4);
1719 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 5)) + Int(Extract(y, 5)))), 5);
1720 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 6)) + Int(Extract(y, 6)))), 6);
1721 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 7)) + Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001722
Nicolas Capens98436732017-07-25 15:32:12 -04001723 return result;
1724 }
1725 else
1726 {
1727 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1728 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1729 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1730 auto paddsb = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1731 paddsb->addArg(x.value);
1732 paddsb->addArg(y.value);
1733 ::basicBlock->appendInst(paddsb);
1734
1735 return RValue<SByte8>(V(result));
1736 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001737 }
1738
1739 RValue<SByte8> SubSat(RValue<SByte8> x, RValue<SByte8> y)
1740 {
Nicolas Capens98436732017-07-25 15:32:12 -04001741 if(emulateIntrinsics)
1742 {
1743 SByte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001744 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 0)) - Int(Extract(y, 0)))), 0);
1745 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 1)) - Int(Extract(y, 1)))), 1);
1746 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 2)) - Int(Extract(y, 2)))), 2);
1747 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 3)) - Int(Extract(y, 3)))), 3);
1748 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 4)) - Int(Extract(y, 4)))), 4);
1749 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 5)) - Int(Extract(y, 5)))), 5);
1750 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 6)) - Int(Extract(y, 6)))), 6);
1751 result = Insert(result, SaturateSigned(Short(Int(Extract(x, 7)) - Int(Extract(y, 7)))), 7);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001752
Nicolas Capens98436732017-07-25 15:32:12 -04001753 return result;
1754 }
1755 else
1756 {
1757 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
1758 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1759 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1760 auto psubsb = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1761 psubsb->addArg(x.value);
1762 psubsb->addArg(y.value);
1763 ::basicBlock->appendInst(psubsb);
1764
1765 return RValue<SByte8>(V(result));
1766 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001767 }
1768
Nicolas Capens598f8d82016-09-26 15:09:10 -04001769 RValue<Int> SignMask(RValue<SByte8> x)
1770 {
Nicolas Capens091f3502017-10-03 14:56:49 -04001771 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001772 {
1773 SByte8 xx = (x >> 7) & SByte8(0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80);
1774 return Int(Extract(xx, 0)) | Int(Extract(xx, 1)) | Int(Extract(xx, 2)) | Int(Extract(xx, 3)) | Int(Extract(xx, 4)) | Int(Extract(xx, 5)) | Int(Extract(xx, 6)) | Int(Extract(xx, 7));
1775 }
1776 else
1777 {
1778 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
1779 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1780 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1781 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
1782 movmsk->addArg(x.value);
1783 ::basicBlock->appendInst(movmsk);
Nicolas Capensf2cb9df2016-10-21 17:26:13 -04001784
Nicolas Capens0f70a7f2017-07-26 13:50:04 -04001785 return RValue<Int>(V(result)) & 0xFF;
Nicolas Capensd6cacad2017-07-25 15:32:12 -04001786 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001787 }
1788
1789 RValue<Byte8> CmpGT(RValue<SByte8> x, RValue<SByte8> y)
1790 {
Nicolas Capens2f970b62016-11-08 14:28:59 -05001791 return RValue<Byte8>(createIntCompare(Ice::InstIcmp::Sgt, x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001792 }
1793
1794 RValue<Byte8> CmpEQ(RValue<SByte8> x, RValue<SByte8> y)
1795 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05001796 return RValue<Byte8>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001797 }
1798
1799 Type *SByte8::getType()
1800 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04001801 return T(Type_v8i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001802 }
1803
Nicolas Capens598f8d82016-09-26 15:09:10 -04001804 Type *Byte16::getType()
1805 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001806 return T(Ice::IceType_v16i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001807 }
1808
1809 Type *SByte16::getType()
1810 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001811 return T(Ice::IceType_v16i8);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001812 }
1813
Nicolas Capens16b5f152016-10-13 13:39:01 -04001814 Type *Short2::getType()
1815 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001816 return T(Type_v2i16);
Nicolas Capens16b5f152016-10-13 13:39:01 -04001817 }
1818
Nicolas Capens16b5f152016-10-13 13:39:01 -04001819 Type *UShort2::getType()
1820 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04001821 return T(Type_v2i16);
Nicolas Capens16b5f152016-10-13 13:39:01 -04001822 }
1823
Nicolas Capens598f8d82016-09-26 15:09:10 -04001824 Short4::Short4(RValue<Int4> cast)
1825 {
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08001826 int select[8] = {0, 2, 4, 6, 0, 2, 4, 6};
1827 Value *short8 = Nucleus::createBitCast(cast.value, Short8::getType());
1828 Value *packed = Nucleus::createShuffleVector(short8, short8, select);
Nicolas Capensd4227962016-11-09 14:24:25 -05001829
Nicolas Capensbea4dce2017-07-24 16:54:44 -04001830 Value *int2 = RValue<Int2>(Int2(As<Int4>(packed))).value;
Nicolas Capensd4227962016-11-09 14:24:25 -05001831 Value *short4 = Nucleus::createBitCast(int2, Short4::getType());
1832
1833 storeValue(short4);
Nicolas Capens598f8d82016-09-26 15:09:10 -04001834 }
1835
1836// Short4::Short4(RValue<Float> cast)
1837// {
1838// }
1839
1840 Short4::Short4(RValue<Float4> cast)
1841 {
1842 assert(false && "UNIMPLEMENTED");
1843 }
1844
Nicolas Capens598f8d82016-09-26 15:09:10 -04001845 RValue<Short4> operator<<(RValue<Short4> lhs, unsigned char rhs)
1846 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04001847 if(emulateIntrinsics)
1848 {
1849 Short4 result;
1850 result = Insert(result, Extract(lhs, 0) << Short(rhs), 0);
1851 result = Insert(result, Extract(lhs, 1) << Short(rhs), 1);
1852 result = Insert(result, Extract(lhs, 2) << Short(rhs), 2);
1853 result = Insert(result, Extract(lhs, 3) << Short(rhs), 3);
1854
1855 return result;
1856 }
1857 else
1858 {
1859 return RValue<Short4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
1860 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001861 }
1862
1863 RValue<Short4> operator>>(RValue<Short4> lhs, unsigned char rhs)
1864 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04001865 if(emulateIntrinsics)
1866 {
1867 Short4 result;
1868 result = Insert(result, Extract(lhs, 0) >> Short(rhs), 0);
1869 result = Insert(result, Extract(lhs, 1) >> Short(rhs), 1);
1870 result = Insert(result, Extract(lhs, 2) >> Short(rhs), 2);
1871 result = Insert(result, Extract(lhs, 3) >> Short(rhs), 3);
1872
1873 return result;
1874 }
1875 else
1876 {
1877 return RValue<Short4>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
1878 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001879 }
1880
Nicolas Capens598f8d82016-09-26 15:09:10 -04001881 RValue<Short4> Max(RValue<Short4> x, RValue<Short4> y)
1882 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04001883 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
1884 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sle, condition, x.value, y.value);
1885 ::basicBlock->appendInst(cmp);
1886
1887 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1888 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
1889 ::basicBlock->appendInst(select);
1890
1891 return RValue<Short4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001892 }
1893
1894 RValue<Short4> Min(RValue<Short4> x, RValue<Short4> y)
1895 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04001896 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
1897 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sgt, condition, x.value, y.value);
1898 ::basicBlock->appendInst(cmp);
1899
1900 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1901 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
1902 ::basicBlock->appendInst(select);
1903
1904 return RValue<Short4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04001905 }
1906
Nicolas Capens33438a62017-09-27 11:47:35 -04001907 RValue<Short> SaturateSigned(RValue<Int> x)
Nicolas Capens98436732017-07-25 15:32:12 -04001908 {
1909 return Short(IfThenElse(x > 0x7FFF, Int(0x7FFF), IfThenElse(x < -0x8000, Int(0x8000), x)));
1910 }
1911
Nicolas Capens598f8d82016-09-26 15:09:10 -04001912 RValue<Short4> AddSat(RValue<Short4> x, RValue<Short4> y)
1913 {
Nicolas Capens98436732017-07-25 15:32:12 -04001914 if(emulateIntrinsics)
1915 {
1916 Short4 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001917 result = Insert(result, SaturateSigned(Int(Extract(x, 0)) + Int(Extract(y, 0))), 0);
1918 result = Insert(result, SaturateSigned(Int(Extract(x, 1)) + Int(Extract(y, 1))), 1);
1919 result = Insert(result, SaturateSigned(Int(Extract(x, 2)) + Int(Extract(y, 2))), 2);
1920 result = Insert(result, SaturateSigned(Int(Extract(x, 3)) + Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001921
Nicolas Capens98436732017-07-25 15:32:12 -04001922 return result;
1923 }
1924 else
1925 {
1926 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1927 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1928 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1929 auto paddsw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1930 paddsw->addArg(x.value);
1931 paddsw->addArg(y.value);
1932 ::basicBlock->appendInst(paddsw);
1933
1934 return RValue<Short4>(V(result));
1935 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001936 }
1937
1938 RValue<Short4> SubSat(RValue<Short4> x, RValue<Short4> y)
1939 {
Nicolas Capens98436732017-07-25 15:32:12 -04001940 if(emulateIntrinsics)
1941 {
1942 Short4 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04001943 result = Insert(result, SaturateSigned(Int(Extract(x, 0)) - Int(Extract(y, 0))), 0);
1944 result = Insert(result, SaturateSigned(Int(Extract(x, 1)) - Int(Extract(y, 1))), 1);
1945 result = Insert(result, SaturateSigned(Int(Extract(x, 2)) - Int(Extract(y, 2))), 2);
1946 result = Insert(result, SaturateSigned(Int(Extract(x, 3)) - Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001947
Nicolas Capens98436732017-07-25 15:32:12 -04001948 return result;
1949 }
1950 else
1951 {
1952 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1953 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1954 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1955 auto psubsw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1956 psubsw->addArg(x.value);
1957 psubsw->addArg(y.value);
1958 ::basicBlock->appendInst(psubsw);
1959
1960 return RValue<Short4>(V(result));
1961 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001962 }
1963
1964 RValue<Short4> MulHigh(RValue<Short4> x, RValue<Short4> y)
1965 {
Nicolas Capens6c157442017-07-25 15:32:12 -04001966 if(emulateIntrinsics)
1967 {
1968 Short4 result;
1969 result = Insert(result, Short((Int(Extract(x, 0)) * Int(Extract(y, 0))) >> 16), 0);
1970 result = Insert(result, Short((Int(Extract(x, 1)) * Int(Extract(y, 1))) >> 16), 1);
1971 result = Insert(result, Short((Int(Extract(x, 2)) * Int(Extract(y, 2))) >> 16), 2);
1972 result = Insert(result, Short((Int(Extract(x, 3)) * Int(Extract(y, 3))) >> 16), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001973
Nicolas Capens6c157442017-07-25 15:32:12 -04001974 return result;
1975 }
1976 else
1977 {
1978 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
1979 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::MultiplyHighSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
1980 auto target = ::context->getConstantUndef(Ice::IceType_i32);
1981 auto pmulhw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
1982 pmulhw->addArg(x.value);
1983 pmulhw->addArg(y.value);
1984 ::basicBlock->appendInst(pmulhw);
1985
1986 return RValue<Short4>(V(result));
1987 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04001988 }
1989
1990 RValue<Int2> MulAdd(RValue<Short4> x, RValue<Short4> y)
1991 {
Nicolas Capensafe27e92017-07-25 15:32:12 -04001992 if(emulateIntrinsics)
1993 {
1994 Int2 result;
1995 result = Insert(result, Int(Extract(x, 0)) * Int(Extract(y, 0)) + Int(Extract(x, 1)) * Int(Extract(y, 1)), 0);
1996 result = Insert(result, Int(Extract(x, 2)) * Int(Extract(y, 2)) + Int(Extract(x, 3)) * Int(Extract(y, 3)), 1);
Nicolas Capensc71bed22016-11-07 22:25:14 -05001997
Nicolas Capensafe27e92017-07-25 15:32:12 -04001998 return result;
1999 }
2000 else
2001 {
2002 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2003 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::MultiplyAddPairs, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2004 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2005 auto pmaddwd = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2006 pmaddwd->addArg(x.value);
2007 pmaddwd->addArg(y.value);
2008 ::basicBlock->appendInst(pmaddwd);
2009
2010 return As<Int2>(V(result));
2011 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002012 }
2013
Nicolas Capens33438a62017-09-27 11:47:35 -04002014 RValue<SByte8> PackSigned(RValue<Short4> x, RValue<Short4> y)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002015 {
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002016 if(emulateIntrinsics)
2017 {
2018 SByte8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04002019 result = Insert(result, SaturateSigned(Extract(x, 0)), 0);
2020 result = Insert(result, SaturateSigned(Extract(x, 1)), 1);
2021 result = Insert(result, SaturateSigned(Extract(x, 2)), 2);
2022 result = Insert(result, SaturateSigned(Extract(x, 3)), 3);
2023 result = Insert(result, SaturateSigned(Extract(y, 0)), 4);
2024 result = Insert(result, SaturateSigned(Extract(y, 1)), 5);
2025 result = Insert(result, SaturateSigned(Extract(y, 2)), 6);
2026 result = Insert(result, SaturateSigned(Extract(y, 3)), 7);
Nicolas Capensec54a172016-10-25 17:32:37 -04002027
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002028 return result;
2029 }
2030 else
2031 {
2032 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
2033 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2034 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2035 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2036 pack->addArg(x.value);
2037 pack->addArg(y.value);
2038 ::basicBlock->appendInst(pack);
2039
2040 return As<SByte8>(Swizzle(As<Int4>(V(result)), 0x88));
2041 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002042 }
2043
Nicolas Capens33438a62017-09-27 11:47:35 -04002044 RValue<Byte8> PackUnsigned(RValue<Short4> x, RValue<Short4> y)
2045 {
2046 if(emulateIntrinsics)
2047 {
2048 Byte8 result;
2049 result = Insert(result, SaturateUnsigned(Extract(x, 0)), 0);
2050 result = Insert(result, SaturateUnsigned(Extract(x, 1)), 1);
2051 result = Insert(result, SaturateUnsigned(Extract(x, 2)), 2);
2052 result = Insert(result, SaturateUnsigned(Extract(x, 3)), 3);
2053 result = Insert(result, SaturateUnsigned(Extract(y, 0)), 4);
2054 result = Insert(result, SaturateUnsigned(Extract(y, 1)), 5);
2055 result = Insert(result, SaturateUnsigned(Extract(y, 2)), 6);
2056 result = Insert(result, SaturateUnsigned(Extract(y, 3)), 7);
2057
2058 return result;
2059 }
2060 else
2061 {
2062 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v16i8);
2063 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2064 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2065 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2066 pack->addArg(x.value);
2067 pack->addArg(y.value);
2068 ::basicBlock->appendInst(pack);
2069
2070 return As<Byte8>(Swizzle(As<Int4>(V(result)), 0x88));
2071 }
2072 }
2073
Nicolas Capens598f8d82016-09-26 15:09:10 -04002074 RValue<Short4> CmpGT(RValue<Short4> x, RValue<Short4> y)
2075 {
Nicolas Capens2f970b62016-11-08 14:28:59 -05002076 return RValue<Short4>(createIntCompare(Ice::InstIcmp::Sgt, x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002077 }
2078
2079 RValue<Short4> CmpEQ(RValue<Short4> x, RValue<Short4> y)
2080 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002081 return RValue<Short4>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002082 }
2083
2084 Type *Short4::getType()
2085 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04002086 return T(Type_v4i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002087 }
2088
Nicolas Capens598f8d82016-09-26 15:09:10 -04002089 UShort4::UShort4(RValue<Float4> cast, bool saturate)
2090 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002091 if(saturate)
2092 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05002093 if(CPUID::SSE4_1)
Nicolas Capensd4227962016-11-09 14:24:25 -05002094 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002095 // x86 produces 0x80000000 on 32-bit integer overflow/underflow.
2096 // PackUnsigned takes care of 0x0000 saturation.
2097 Int4 int4(Min(cast, Float4(0xFFFF)));
2098 *this = As<UShort4>(PackUnsigned(int4, int4));
2099 }
2100 else if(CPUID::ARM)
2101 {
2102 // ARM saturates the 32-bit integer result on overflow/undeflow.
2103 Int4 int4(cast);
Nicolas Capens33438a62017-09-27 11:47:35 -04002104 *this = As<UShort4>(PackUnsigned(int4, int4));
Nicolas Capensd4227962016-11-09 14:24:25 -05002105 }
2106 else
2107 {
2108 *this = Short4(Int4(Max(Min(cast, Float4(0xFFFF)), Float4(0x0000))));
2109 }
2110 }
2111 else
2112 {
2113 *this = Short4(Int4(cast));
2114 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002115 }
2116
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002117 RValue<UShort> Extract(RValue<UShort4> val, int i)
2118 {
2119 return RValue<UShort>(Nucleus::createExtractElement(val.value, UShort::getType(), i));
2120 }
2121
2122 RValue<UShort4> Insert(RValue<UShort4> val, RValue<UShort> element, int i)
2123 {
2124 return RValue<UShort4>(Nucleus::createInsertElement(val.value, element.value, i));
2125 }
2126
Nicolas Capens598f8d82016-09-26 15:09:10 -04002127 RValue<UShort4> operator<<(RValue<UShort4> lhs, unsigned char rhs)
2128 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002129 if(emulateIntrinsics)
2130 {
2131 UShort4 result;
2132 result = Insert(result, Extract(lhs, 0) << UShort(rhs), 0);
2133 result = Insert(result, Extract(lhs, 1) << UShort(rhs), 1);
2134 result = Insert(result, Extract(lhs, 2) << UShort(rhs), 2);
2135 result = Insert(result, Extract(lhs, 3) << UShort(rhs), 3);
2136
2137 return result;
2138 }
2139 else
2140 {
2141 return RValue<UShort4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2142 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002143 }
2144
2145 RValue<UShort4> operator>>(RValue<UShort4> lhs, unsigned char rhs)
2146 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002147 if(emulateIntrinsics)
2148 {
2149 UShort4 result;
2150 result = Insert(result, Extract(lhs, 0) >> UShort(rhs), 0);
2151 result = Insert(result, Extract(lhs, 1) >> UShort(rhs), 1);
2152 result = Insert(result, Extract(lhs, 2) >> UShort(rhs), 2);
2153 result = Insert(result, Extract(lhs, 3) >> UShort(rhs), 3);
2154
2155 return result;
2156 }
2157 else
2158 {
2159 return RValue<UShort4>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2160 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002161 }
2162
Nicolas Capens598f8d82016-09-26 15:09:10 -04002163 RValue<UShort4> Max(RValue<UShort4> x, RValue<UShort4> y)
2164 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002165 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
2166 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ule, condition, x.value, y.value);
2167 ::basicBlock->appendInst(cmp);
2168
2169 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2170 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2171 ::basicBlock->appendInst(select);
2172
2173 return RValue<UShort4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002174 }
2175
2176 RValue<UShort4> Min(RValue<UShort4> x, RValue<UShort4> y)
2177 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002178 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
2179 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ugt, condition, x.value, y.value);
2180 ::basicBlock->appendInst(cmp);
2181
2182 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2183 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2184 ::basicBlock->appendInst(select);
2185
2186 return RValue<UShort4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002187 }
2188
Nicolas Capens7f301812017-10-02 17:32:34 -04002189 RValue<UShort> SaturateUnsigned(RValue<Int> x)
Nicolas Capens98436732017-07-25 15:32:12 -04002190 {
2191 return UShort(IfThenElse(x > 0xFFFF, Int(0xFFFF), IfThenElse(x < 0, Int(0), x)));
2192 }
2193
Nicolas Capens598f8d82016-09-26 15:09:10 -04002194 RValue<UShort4> AddSat(RValue<UShort4> x, RValue<UShort4> y)
2195 {
Nicolas Capens98436732017-07-25 15:32:12 -04002196 if(emulateIntrinsics)
2197 {
2198 UShort4 result;
Nicolas Capens7f301812017-10-02 17:32:34 -04002199 result = Insert(result, SaturateUnsigned(Int(Extract(x, 0)) + Int(Extract(y, 0))), 0);
2200 result = Insert(result, SaturateUnsigned(Int(Extract(x, 1)) + Int(Extract(y, 1))), 1);
2201 result = Insert(result, SaturateUnsigned(Int(Extract(x, 2)) + Int(Extract(y, 2))), 2);
2202 result = Insert(result, SaturateUnsigned(Int(Extract(x, 3)) + Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002203
Nicolas Capens98436732017-07-25 15:32:12 -04002204 return result;
2205 }
2206 else
2207 {
2208 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2209 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::AddSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2210 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2211 auto paddusw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2212 paddusw->addArg(x.value);
2213 paddusw->addArg(y.value);
2214 ::basicBlock->appendInst(paddusw);
2215
2216 return RValue<UShort4>(V(result));
2217 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002218 }
2219
2220 RValue<UShort4> SubSat(RValue<UShort4> x, RValue<UShort4> y)
2221 {
Nicolas Capens98436732017-07-25 15:32:12 -04002222 if(emulateIntrinsics)
2223 {
2224 UShort4 result;
Nicolas Capens7f301812017-10-02 17:32:34 -04002225 result = Insert(result, SaturateUnsigned(Int(Extract(x, 0)) - Int(Extract(y, 0))), 0);
2226 result = Insert(result, SaturateUnsigned(Int(Extract(x, 1)) - Int(Extract(y, 1))), 1);
2227 result = Insert(result, SaturateUnsigned(Int(Extract(x, 2)) - Int(Extract(y, 2))), 2);
2228 result = Insert(result, SaturateUnsigned(Int(Extract(x, 3)) - Int(Extract(y, 3))), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002229
Nicolas Capens98436732017-07-25 15:32:12 -04002230 return result;
2231 }
2232 else
2233 {
2234 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2235 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SubtractSaturateUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2236 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2237 auto psubusw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2238 psubusw->addArg(x.value);
2239 psubusw->addArg(y.value);
2240 ::basicBlock->appendInst(psubusw);
2241
2242 return RValue<UShort4>(V(result));
2243 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002244 }
2245
2246 RValue<UShort4> MulHigh(RValue<UShort4> x, RValue<UShort4> y)
2247 {
Nicolas Capens6c157442017-07-25 15:32:12 -04002248 if(emulateIntrinsics)
2249 {
2250 UShort4 result;
2251 result = Insert(result, UShort((UInt(Extract(x, 0)) * UInt(Extract(y, 0))) >> 16), 0);
2252 result = Insert(result, UShort((UInt(Extract(x, 1)) * UInt(Extract(y, 1))) >> 16), 1);
2253 result = Insert(result, UShort((UInt(Extract(x, 2)) * UInt(Extract(y, 2))) >> 16), 2);
2254 result = Insert(result, UShort((UInt(Extract(x, 3)) * UInt(Extract(y, 3))) >> 16), 3);
Nicolas Capensc71bed22016-11-07 22:25:14 -05002255
Nicolas Capens6c157442017-07-25 15:32:12 -04002256 return result;
2257 }
2258 else
2259 {
2260 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2261 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::MultiplyHighUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2262 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2263 auto pmulhuw = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2264 pmulhuw->addArg(x.value);
2265 pmulhuw->addArg(y.value);
2266 ::basicBlock->appendInst(pmulhuw);
2267
2268 return RValue<UShort4>(V(result));
2269 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002270 }
2271
Chris Forbesaa8f6992019-03-01 14:18:30 -08002272 RValue<Int4> MulHigh(RValue<Int4> x, RValue<Int4> y)
2273 {
2274 // TODO: For x86, build an intrinsics version of this which uses shuffles + pmuludq.
2275
2276 // Scalarized implementation.
2277 Int4 result;
2278 result = Insert(result, Int((Long(Extract(x, 0)) * Long(Extract(y, 0))) >> Long(Int(32))), 0);
2279 result = Insert(result, Int((Long(Extract(x, 1)) * Long(Extract(y, 1))) >> Long(Int(32))), 1);
2280 result = Insert(result, Int((Long(Extract(x, 2)) * Long(Extract(y, 2))) >> Long(Int(32))), 2);
2281 result = Insert(result, Int((Long(Extract(x, 3)) * Long(Extract(y, 3))) >> Long(Int(32))), 3);
2282
2283 return result;
2284 }
2285
2286 RValue<UInt4> MulHigh(RValue<UInt4> x, RValue<UInt4> y)
2287 {
2288 // TODO: For x86, build an intrinsics version of this which uses shuffles + pmuludq.
2289
2290 if(false) // Partial product based implementation.
2291 {
2292 auto xh = x >> 16;
2293 auto yh = y >> 16;
2294 auto xl = x & UInt4(0x0000FFFF);
2295 auto yl = y & UInt4(0x0000FFFF);
2296 auto xlyh = xl * yh;
2297 auto xhyl = xh * yl;
2298 auto xlyhh = xlyh >> 16;
2299 auto xhylh = xhyl >> 16;
2300 auto xlyhl = xlyh & UInt4(0x0000FFFF);
2301 auto xhyll = xhyl & UInt4(0x0000FFFF);
2302 auto xlylh = (xl * yl) >> 16;
2303 auto oflow = (xlyhl + xhyll + xlylh) >> 16;
2304
2305 return (xh * yh) + (xlyhh + xhylh) + oflow;
2306 }
2307
2308 // Scalarized implementation.
2309 Int4 result;
2310 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 0))) * Long(UInt(Extract(As<Int4>(y), 0)))) >> Long(Int(32))), 0);
2311 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 1))) * Long(UInt(Extract(As<Int4>(y), 1)))) >> Long(Int(32))), 1);
2312 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 2))) * Long(UInt(Extract(As<Int4>(y), 2)))) >> Long(Int(32))), 2);
2313 result = Insert(result, Int((Long(UInt(Extract(As<Int4>(x), 3))) * Long(UInt(Extract(As<Int4>(y), 3)))) >> Long(Int(32))), 3);
2314
2315 return As<UInt4>(result);
2316 }
2317
Nicolas Capens598f8d82016-09-26 15:09:10 -04002318 RValue<UShort4> Average(RValue<UShort4> x, RValue<UShort4> y)
2319 {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002320 assert(false && "UNIMPLEMENTED"); return RValue<UShort4>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002321 }
2322
Nicolas Capens598f8d82016-09-26 15:09:10 -04002323 Type *UShort4::getType()
2324 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04002325 return T(Type_v4i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002326 }
2327
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002328 RValue<Short> Extract(RValue<Short8> val, int i)
2329 {
2330 return RValue<Short>(Nucleus::createExtractElement(val.value, Short::getType(), i));
2331 }
2332
2333 RValue<Short8> Insert(RValue<Short8> val, RValue<Short> element, int i)
2334 {
2335 return RValue<Short8>(Nucleus::createInsertElement(val.value, element.value, i));
2336 }
2337
Nicolas Capens598f8d82016-09-26 15:09:10 -04002338 RValue<Short8> operator<<(RValue<Short8> lhs, unsigned char rhs)
2339 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002340 if(emulateIntrinsics)
2341 {
2342 Short8 result;
2343 result = Insert(result, Extract(lhs, 0) << Short(rhs), 0);
2344 result = Insert(result, Extract(lhs, 1) << Short(rhs), 1);
2345 result = Insert(result, Extract(lhs, 2) << Short(rhs), 2);
2346 result = Insert(result, Extract(lhs, 3) << Short(rhs), 3);
2347 result = Insert(result, Extract(lhs, 4) << Short(rhs), 4);
2348 result = Insert(result, Extract(lhs, 5) << Short(rhs), 5);
2349 result = Insert(result, Extract(lhs, 6) << Short(rhs), 6);
2350 result = Insert(result, Extract(lhs, 7) << Short(rhs), 7);
2351
2352 return result;
2353 }
2354 else
2355 {
2356 return RValue<Short8>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2357 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002358 }
2359
2360 RValue<Short8> operator>>(RValue<Short8> lhs, unsigned char rhs)
2361 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002362 if(emulateIntrinsics)
2363 {
2364 Short8 result;
2365 result = Insert(result, Extract(lhs, 0) >> Short(rhs), 0);
2366 result = Insert(result, Extract(lhs, 1) >> Short(rhs), 1);
2367 result = Insert(result, Extract(lhs, 2) >> Short(rhs), 2);
2368 result = Insert(result, Extract(lhs, 3) >> Short(rhs), 3);
2369 result = Insert(result, Extract(lhs, 4) >> Short(rhs), 4);
2370 result = Insert(result, Extract(lhs, 5) >> Short(rhs), 5);
2371 result = Insert(result, Extract(lhs, 6) >> Short(rhs), 6);
2372 result = Insert(result, Extract(lhs, 7) >> Short(rhs), 7);
2373
2374 return result;
2375 }
2376 else
2377 {
2378 return RValue<Short8>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
2379 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002380 }
2381
2382 RValue<Int4> MulAdd(RValue<Short8> x, RValue<Short8> y)
2383 {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002384 assert(false && "UNIMPLEMENTED"); return RValue<Int4>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002385 }
2386
Nicolas Capens598f8d82016-09-26 15:09:10 -04002387 RValue<Short8> MulHigh(RValue<Short8> x, RValue<Short8> y)
2388 {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002389 assert(false && "UNIMPLEMENTED"); return RValue<Short8>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002390 }
2391
2392 Type *Short8::getType()
2393 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002394 return T(Ice::IceType_v8i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002395 }
2396
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002397 RValue<UShort> Extract(RValue<UShort8> val, int i)
2398 {
2399 return RValue<UShort>(Nucleus::createExtractElement(val.value, UShort::getType(), i));
2400 }
2401
2402 RValue<UShort8> Insert(RValue<UShort8> val, RValue<UShort> element, int i)
2403 {
2404 return RValue<UShort8>(Nucleus::createInsertElement(val.value, element.value, i));
2405 }
2406
Nicolas Capens598f8d82016-09-26 15:09:10 -04002407 RValue<UShort8> operator<<(RValue<UShort8> lhs, unsigned char rhs)
2408 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002409 if(emulateIntrinsics)
2410 {
2411 UShort8 result;
2412 result = Insert(result, Extract(lhs, 0) << UShort(rhs), 0);
2413 result = Insert(result, Extract(lhs, 1) << UShort(rhs), 1);
2414 result = Insert(result, Extract(lhs, 2) << UShort(rhs), 2);
2415 result = Insert(result, Extract(lhs, 3) << UShort(rhs), 3);
2416 result = Insert(result, Extract(lhs, 4) << UShort(rhs), 4);
2417 result = Insert(result, Extract(lhs, 5) << UShort(rhs), 5);
2418 result = Insert(result, Extract(lhs, 6) << UShort(rhs), 6);
2419 result = Insert(result, Extract(lhs, 7) << UShort(rhs), 7);
2420
2421 return result;
2422 }
2423 else
2424 {
2425 return RValue<UShort8>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2426 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002427 }
2428
2429 RValue<UShort8> operator>>(RValue<UShort8> lhs, unsigned char rhs)
2430 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002431 if(emulateIntrinsics)
2432 {
2433 UShort8 result;
2434 result = Insert(result, Extract(lhs, 0) >> UShort(rhs), 0);
2435 result = Insert(result, Extract(lhs, 1) >> UShort(rhs), 1);
2436 result = Insert(result, Extract(lhs, 2) >> UShort(rhs), 2);
2437 result = Insert(result, Extract(lhs, 3) >> UShort(rhs), 3);
2438 result = Insert(result, Extract(lhs, 4) >> UShort(rhs), 4);
2439 result = Insert(result, Extract(lhs, 5) >> UShort(rhs), 5);
2440 result = Insert(result, Extract(lhs, 6) >> UShort(rhs), 6);
2441 result = Insert(result, Extract(lhs, 7) >> UShort(rhs), 7);
2442
2443 return result;
2444 }
2445 else
2446 {
2447 return RValue<UShort8>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2448 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002449 }
2450
Nicolas Capens598f8d82016-09-26 15:09:10 -04002451 RValue<UShort8> Swizzle(RValue<UShort8> x, char select0, char select1, char select2, char select3, char select4, char select5, char select6, char select7)
2452 {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002453 assert(false && "UNIMPLEMENTED"); return RValue<UShort8>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002454 }
2455
2456 RValue<UShort8> MulHigh(RValue<UShort8> x, RValue<UShort8> y)
2457 {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002458 assert(false && "UNIMPLEMENTED"); return RValue<UShort8>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002459 }
2460
2461 // FIXME: Implement as Shuffle(x, y, Select(i0, ..., i16)) and Shuffle(x, y, SELECT_PACK_REPEAT(element))
2462// RValue<UShort8> PackRepeat(RValue<Byte16> x, RValue<Byte16> y, int element)
2463// {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002464// assert(false && "UNIMPLEMENTED"); return RValue<UShort8>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002465// }
2466
2467 Type *UShort8::getType()
2468 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002469 return T(Ice::IceType_v8i16);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002470 }
2471
Nicolas Capens96d4e092016-11-18 14:22:38 -05002472 RValue<Int> operator++(Int &val, int) // Post-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002473 {
Nicolas Capens5b41ba32016-12-08 14:34:00 -05002474 RValue<Int> res = val;
Nicolas Capensd1229402016-11-07 16:05:22 -05002475 val += 1;
2476 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002477 }
2478
Nicolas Capens96d4e092016-11-18 14:22:38 -05002479 const Int &operator++(Int &val) // Pre-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002480 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002481 val += 1;
2482 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002483 }
2484
Nicolas Capens96d4e092016-11-18 14:22:38 -05002485 RValue<Int> operator--(Int &val, int) // Post-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002486 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002487 RValue<Int> res = val;
2488 val -= 1;
2489 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002490 }
2491
Nicolas Capens96d4e092016-11-18 14:22:38 -05002492 const Int &operator--(Int &val) // Pre-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002493 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002494 val -= 1;
2495 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002496 }
2497
Nicolas Capens598f8d82016-09-26 15:09:10 -04002498 RValue<Int> RoundInt(RValue<Float> cast)
2499 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002500 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensf7b75882017-04-26 09:30:47 -04002501 {
2502 // Push the fractional part off the mantissa. Accurate up to +/-2^22.
2503 return Int((cast + Float(0x00C00000)) - Float(0x00C00000));
2504 }
2505 else
2506 {
2507 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
2508 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Nearbyint, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2509 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2510 auto nearbyint = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
2511 nearbyint->addArg(cast.value);
2512 ::basicBlock->appendInst(nearbyint);
Nicolas Capensa8086512016-11-07 17:32:17 -05002513
Nicolas Capensf7b75882017-04-26 09:30:47 -04002514 return RValue<Int>(V(result));
2515 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002516 }
2517
2518 Type *Int::getType()
2519 {
2520 return T(Ice::IceType_i32);
2521 }
2522
Nicolas Capens598f8d82016-09-26 15:09:10 -04002523 Type *Long::getType()
2524 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002525 return T(Ice::IceType_i64);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002526 }
2527
Nicolas Capens598f8d82016-09-26 15:09:10 -04002528 UInt::UInt(RValue<Float> cast)
2529 {
Nicolas Capensc70a1162016-12-03 00:16:14 -05002530 // Smallest positive value representable in UInt, but not in Int
2531 const unsigned int ustart = 0x80000000u;
2532 const float ustartf = float(ustart);
2533
2534 // If the value is negative, store 0, otherwise store the result of the conversion
2535 storeValue((~(As<Int>(cast) >> 31) &
2536 // Check if the value can be represented as an Int
2537 IfThenElse(cast >= ustartf,
2538 // If the value is too large, subtract ustart and re-add it after conversion.
2539 As<Int>(As<UInt>(Int(cast - Float(ustartf))) + UInt(ustart)),
2540 // Otherwise, just convert normally
2541 Int(cast))).value);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002542 }
2543
Nicolas Capens96d4e092016-11-18 14:22:38 -05002544 RValue<UInt> operator++(UInt &val, int) // Post-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002545 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002546 RValue<UInt> res = val;
2547 val += 1;
2548 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002549 }
2550
Nicolas Capens96d4e092016-11-18 14:22:38 -05002551 const UInt &operator++(UInt &val) // Pre-increment
Nicolas Capens598f8d82016-09-26 15:09:10 -04002552 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002553 val += 1;
2554 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002555 }
2556
Nicolas Capens96d4e092016-11-18 14:22:38 -05002557 RValue<UInt> operator--(UInt &val, int) // Post-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002558 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002559 RValue<UInt> res = val;
2560 val -= 1;
2561 return res;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002562 }
2563
Nicolas Capens96d4e092016-11-18 14:22:38 -05002564 const UInt &operator--(UInt &val) // Pre-decrement
Nicolas Capens598f8d82016-09-26 15:09:10 -04002565 {
Nicolas Capensd1229402016-11-07 16:05:22 -05002566 val -= 1;
2567 return val;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002568 }
2569
Nicolas Capens598f8d82016-09-26 15:09:10 -04002570// RValue<UInt> RoundUInt(RValue<Float> cast)
2571// {
Nicolas Capensc37252c2016-09-28 16:11:54 -04002572// assert(false && "UNIMPLEMENTED"); return RValue<UInt>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002573// }
2574
2575 Type *UInt::getType()
2576 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002577 return T(Ice::IceType_i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002578 }
2579
2580// Int2::Int2(RValue<Int> cast)
2581// {
2582// Value *extend = Nucleus::createZExt(cast.value, Long::getType());
2583// Value *vector = Nucleus::createBitCast(extend, Int2::getType());
2584//
2585// Constant *shuffle[2];
2586// shuffle[0] = Nucleus::createConstantInt(0);
2587// shuffle[1] = Nucleus::createConstantInt(0);
2588//
2589// Value *replicate = Nucleus::createShuffleVector(vector, UndefValue::get(Int2::getType()), Nucleus::createConstantVector(shuffle, 2));
2590//
2591// storeValue(replicate);
2592// }
2593
Nicolas Capens598f8d82016-09-26 15:09:10 -04002594 RValue<Int2> operator<<(RValue<Int2> lhs, unsigned char rhs)
2595 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002596 if(emulateIntrinsics)
2597 {
2598 Int2 result;
2599 result = Insert(result, Extract(lhs, 0) << Int(rhs), 0);
2600 result = Insert(result, Extract(lhs, 1) << Int(rhs), 1);
2601
2602 return result;
2603 }
2604 else
2605 {
2606 return RValue<Int2>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2607 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002608 }
2609
2610 RValue<Int2> operator>>(RValue<Int2> lhs, unsigned char rhs)
2611 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002612 if(emulateIntrinsics)
2613 {
2614 Int2 result;
2615 result = Insert(result, Extract(lhs, 0) >> Int(rhs), 0);
2616 result = Insert(result, Extract(lhs, 1) >> Int(rhs), 1);
2617
2618 return result;
2619 }
2620 else
2621 {
2622 return RValue<Int2>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
2623 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002624 }
2625
Nicolas Capens598f8d82016-09-26 15:09:10 -04002626 Type *Int2::getType()
2627 {
Nicolas Capens8dfd9a72016-10-13 17:44:51 -04002628 return T(Type_v2i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002629 }
2630
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002631 RValue<UInt> Extract(RValue<UInt2> val, int i)
2632 {
2633 return RValue<UInt>(Nucleus::createExtractElement(val.value, UInt::getType(), i));
2634 }
2635
2636 RValue<UInt2> Insert(RValue<UInt2> val, RValue<UInt> element, int i)
2637 {
2638 return RValue<UInt2>(Nucleus::createInsertElement(val.value, element.value, i));
2639 }
2640
Nicolas Capens598f8d82016-09-26 15:09:10 -04002641 RValue<UInt2> operator<<(RValue<UInt2> lhs, unsigned char rhs)
2642 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002643 if(emulateIntrinsics)
2644 {
2645 UInt2 result;
2646 result = Insert(result, Extract(lhs, 0) << UInt(rhs), 0);
2647 result = Insert(result, Extract(lhs, 1) << UInt(rhs), 1);
2648
2649 return result;
2650 }
2651 else
2652 {
2653 return RValue<UInt2>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2654 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002655 }
2656
2657 RValue<UInt2> operator>>(RValue<UInt2> lhs, unsigned char rhs)
2658 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002659 if(emulateIntrinsics)
2660 {
2661 UInt2 result;
2662 result = Insert(result, Extract(lhs, 0) >> UInt(rhs), 0);
2663 result = Insert(result, Extract(lhs, 1) >> UInt(rhs), 1);
2664
2665 return result;
2666 }
2667 else
2668 {
2669 return RValue<UInt2>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2670 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002671 }
2672
Nicolas Capens598f8d82016-09-26 15:09:10 -04002673 Type *UInt2::getType()
2674 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04002675 return T(Type_v2i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002676 }
2677
Nicolas Capenscb986762017-01-20 11:34:37 -05002678 Int4::Int4(RValue<Byte4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002679 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002680 Value *x = Nucleus::createBitCast(cast.value, Int::getType());
2681 Value *a = Nucleus::createInsertElement(loadValue(), x, 0);
2682
2683 Value *e;
2684 int swizzle[16] = {0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23};
2685 Value *b = Nucleus::createBitCast(a, Byte16::getType());
2686 Value *c = Nucleus::createShuffleVector(b, V(Nucleus::createNullValue(Byte16::getType())), swizzle);
2687
2688 int swizzle2[8] = {0, 8, 1, 9, 2, 10, 3, 11};
2689 Value *d = Nucleus::createBitCast(c, Short8::getType());
2690 e = Nucleus::createShuffleVector(d, V(Nucleus::createNullValue(Short8::getType())), swizzle2);
2691
2692 Value *f = Nucleus::createBitCast(e, Int4::getType());
2693 storeValue(f);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002694 }
2695
Nicolas Capenscb986762017-01-20 11:34:37 -05002696 Int4::Int4(RValue<SByte4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002697 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002698 Value *x = Nucleus::createBitCast(cast.value, Int::getType());
2699 Value *a = Nucleus::createInsertElement(loadValue(), x, 0);
2700
Nicolas Capensd4227962016-11-09 14:24:25 -05002701 int swizzle[16] = {0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7};
2702 Value *b = Nucleus::createBitCast(a, Byte16::getType());
2703 Value *c = Nucleus::createShuffleVector(b, b, swizzle);
2704
2705 int swizzle2[8] = {0, 0, 1, 1, 2, 2, 3, 3};
2706 Value *d = Nucleus::createBitCast(c, Short8::getType());
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002707 Value *e = Nucleus::createShuffleVector(d, d, swizzle2);
Nicolas Capensd4227962016-11-09 14:24:25 -05002708
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002709 *this = As<Int4>(e) >> 24;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002710 }
2711
Nicolas Capenscb986762017-01-20 11:34:37 -05002712 Int4::Int4(RValue<Short4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002713 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002714 int swizzle[8] = {0, 0, 1, 1, 2, 2, 3, 3};
2715 Value *c = Nucleus::createShuffleVector(cast.value, cast.value, swizzle);
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002716
2717 *this = As<Int4>(c) >> 16;
Nicolas Capens598f8d82016-09-26 15:09:10 -04002718 }
2719
Nicolas Capenscb986762017-01-20 11:34:37 -05002720 Int4::Int4(RValue<UShort4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002721 {
Nicolas Capensd4227962016-11-09 14:24:25 -05002722 int swizzle[8] = {0, 8, 1, 9, 2, 10, 3, 11};
2723 Value *c = Nucleus::createShuffleVector(cast.value, Short8(0, 0, 0, 0, 0, 0, 0, 0).loadValue(), swizzle);
2724 Value *d = Nucleus::createBitCast(c, Int4::getType());
2725 storeValue(d);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002726 }
2727
Nicolas Capenscb986762017-01-20 11:34:37 -05002728 Int4::Int4(RValue<Int> rhs) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002729 {
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08002730 Value *vector = Nucleus::createBitCast(rhs.value, Int4::getType());
Nicolas Capensd4227962016-11-09 14:24:25 -05002731
2732 int swizzle[4] = {0, 0, 0, 0};
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08002733 Value *replicate = Nucleus::createShuffleVector(vector, vector, swizzle);
Nicolas Capensd4227962016-11-09 14:24:25 -05002734
2735 storeValue(replicate);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002736 }
2737
Nicolas Capens598f8d82016-09-26 15:09:10 -04002738 RValue<Int4> operator<<(RValue<Int4> lhs, unsigned char rhs)
2739 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002740 if(emulateIntrinsics)
2741 {
2742 Int4 result;
2743 result = Insert(result, Extract(lhs, 0) << Int(rhs), 0);
2744 result = Insert(result, Extract(lhs, 1) << Int(rhs), 1);
2745 result = Insert(result, Extract(lhs, 2) << Int(rhs), 2);
2746 result = Insert(result, Extract(lhs, 3) << Int(rhs), 3);
2747
2748 return result;
2749 }
2750 else
2751 {
2752 return RValue<Int4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2753 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002754 }
2755
2756 RValue<Int4> operator>>(RValue<Int4> lhs, unsigned char rhs)
2757 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002758 if(emulateIntrinsics)
2759 {
2760 Int4 result;
2761 result = Insert(result, Extract(lhs, 0) >> Int(rhs), 0);
2762 result = Insert(result, Extract(lhs, 1) >> Int(rhs), 1);
2763 result = Insert(result, Extract(lhs, 2) >> Int(rhs), 2);
2764 result = Insert(result, Extract(lhs, 3) >> Int(rhs), 3);
2765
2766 return result;
2767 }
2768 else
2769 {
2770 return RValue<Int4>(Nucleus::createAShr(lhs.value, V(::context->getConstantInt32(rhs))));
2771 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002772 }
2773
Nicolas Capens598f8d82016-09-26 15:09:10 -04002774 RValue<Int4> CmpEQ(RValue<Int4> x, RValue<Int4> y)
2775 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002776 return RValue<Int4>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002777 }
2778
2779 RValue<Int4> CmpLT(RValue<Int4> x, RValue<Int4> y)
2780 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002781 return RValue<Int4>(Nucleus::createICmpSLT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002782 }
2783
2784 RValue<Int4> CmpLE(RValue<Int4> x, RValue<Int4> y)
2785 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002786 return RValue<Int4>(Nucleus::createICmpSLE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002787 }
2788
2789 RValue<Int4> CmpNEQ(RValue<Int4> x, RValue<Int4> y)
2790 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002791 return RValue<Int4>(Nucleus::createICmpNE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002792 }
2793
2794 RValue<Int4> CmpNLT(RValue<Int4> x, RValue<Int4> y)
2795 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002796 return RValue<Int4>(Nucleus::createICmpSGE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002797 }
2798
2799 RValue<Int4> CmpNLE(RValue<Int4> x, RValue<Int4> y)
2800 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002801 return RValue<Int4>(Nucleus::createICmpSGT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002802 }
2803
2804 RValue<Int4> Max(RValue<Int4> x, RValue<Int4> y)
2805 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002806 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
2807 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sle, condition, x.value, y.value);
2808 ::basicBlock->appendInst(cmp);
2809
2810 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
2811 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2812 ::basicBlock->appendInst(select);
2813
2814 return RValue<Int4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002815 }
2816
2817 RValue<Int4> Min(RValue<Int4> x, RValue<Int4> y)
2818 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04002819 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
2820 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sgt, condition, x.value, y.value);
2821 ::basicBlock->appendInst(cmp);
2822
2823 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
2824 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
2825 ::basicBlock->appendInst(select);
2826
2827 return RValue<Int4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002828 }
2829
2830 RValue<Int4> RoundInt(RValue<Float4> cast)
2831 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002832 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensf7b75882017-04-26 09:30:47 -04002833 {
2834 // Push the fractional part off the mantissa. Accurate up to +/-2^22.
2835 return Int4((cast + Float4(0x00C00000)) - Float4(0x00C00000));
2836 }
2837 else
2838 {
2839 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
2840 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Nearbyint, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2841 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2842 auto nearbyint = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
2843 nearbyint->addArg(cast.value);
2844 ::basicBlock->appendInst(nearbyint);
Nicolas Capensa8086512016-11-07 17:32:17 -05002845
Nicolas Capensf7b75882017-04-26 09:30:47 -04002846 return RValue<Int4>(V(result));
2847 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002848 }
2849
Nicolas Capens33438a62017-09-27 11:47:35 -04002850 RValue<Short8> PackSigned(RValue<Int4> x, RValue<Int4> y)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002851 {
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002852 if(emulateIntrinsics)
2853 {
2854 Short8 result;
Nicolas Capens33438a62017-09-27 11:47:35 -04002855 result = Insert(result, SaturateSigned(Extract(x, 0)), 0);
2856 result = Insert(result, SaturateSigned(Extract(x, 1)), 1);
2857 result = Insert(result, SaturateSigned(Extract(x, 2)), 2);
2858 result = Insert(result, SaturateSigned(Extract(x, 3)), 3);
2859 result = Insert(result, SaturateSigned(Extract(y, 0)), 4);
2860 result = Insert(result, SaturateSigned(Extract(y, 1)), 5);
2861 result = Insert(result, SaturateSigned(Extract(y, 2)), 6);
2862 result = Insert(result, SaturateSigned(Extract(y, 3)), 7);
Nicolas Capensec54a172016-10-25 17:32:37 -04002863
Nicolas Capens8960fbf2017-07-25 15:32:12 -04002864 return result;
2865 }
2866 else
2867 {
2868 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2869 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackSigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2870 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2871 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2872 pack->addArg(x.value);
2873 pack->addArg(y.value);
2874 ::basicBlock->appendInst(pack);
2875
2876 return RValue<Short8>(V(result));
2877 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002878 }
2879
Nicolas Capens33438a62017-09-27 11:47:35 -04002880 RValue<UShort8> PackUnsigned(RValue<Int4> x, RValue<Int4> y)
2881 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002882 if(emulateIntrinsics || !(CPUID::SSE4_1 || CPUID::ARM))
2883 {
2884 RValue<Int4> sx = As<Int4>(x);
2885 RValue<Int4> bx = (sx & ~(sx >> 31)) - Int4(0x8000);
2886
2887 RValue<Int4> sy = As<Int4>(y);
2888 RValue<Int4> by = (sy & ~(sy >> 31)) - Int4(0x8000);
2889
2890 return As<UShort8>(PackSigned(bx, by) + Short8(0x8000u));
2891 }
2892 else
Nicolas Capens33438a62017-09-27 11:47:35 -04002893 {
2894 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v8i16);
2895 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::VectorPackUnsigned, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2896 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2897 auto pack = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
2898 pack->addArg(x.value);
2899 pack->addArg(y.value);
2900 ::basicBlock->appendInst(pack);
2901
2902 return RValue<UShort8>(V(result));
2903 }
Nicolas Capens33438a62017-09-27 11:47:35 -04002904 }
2905
Nicolas Capens598f8d82016-09-26 15:09:10 -04002906 RValue<Int> SignMask(RValue<Int4> x)
2907 {
Nicolas Capens091f3502017-10-03 14:56:49 -04002908 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04002909 {
2910 Int4 xx = (x >> 31) & Int4(0x00000001, 0x00000002, 0x00000004, 0x00000008);
2911 return Extract(xx, 0) | Extract(xx, 1) | Extract(xx, 2) | Extract(xx, 3);
2912 }
2913 else
2914 {
2915 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
2916 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
2917 auto target = ::context->getConstantUndef(Ice::IceType_i32);
2918 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
2919 movmsk->addArg(x.value);
2920 ::basicBlock->appendInst(movmsk);
Nicolas Capensf2cb9df2016-10-21 17:26:13 -04002921
Nicolas Capensd6cacad2017-07-25 15:32:12 -04002922 return RValue<Int>(V(result));
2923 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002924 }
2925
Nicolas Capens598f8d82016-09-26 15:09:10 -04002926 Type *Int4::getType()
2927 {
Nicolas Capens23d99a42016-09-30 14:57:16 -04002928 return T(Ice::IceType_v4i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002929 }
2930
Nicolas Capenscb986762017-01-20 11:34:37 -05002931 UInt4::UInt4(RValue<Float4> cast) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04002932 {
Nicolas Capensc70a1162016-12-03 00:16:14 -05002933 // Smallest positive value representable in UInt, but not in Int
2934 const unsigned int ustart = 0x80000000u;
2935 const float ustartf = float(ustart);
2936
2937 // Check if the value can be represented as an Int
2938 Int4 uiValue = CmpNLT(cast, Float4(ustartf));
2939 // If the value is too large, subtract ustart and re-add it after conversion.
2940 uiValue = (uiValue & As<Int4>(As<UInt4>(Int4(cast - Float4(ustartf))) + UInt4(ustart))) |
2941 // Otherwise, just convert normally
2942 (~uiValue & Int4(cast));
2943 // If the value is negative, store 0, otherwise store the result of the conversion
2944 storeValue((~(As<Int4>(cast) >> 31) & uiValue).value);
Nicolas Capens598f8d82016-09-26 15:09:10 -04002945 }
2946
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002947 RValue<UInt> Extract(RValue<UInt4> x, int i)
2948 {
2949 return RValue<UInt>(Nucleus::createExtractElement(x.value, UInt::getType(), i));
2950 }
2951
2952 RValue<UInt4> Insert(RValue<UInt4> x, RValue<UInt> element, int i)
2953 {
2954 return RValue<UInt4>(Nucleus::createInsertElement(x.value, element.value, i));
2955 }
2956
Nicolas Capens598f8d82016-09-26 15:09:10 -04002957 RValue<UInt4> operator<<(RValue<UInt4> lhs, unsigned char rhs)
2958 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002959 if(emulateIntrinsics)
2960 {
2961 UInt4 result;
2962 result = Insert(result, Extract(lhs, 0) << UInt(rhs), 0);
2963 result = Insert(result, Extract(lhs, 1) << UInt(rhs), 1);
2964 result = Insert(result, Extract(lhs, 2) << UInt(rhs), 2);
2965 result = Insert(result, Extract(lhs, 3) << UInt(rhs), 3);
2966
2967 return result;
2968 }
2969 else
2970 {
2971 return RValue<UInt4>(Nucleus::createShl(lhs.value, V(::context->getConstantInt32(rhs))));
2972 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002973 }
2974
2975 RValue<UInt4> operator>>(RValue<UInt4> lhs, unsigned char rhs)
2976 {
Nicolas Capens8be6c7b2017-07-25 15:32:12 -04002977 if(emulateIntrinsics)
2978 {
2979 UInt4 result;
2980 result = Insert(result, Extract(lhs, 0) >> UInt(rhs), 0);
2981 result = Insert(result, Extract(lhs, 1) >> UInt(rhs), 1);
2982 result = Insert(result, Extract(lhs, 2) >> UInt(rhs), 2);
2983 result = Insert(result, Extract(lhs, 3) >> UInt(rhs), 3);
2984
2985 return result;
2986 }
2987 else
2988 {
2989 return RValue<UInt4>(Nucleus::createLShr(lhs.value, V(::context->getConstantInt32(rhs))));
2990 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04002991 }
2992
Nicolas Capens598f8d82016-09-26 15:09:10 -04002993 RValue<UInt4> CmpEQ(RValue<UInt4> x, RValue<UInt4> y)
2994 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05002995 return RValue<UInt4>(Nucleus::createICmpEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04002996 }
2997
2998 RValue<UInt4> CmpLT(RValue<UInt4> x, RValue<UInt4> y)
2999 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003000 return RValue<UInt4>(Nucleus::createICmpULT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003001 }
3002
3003 RValue<UInt4> CmpLE(RValue<UInt4> x, RValue<UInt4> y)
3004 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003005 return RValue<UInt4>(Nucleus::createICmpULE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003006 }
3007
3008 RValue<UInt4> CmpNEQ(RValue<UInt4> x, RValue<UInt4> y)
3009 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003010 return RValue<UInt4>(Nucleus::createICmpNE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003011 }
3012
3013 RValue<UInt4> CmpNLT(RValue<UInt4> x, RValue<UInt4> y)
3014 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003015 return RValue<UInt4>(Nucleus::createICmpUGE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003016 }
3017
3018 RValue<UInt4> CmpNLE(RValue<UInt4> x, RValue<UInt4> y)
3019 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003020 return RValue<UInt4>(Nucleus::createICmpUGT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003021 }
3022
3023 RValue<UInt4> Max(RValue<UInt4> x, RValue<UInt4> y)
3024 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003025 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
3026 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ule, condition, x.value, y.value);
3027 ::basicBlock->appendInst(cmp);
3028
3029 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
3030 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
3031 ::basicBlock->appendInst(select);
3032
3033 return RValue<UInt4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003034 }
3035
3036 RValue<UInt4> Min(RValue<UInt4> x, RValue<UInt4> y)
3037 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003038 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
3039 auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ugt, condition, x.value, y.value);
3040 ::basicBlock->appendInst(cmp);
3041
3042 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4i32);
3043 auto select = Ice::InstSelect::create(::function, result, condition, y.value, x.value);
3044 ::basicBlock->appendInst(select);
3045
3046 return RValue<UInt4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003047 }
3048
Nicolas Capens598f8d82016-09-26 15:09:10 -04003049 Type *UInt4::getType()
3050 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04003051 return T(Ice::IceType_v4i32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003052 }
3053
Ben Claytonec1aeb82019-03-04 19:33:27 +00003054 Type *Half::getType()
3055 {
3056 return T(Ice::IceType_i16);
3057 }
Alexis Hetu734e2572018-12-20 14:00:49 -05003058
Nicolas Capens598f8d82016-09-26 15:09:10 -04003059 RValue<Float> Rcp_pp(RValue<Float> x, bool exactAtPow2)
3060 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003061 return 1.0f / x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003062 }
3063
3064 RValue<Float> RcpSqrt_pp(RValue<Float> x)
3065 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003066 return Rcp_pp(Sqrt(x));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003067 }
3068
3069 RValue<Float> Sqrt(RValue<Float> x)
3070 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003071 Ice::Variable *result = ::function->makeVariable(Ice::IceType_f32);
3072 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Sqrt, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3073 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3074 auto sqrt = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
3075 sqrt->addArg(x.value);
3076 ::basicBlock->appendInst(sqrt);
3077
3078 return RValue<Float>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003079 }
3080
3081 RValue<Float> Round(RValue<Float> x)
3082 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003083 return Float4(Round(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003084 }
3085
3086 RValue<Float> Trunc(RValue<Float> x)
3087 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003088 return Float4(Trunc(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003089 }
3090
3091 RValue<Float> Frac(RValue<Float> x)
3092 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003093 return Float4(Frac(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003094 }
3095
3096 RValue<Float> Floor(RValue<Float> x)
3097 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003098 return Float4(Floor(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003099 }
3100
3101 RValue<Float> Ceil(RValue<Float> x)
3102 {
Nicolas Capensa8086512016-11-07 17:32:17 -05003103 return Float4(Ceil(Float4(x))).x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003104 }
3105
3106 Type *Float::getType()
3107 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04003108 return T(Ice::IceType_f32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003109 }
3110
Nicolas Capens598f8d82016-09-26 15:09:10 -04003111 Type *Float2::getType()
3112 {
Nicolas Capens4cfd4572016-10-20 01:00:19 -04003113 return T(Type_v2f32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003114 }
3115
Nicolas Capenscb986762017-01-20 11:34:37 -05003116 Float4::Float4(RValue<Float> rhs) : XYZW(this)
Nicolas Capens598f8d82016-09-26 15:09:10 -04003117 {
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08003118 Value *vector = Nucleus::createBitCast(rhs.value, Float4::getType());
Nicolas Capensd4227962016-11-09 14:24:25 -05003119
3120 int swizzle[4] = {0, 0, 0, 0};
Nicolas Capensf8beb4b2017-01-27 02:55:44 -08003121 Value *replicate = Nucleus::createShuffleVector(vector, vector, swizzle);
Nicolas Capensd4227962016-11-09 14:24:25 -05003122
3123 storeValue(replicate);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003124 }
3125
Nicolas Capens598f8d82016-09-26 15:09:10 -04003126 RValue<Float4> Max(RValue<Float4> x, RValue<Float4> y)
3127 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003128 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003129 auto cmp = Ice::InstFcmp::create(::function, Ice::InstFcmp::Ogt, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003130 ::basicBlock->appendInst(cmp);
3131
3132 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003133 auto select = Ice::InstSelect::create(::function, result, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003134 ::basicBlock->appendInst(select);
3135
3136 return RValue<Float4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003137 }
3138
3139 RValue<Float4> Min(RValue<Float4> x, RValue<Float4> y)
3140 {
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003141 Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003142 auto cmp = Ice::InstFcmp::create(::function, Ice::InstFcmp::Olt, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003143 ::basicBlock->appendInst(cmp);
3144
3145 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
Nicolas Capens5cdb91a2017-02-13 12:39:18 -05003146 auto select = Ice::InstSelect::create(::function, result, condition, x.value, y.value);
Nicolas Capens53a8a3f2016-10-26 00:23:12 -04003147 ::basicBlock->appendInst(select);
3148
3149 return RValue<Float4>(V(result));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003150 }
3151
3152 RValue<Float4> Rcp_pp(RValue<Float4> x, bool exactAtPow2)
3153 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003154 return Float4(1.0f) / x;
Nicolas Capens598f8d82016-09-26 15:09:10 -04003155 }
3156
3157 RValue<Float4> RcpSqrt_pp(RValue<Float4> x)
3158 {
Nicolas Capensd52e9362016-10-31 23:23:15 -04003159 return Rcp_pp(Sqrt(x));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003160 }
3161
3162 RValue<Float4> Sqrt(RValue<Float4> x)
3163 {
Nicolas Capens091f3502017-10-03 14:56:49 -04003164 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capens9f737d32017-07-25 17:26:14 -04003165 {
3166 Float4 result;
3167 result.x = Sqrt(Float(Float4(x).x));
3168 result.y = Sqrt(Float(Float4(x).y));
3169 result.z = Sqrt(Float(Float4(x).z));
3170 result.w = Sqrt(Float(Float4(x).w));
Nicolas Capensd52e9362016-10-31 23:23:15 -04003171
Nicolas Capens9f737d32017-07-25 17:26:14 -04003172 return result;
3173 }
3174 else
3175 {
3176 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3177 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Sqrt, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3178 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3179 auto sqrt = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
3180 sqrt->addArg(x.value);
3181 ::basicBlock->appendInst(sqrt);
3182
3183 return RValue<Float4>(V(result));
3184 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003185 }
3186
Nicolas Capens598f8d82016-09-26 15:09:10 -04003187 RValue<Int> SignMask(RValue<Float4> x)
3188 {
Nicolas Capens091f3502017-10-03 14:56:49 -04003189 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensd6cacad2017-07-25 15:32:12 -04003190 {
3191 Int4 xx = (As<Int4>(x) >> 31) & Int4(0x00000001, 0x00000002, 0x00000004, 0x00000008);
3192 return Extract(xx, 0) | Extract(xx, 1) | Extract(xx, 2) | Extract(xx, 3);
3193 }
3194 else
3195 {
3196 Ice::Variable *result = ::function->makeVariable(Ice::IceType_i32);
3197 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::SignMask, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3198 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3199 auto movmsk = Ice::InstIntrinsicCall::create(::function, 1, result, target, intrinsic);
3200 movmsk->addArg(x.value);
3201 ::basicBlock->appendInst(movmsk);
Nicolas Capensf2cb9df2016-10-21 17:26:13 -04003202
Nicolas Capensd6cacad2017-07-25 15:32:12 -04003203 return RValue<Int>(V(result));
3204 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003205 }
3206
3207 RValue<Int4> CmpEQ(RValue<Float4> x, RValue<Float4> y)
3208 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003209 return RValue<Int4>(Nucleus::createFCmpOEQ(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003210 }
3211
3212 RValue<Int4> CmpLT(RValue<Float4> x, RValue<Float4> y)
3213 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003214 return RValue<Int4>(Nucleus::createFCmpOLT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003215 }
3216
3217 RValue<Int4> CmpLE(RValue<Float4> x, RValue<Float4> y)
3218 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003219 return RValue<Int4>(Nucleus::createFCmpOLE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003220 }
3221
3222 RValue<Int4> CmpNEQ(RValue<Float4> x, RValue<Float4> y)
3223 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003224 return RValue<Int4>(Nucleus::createFCmpONE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003225 }
3226
3227 RValue<Int4> CmpNLT(RValue<Float4> x, RValue<Float4> y)
3228 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003229 return RValue<Int4>(Nucleus::createFCmpOGE(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003230 }
3231
3232 RValue<Int4> CmpNLE(RValue<Float4> x, RValue<Float4> y)
3233 {
Nicolas Capens5e6ca092017-01-13 15:09:21 -05003234 return RValue<Int4>(Nucleus::createFCmpOGT(x.value, y.value));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003235 }
3236
Ben Claytonec1aeb82019-03-04 19:33:27 +00003237 RValue<Int4> CmpUEQ(RValue<Float4> x, RValue<Float4> y)
3238 {
3239 return RValue<Int4>(Nucleus::createFCmpUEQ(x.value, y.value));
3240 }
3241
3242 RValue<Int4> CmpULT(RValue<Float4> x, RValue<Float4> y)
3243 {
3244 return RValue<Int4>(Nucleus::createFCmpULT(x.value, y.value));
3245 }
3246
3247 RValue<Int4> CmpULE(RValue<Float4> x, RValue<Float4> y)
3248 {
3249 return RValue<Int4>(Nucleus::createFCmpULE(x.value, y.value));
3250 }
3251
3252 RValue<Int4> CmpUNEQ(RValue<Float4> x, RValue<Float4> y)
3253 {
3254 return RValue<Int4>(Nucleus::createFCmpUNE(x.value, y.value));
3255 }
3256
3257 RValue<Int4> CmpUNLT(RValue<Float4> x, RValue<Float4> y)
3258 {
3259 return RValue<Int4>(Nucleus::createFCmpUGE(x.value, y.value));
3260 }
3261
3262 RValue<Int4> CmpUNLE(RValue<Float4> x, RValue<Float4> y)
3263 {
3264 return RValue<Int4>(Nucleus::createFCmpUGT(x.value, y.value));
3265 }
3266
Nicolas Capens598f8d82016-09-26 15:09:10 -04003267 RValue<Float4> Round(RValue<Float4> x)
3268 {
Nicolas Capens091f3502017-10-03 14:56:49 -04003269 if(emulateIntrinsics || CPUID::ARM)
Nicolas Capensf7b75882017-04-26 09:30:47 -04003270 {
3271 // Push the fractional part off the mantissa. Accurate up to +/-2^22.
3272 return (x + Float4(0x00C00000)) - Float4(0x00C00000);
3273 }
3274 else if(CPUID::SSE4_1)
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003275 {
3276 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3277 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3278 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3279 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3280 round->addArg(x.value);
3281 round->addArg(::context->getConstantInt32(0));
3282 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003283
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003284 return RValue<Float4>(V(result));
3285 }
3286 else
3287 {
3288 return Float4(RoundInt(x));
3289 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003290 }
3291
3292 RValue<Float4> Trunc(RValue<Float4> x)
3293 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003294 if(CPUID::SSE4_1)
3295 {
3296 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3297 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3298 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3299 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3300 round->addArg(x.value);
3301 round->addArg(::context->getConstantInt32(3));
3302 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003303
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003304 return RValue<Float4>(V(result));
3305 }
3306 else
3307 {
3308 return Float4(Int4(x));
3309 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003310 }
3311
3312 RValue<Float4> Frac(RValue<Float4> x)
3313 {
Nicolas Capensb9230422017-07-17 10:27:33 -04003314 Float4 frc;
3315
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003316 if(CPUID::SSE4_1)
3317 {
Nicolas Capensb9230422017-07-17 10:27:33 -04003318 frc = x - Floor(x);
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003319 }
3320 else
3321 {
Nicolas Capensb9230422017-07-17 10:27:33 -04003322 frc = x - Float4(Int4(x)); // Signed fractional part.
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003323
Nicolas Capensb9230422017-07-17 10:27:33 -04003324 frc += As<Float4>(As<Int4>(CmpNLE(Float4(0.0f), frc)) & As<Int4>(Float4(1, 1, 1, 1))); // Add 1.0 if negative.
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003325 }
Nicolas Capensb9230422017-07-17 10:27:33 -04003326
3327 // x - floor(x) can be 1.0 for very small negative x.
3328 // Clamp against the value just below 1.0.
3329 return Min(frc, As<Float4>(Int4(0x3F7FFFFF)));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003330 }
3331
3332 RValue<Float4> Floor(RValue<Float4> x)
3333 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003334 if(CPUID::SSE4_1)
3335 {
3336 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3337 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3338 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3339 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3340 round->addArg(x.value);
3341 round->addArg(::context->getConstantInt32(1));
3342 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003343
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003344 return RValue<Float4>(V(result));
3345 }
3346 else
3347 {
3348 return x - Frac(x);
3349 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003350 }
3351
3352 RValue<Float4> Ceil(RValue<Float4> x)
3353 {
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003354 if(CPUID::SSE4_1)
3355 {
3356 Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
3357 const Ice::Intrinsics::IntrinsicInfo intrinsic = {Ice::Intrinsics::Round, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F};
3358 auto target = ::context->getConstantUndef(Ice::IceType_i32);
3359 auto round = Ice::InstIntrinsicCall::create(::function, 2, result, target, intrinsic);
3360 round->addArg(x.value);
3361 round->addArg(::context->getConstantInt32(2));
3362 ::basicBlock->appendInst(round);
Nicolas Capensa8086512016-11-07 17:32:17 -05003363
Nicolas Capens9ca48d52017-01-14 12:52:55 -05003364 return RValue<Float4>(V(result));
3365 }
3366 else
3367 {
3368 return -Floor(-x);
3369 }
Nicolas Capens598f8d82016-09-26 15:09:10 -04003370 }
3371
3372 Type *Float4::getType()
3373 {
Nicolas Capens9709d4f2016-09-30 11:44:14 -04003374 return T(Ice::IceType_v4f32);
Nicolas Capens598f8d82016-09-26 15:09:10 -04003375 }
3376
Nicolas Capens598f8d82016-09-26 15:09:10 -04003377 RValue<Long> Ticks()
3378 {
Nicolas Capensc37252c2016-09-28 16:11:54 -04003379 assert(false && "UNIMPLEMENTED"); return RValue<Long>(V(nullptr));
Nicolas Capens598f8d82016-09-26 15:09:10 -04003380 }
3381}