//===-- JSBackend.cpp - Library for converting LLVM code to JS -----===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements compiling of LLVM IR, which is assumed to have been
// simplified using the PNaCl passes, i64 legalization, and other necessary
// transformations, into JavaScript in asm.js format, suitable for passing
// to emscripten for final processing.
//
//===----------------------------------------------------------------------===//
#include "JSTargetMachine.h"
#include "MCTargetDesc/JSBackendMCTargetDesc.h"
#include "AllocaManager.h"
#include "llvm/Analysis/ValueTracking.h"
#include "llvm/ADT/SmallPtrSet.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/ADT/StringExtras.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/Config/config.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/InlineAsm.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/Intrinsics.h"
#include "llvm/IR/Module.h"
#include "llvm/IR/Operator.h"
#include "llvm/Pass.h"
#include "llvm/IR/LegacyPassManager.h"
#include "llvm/IR/CallSite.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/IR/GetElementPtrTypeIterator.h"
#include "llvm/Support/MathExtras.h"
#include "llvm/Support/TargetRegistry.h"
#include "llvm/IR/DebugInfo.h"
#include "llvm/Transforms/NaCl.h"
#include <algorithm>
#include <cstdio>
#include <map>
#include <set> // TODO: unordered_set?
using namespace llvm;
#include <OptPasses.h>
#include <Relooper.h>
#ifdef NDEBUG
#undef assert
#define assert(x) { if (!(x)) report_fatal_error(#x); }
#endif
raw_ostream &prettyWarning() {
errs().changeColor(raw_ostream::YELLOW);
errs() << "warning:";
errs().resetColor();
errs() << " ";
return errs();
}
static cl::opt<bool>
PreciseF32("emscripten-precise-f32",
cl::desc("Enables Math.fround usage to implement precise float32 semantics and performance (see emscripten PRECISE_F32 option)"),
cl::init(false));
static cl::opt<bool>
EnablePthreads("emscripten-enable-pthreads",
cl::desc("Enables compilation targeting JavaScript Shared Array Buffer and Atomics API to implement support for pthreads-based multithreading"),
cl::init(false));
static cl::opt<bool>
WarnOnUnaligned("emscripten-warn-unaligned",
cl::desc("Warns about unaligned loads and stores (which can negatively affect performance)"),
cl::init(false));
static cl::opt<int>
ReservedFunctionPointers("emscripten-reserved-function-pointers",
cl::desc("Number of reserved slots in function tables for functions to be added at runtime (see emscripten RESERVED_FUNCTION_POINTERS option)"),
cl::init(0));
static cl::opt<bool>
EmulatedFunctionPointers("emscripten-emulated-function-pointers",
cl::desc("Emulate function pointers, avoiding asm.js function tables (see emscripten EMULATED_FUNCTION_POINTERS option)"),
cl::init(false));
static cl::opt<int>
EmscriptenAssertions("emscripten-assertions",
cl::desc("Additional JS-specific assertions (see emscripten ASSERTIONS)"),
cl::init(0));
static cl::opt<bool>
NoAliasingFunctionPointers("emscripten-no-aliasing-function-pointers",
cl::desc("Forces function pointers to not alias (this is more correct, but rarely needed, and has the cost of much larger function tables; it is useful for debugging though; see emscripten ALIASING_FUNCTION_POINTERS option)"),
cl::init(false));
static cl::opt<int>
GlobalBase("emscripten-global-base",
cl::desc("Where global variables start out in memory (see emscripten GLOBAL_BASE option)"),
cl::init(8));
static cl::opt<bool>
Relocatable("emscripten-relocatable",
cl::desc("Whether to emit relocatable code (see emscripten RELOCATABLE option)"),
cl::init(false));
extern "C" void LLVMInitializeJSBackendTarget() {
// Register the target.
RegisterTargetMachine<JSTargetMachine> X(TheJSBackendTarget);
}
namespace {
#define ASM_SIGNED 0
#define ASM_UNSIGNED 1
#define ASM_NONSPECIFIC 2 // nonspecific means we don't differentiate ints: |0 for all, regardless of size and sign
#define ASM_FFI_IN 4 // FFI return values are limited to things that work in ffis
#define ASM_FFI_OUT 8 // params to FFIs are limited to things that work in ffis
#define ASM_MUST_CAST 16 // this value must be explicitly cast (or be an integer constant)
typedef unsigned AsmCast;
typedef std::map<const Value*,std::string> ValueMap;
typedef std::set<std::string> NameSet;
typedef std::set<int> IntSet;
typedef std::vector<unsigned char> HeapData;
typedef std::map<int, HeapData> HeapDataMap;
typedef std::vector<int> AlignedHeapStartMap;
typedef std::pair<unsigned, unsigned> Address;
typedef std::map<std::string, Type *> VarMap;
typedef std::map<std::string, Address> GlobalAddressMap;
typedef std::vector<std::string> FunctionTable;
typedef std::map<std::string, FunctionTable> FunctionTableMap;
typedef std::map<std::string, std::string> StringMap;
typedef std::map<std::string, unsigned> NameIntMap;
typedef std::map<unsigned, unsigned> IntIntMap;
typedef std::map<const BasicBlock*, unsigned> BlockIndexMap;
typedef std::map<const Function*, BlockIndexMap> BlockAddressMap;
typedef std::map<const BasicBlock*, Block*> LLVMToRelooperMap;
/// JSWriter - This class is the main chunk of code that converts an LLVM
/// module to JavaScript.
class JSWriter : public ModulePass {
raw_pwrite_stream &Out;
Module *TheModule;
unsigned UniqueNum;
unsigned NextFunctionIndex; // used with NoAliasingFunctionPointers
ValueMap ValueNames;
VarMap UsedVars;
AllocaManager Allocas;
HeapDataMap GlobalDataMap;
AlignedHeapStartMap AlignedHeapStarts;
GlobalAddressMap GlobalAddresses;
NameSet Externals; // vars
NameSet Declares; // funcs
StringMap Redirects; // library function redirects actually used, needed for wrapper funcs in tables
std::vector<std::string> PostSets;
NameIntMap NamedGlobals; // globals that we export as metadata to JS, so it can access them by name
std::map<std::string, unsigned> IndexedFunctions; // name -> index
FunctionTableMap FunctionTables; // sig => list of functions
std::vector<std::string> GlobalInitializers;
std::vector<std::string> Exports; // additional exports
StringMap Aliases;
BlockAddressMap BlockAddresses;
NameIntMap AsmConsts;
IntIntMap AsmConstArities;
NameSet FuncRelocatableExterns; // which externals are accessed in this function; we load them once at the beginning (avoids a potential call in a heap access, and might be faster)
std::string CantValidate;
bool UsesSIMDInt8x16;
bool UsesSIMDInt16x8;
bool UsesSIMDInt32x4;
bool UsesSIMDFloat32x4;
bool UsesSIMDFloat64x2;
int InvokeState; // cycles between 0, 1 after preInvoke, 2 after call, 0 again after postInvoke. hackish, no argument there.
CodeGenOpt::Level OptLevel;
const DataLayout *DL;
bool StackBumped;
int GlobalBasePadding;
int MaxGlobalAlign;
#include "CallHandlers.h"
public:
static char ID;
JSWriter(raw_pwrite_stream &o, CodeGenOpt::Level OptLevel)
: ModulePass(ID), Out(o), UniqueNum(0), NextFunctionIndex(0), CantValidate(""),
UsesSIMDInt8x16(false), UsesSIMDInt16x8(false), UsesSIMDInt32x4(false),
UsesSIMDFloat32x4(false), UsesSIMDFloat64x2(false), InvokeState(0),
OptLevel(OptLevel), StackBumped(false), GlobalBasePadding(0), MaxGlobalAlign(0) {}
const char *getPassName() const override { return "JavaScript backend"; }
bool runOnModule(Module &M) override;
void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.setPreservesAll();
ModulePass::getAnalysisUsage(AU);
}
void printProgram(const std::string& fname, const std::string& modName );
void printModule(const std::string& fname, const std::string& modName );
void printFunction(const Function *F);
LLVM_ATTRIBUTE_NORETURN void error(const std::string& msg);
raw_pwrite_stream& nl(raw_pwrite_stream &Out, int delta = 0);
private:
void printCommaSeparated(const HeapData v);
// parsing of constants has two phases: calculate, and then emit
void parseConstant(const std::string& name, const Constant* CV, int Alignment, bool calculate);
#define DEFAULT_MEM_ALIGN 8
#define STACK_ALIGN 16
#define STACK_ALIGN_BITS 128
unsigned stackAlign(unsigned x) {
return RoundUpToAlignment(x, STACK_ALIGN);
}
std::string stackAlignStr(std::string x) {
return "((" + x + "+" + utostr(STACK_ALIGN-1) + ")&-" + utostr(STACK_ALIGN) + ")";
}
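// For example, with STACK_ALIGN == 16, stackAlignStr("$size") produces
// "(($size+15)&-16)", the usual mask-based round-up in the emitted JS.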
void ensureAligned(int Alignment, HeapData* GlobalData) {
assert(isPowerOf2_32(Alignment) && Alignment > 0);
while (GlobalData->size() & (Alignment-1)) GlobalData->push_back(0);
}
void ensureAligned(int Alignment, HeapData& GlobalData) {
assert(isPowerOf2_32(Alignment) && Alignment > 0);
while (GlobalData.size() & (Alignment-1)) GlobalData.push_back(0);
}
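// For example, if GlobalData holds 5 bytes and Alignment is 8, three zero
// bytes of padding are appended so the next allocation starts at offset 8.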
HeapData *allocateAddress(const std::string& Name, unsigned Alignment) {
assert(isPowerOf2_32(Alignment) && Alignment > 0);
HeapData* GlobalData = &GlobalDataMap[Alignment];
ensureAligned(Alignment, GlobalData);
GlobalAddresses[Name] = Address(GlobalData->size(), Alignment*8);
return GlobalData;
}
// return the absolute offset of a global
unsigned getGlobalAddress(const std::string &s) {
GlobalAddressMap::const_iterator I = GlobalAddresses.find(s);
if (I == GlobalAddresses.end()) {
report_fatal_error("cannot find global address " + Twine(s));
}
Address a = I->second;
int Alignment = a.second/8;
assert(AlignedHeapStarts.size() > (unsigned)Alignment);
int Ret = a.first + AlignedHeapStarts[Alignment];
assert(Ret % Alignment == 0);
return Ret;
}
// returns the internal offset inside the proper block: GlobalData8, 32, 64
unsigned getRelativeGlobalAddress(const std::string &s) {
GlobalAddressMap::const_iterator I = GlobalAddresses.find(s);
if (I == GlobalAddresses.end()) {
report_fatal_error("cannot find global address " + Twine(s));
}
Address a = I->second;
return a.first;
}
char getFunctionSignatureLetter(Type *T) {
if (T->isVoidTy()) return 'v';
else if (T->isFloatingPointTy()) {
if (PreciseF32 && T->isFloatTy()) {
return 'f';
} else {
return 'd';
}
} else if (VectorType *VT = dyn_cast<VectorType>(T)) {
checkVectorType(VT);
if (VT->getElementType()->isIntegerTy()) {
return 'I';
} else {
return 'F';
}
} else {
return 'i';
}
}
std::string getFunctionSignature(const FunctionType *F, const std::string *Name=NULL) {
std::string Ret;
Ret += getFunctionSignatureLetter(F->getReturnType());
for (FunctionType::param_iterator AI = F->param_begin(),
AE = F->param_end(); AI != AE; ++AI) {
Ret += getFunctionSignatureLetter(*AI);
}
return Ret;
}
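// For example, a function of type float (i32, double) has the signature
// "fid" when PreciseF32 is enabled, and "did" otherwise.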
FunctionTable& ensureFunctionTable(const FunctionType *FT) {
FunctionTable &Table = FunctionTables[getFunctionSignature(FT)];
unsigned MinSize = ReservedFunctionPointers ? 2*(ReservedFunctionPointers+1) : 1; // each reserved slot must be 2-aligned
while (Table.size() < MinSize) Table.push_back("0");
return Table;
}
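// For example, with -emscripten-reserved-function-pointers=2 a fresh table
// starts with six "0" entries (2*(2+1)), since each reserved slot must be
// 2-aligned.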
unsigned getFunctionIndex(const Function *F) {
const std::string &Name = getJSName(F);
if (IndexedFunctions.find(Name) != IndexedFunctions.end()) return IndexedFunctions[Name];
std::string Sig = getFunctionSignature(F->getFunctionType(), &Name);
FunctionTable& Table = ensureFunctionTable(F->getFunctionType());
if (NoAliasingFunctionPointers) {
while (Table.size() < NextFunctionIndex) Table.push_back("0");
}
// XXX This is not quite right: the alignment here is always 1. That's fine in
// the ARM-like ABI we have, which allows unaligned functions; the one risk is
// if someone forces a function to be aligned and relies on that. We could use
// F->getAlignment() instead.
unsigned Alignment = 1;
while (Table.size() % Alignment) Table.push_back("0");
unsigned Index = Table.size();
Table.push_back(Name);
IndexedFunctions[Name] = Index;
if (NoAliasingFunctionPointers) {
NextFunctionIndex = Index+1;
}
// Invoke the callHandler for this function, if there is one. The function may
// only ever be indexed and never called directly, and the handler may still need
// to do things for it.
CallHandlerMap::const_iterator CH = CallHandlers.find(Name);
if (CH != CallHandlers.end()) {
(this->*(CH->second))(NULL, Name, -1);
}
return Index;
}
unsigned getBlockAddress(const Function *F, const BasicBlock *BB) {
BlockIndexMap& Blocks = BlockAddresses[F];
if (Blocks.find(BB) == Blocks.end()) {
// block addresses start from 0; take the size before the insertion below,
// since the evaluation order in `Blocks[BB] = Blocks.size()` is unspecified
unsigned Index = Blocks.size();
Blocks[BB] = Index;
}
return Blocks[BB];
}
unsigned getBlockAddress(const BlockAddress *BA) {
return getBlockAddress(BA->getFunction(), BA->getBasicBlock());
}
const Value *resolveFully(const Value *V) {
bool More = true;
while (More) {
More = false;
if (const GlobalAlias *GA = dyn_cast<GlobalAlias>(V)) {
V = GA->getAliasee();
More = true;
}
if (const ConstantExpr *CE = dyn_cast<ConstantExpr>(V)) {
V = CE->getOperand(0); // ignore bitcasts
More = true;
}
}
return V;
}
std::string relocateFunctionPointer(std::string FP) {
return Relocatable ? "(fb + (" + FP + ") | 0)" : FP;
}
std::string relocateGlobal(std::string G) {
return Relocatable ? "(gb + (" + G + ") | 0)" : G;
}
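// In relocatable mode these wrap an offset in the module's load base, e.g.
// relocateGlobal("1024") yields "(gb + (1024) | 0)"; function pointer
// offsets are based at fb in the same way.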
// Return a constant we are about to write into a global as a numeric offset. If the
// value is not known at compile time, emit a postSet to that location.
unsigned getConstAsOffset(const Value *V, unsigned AbsoluteTarget) {
V = resolveFully(V);
if (const Function *F = dyn_cast<const Function>(V)) {
if (Relocatable) {
PostSets.push_back("\n HEAP32[" + relocateGlobal(utostr(AbsoluteTarget)) + " >> 2] = " + relocateFunctionPointer(utostr(getFunctionIndex(F))) + ';');
return 0; // emit zero in there for now, until the postSet
}
return getFunctionIndex(F);
} else if (const BlockAddress *BA = dyn_cast<const BlockAddress>(V)) {
return getBlockAddress(BA);
} else {
if (const GlobalVariable *GV = dyn_cast<GlobalVariable>(V)) {
if (!GV->hasInitializer()) {
// We don't have a constant to emit here, so we must emit a postSet
// All postsets are of external values, so they are pointers, hence 32-bit
std::string Name = getOpName(V);
Externals.insert(Name);
if (Relocatable) {
PostSets.push_back("\n temp = g$" + Name + "() | 0;"); // we access linked externs through calls, and must do so to a temp for heap growth validation
// see later down about adding to an offset
std::string access = "HEAP32[" + relocateGlobal(utostr(AbsoluteTarget)) + " >> 2]";
PostSets.push_back("\n " + access + " = (" + access + " | 0) + temp;");
} else {
PostSets.push_back("\n HEAP32[" + relocateGlobal(utostr(AbsoluteTarget)) + " >> 2] = " + Name + ';');
}
return 0; // emit zero in there for now, until the postSet
} else if (Relocatable) {
// this is one of our globals, but we must relocate it. we return zero, but the caller may store
// an added offset, which we read at postSet time; in other words, we just add to that offset
std::string access = "HEAP32[" + relocateGlobal(utostr(AbsoluteTarget)) + " >> 2]";
PostSets.push_back("\n " + access + " = (" + access + " | 0) + " + relocateGlobal(utostr(getGlobalAddress(V->getName().str()))) + ';');
return 0; // emit zero in there for now, until the postSet
}
}
assert(!Relocatable);
return getGlobalAddress(V->getName().str());
}
}
// Transform the string input to emscripten_asm_const_*(str, arg1, arg2)
// into an id. We emit a map of id => string contents, and emscripten
// wraps it up so that calling that id calls that function.
unsigned getAsmConstId(const Value *V, int Arity) {
V = resolveFully(V);
const Constant *CI = cast<GlobalVariable>(V)->getInitializer();
std::string code;
if (isa<ConstantAggregateZero>(CI)) {
code = " ";
} else {
const ConstantDataSequential *CDS = cast<ConstantDataSequential>(CI);
code = CDS->getAsString();
// replace newlines with escaped newlines
size_t curr = 0;
while ((curr = code.find("\\n", curr)) != std::string::npos) {
code = code.replace(curr, 2, "\\\\n");
curr += 3; // skip this one
}
// replace double quotes with escaped double quotes
curr = 0;
while ((curr = code.find('"', curr)) != std::string::npos) {
if (curr == 0 || code[curr-1] != '\\') {
code = code.replace(curr, 1, "\\" "\"");
curr += 2; // skip this one
} else { // already escaped, escape the slash as well
code = code.replace(curr, 1, "\\" "\\" "\"");
curr += 3; // skip this one
}
}
}
if (AsmConsts.count(code) > 0) return AsmConsts[code];
unsigned id = AsmConsts.size();
AsmConsts[code] = id;
AsmConstArities[id] = Arity;
return id;
}
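// For example, a body alert("hi") arrives here as a global string and is
// stored as alert(\"hi\") with its quotes escaped; identical bodies reuse
// the same id.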
// Test whether the given value is known to be an absolute value or one we turn into an absolute value
bool isAbsolute(const Value *P) {
if (const IntToPtrInst *ITP = dyn_cast<IntToPtrInst>(P)) {
return isa<ConstantInt>(ITP->getOperand(0));
}
if (isa<ConstantPointerNull>(P) || isa<UndefValue>(P)) {
return true;
}
return false;
}
void checkVectorType(Type *T) {
VectorType *VT = cast<VectorType>(T);
// LLVM represents the results of vector comparison as vectors of i1. We
// represent them as vectors of integers the size of the vector elements
// of the compare that produced them.
assert(VT->getElementType()->getPrimitiveSizeInBits() == 8 ||
VT->getElementType()->getPrimitiveSizeInBits() == 16 ||
VT->getElementType()->getPrimitiveSizeInBits() == 32 ||
VT->getElementType()->getPrimitiveSizeInBits() == 64 ||
VT->getElementType()->getPrimitiveSizeInBits() == 128 ||
VT->getElementType()->getPrimitiveSizeInBits() == 1);
assert(VT->getBitWidth() <= 128);
assert(VT->getNumElements() <= 16);
if (VT->getElementType()->isIntegerTy())
{
if (VT->getNumElements() == 16 && VT->getElementType()->getPrimitiveSizeInBits() == 8) UsesSIMDInt8x16 = true;
else if (VT->getNumElements() == 8 && VT->getElementType()->getPrimitiveSizeInBits() == 16) UsesSIMDInt16x8 = true;
else if (VT->getNumElements() == 4 && VT->getElementType()->getPrimitiveSizeInBits() == 32) UsesSIMDInt32x4 = true;
else if (VT->getElementType()->getPrimitiveSizeInBits() != 1 && VT->getElementType()->getPrimitiveSizeInBits() != 128) {
report_fatal_error("Unsupported integer vector type with numElems: " + Twine(VT->getNumElements()) + ", primitiveSize: " + Twine(VT->getElementType()->getPrimitiveSizeInBits()) + "!");
}
}
else
{
if (VT->getNumElements() == 4 && VT->getElementType()->getPrimitiveSizeInBits() == 32) UsesSIMDFloat32x4 = true;
else if (VT->getNumElements() == 2 && VT->getElementType()->getPrimitiveSizeInBits() == 64) UsesSIMDFloat64x2 = true;
else report_fatal_error("Unsupported floating point vector type numElems: " + Twine(VT->getNumElements()) + ", primitiveSize: " + Twine(VT->getElementType()->getPrimitiveSizeInBits()) + "!");
}
}
std::string ensureCast(std::string S, Type *T, AsmCast sign) {
if (sign & ASM_MUST_CAST) return getCast(S, T);
return S;
}
std::string ftostr(const ConstantFP *CFP, AsmCast sign) {
const APFloat &flt = CFP->getValueAPF();
// Emscripten has its own spellings for infinity and NaN.
if (flt.getCategory() == APFloat::fcInfinity) return ensureCast(flt.isNegative() ? "-inf" : "inf", CFP->getType(), sign);
else if (flt.getCategory() == APFloat::fcNaN) return ensureCast("nan", CFP->getType(), sign);
// Request 9 or 17 digits, aka FLT_DECIMAL_DIG or DBL_DECIMAL_DIG (our
// long double is the same as our double), to avoid rounding errors.
SmallString<29> Str;
flt.toString(Str, PreciseF32 && CFP->getType()->isFloatTy() ? 9 : 17);
// asm.js considers literals to be floating-point literals when they contain a
// dot; however, our output may be processed by UglifyJS, which doesn't
// currently preserve dots in all cases. Mark floating-point literals with
// unary plus to force them to floating-point.
if (APFloat(flt).roundToIntegral(APFloat::rmNearestTiesToEven) == APFloat::opOK) {
return '+' + Str.str().str();
}
return Str.str().str();
}
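// For example, 1.0 prints without a dot and so becomes "+1", while 0.5
// already contains a dot and is emitted as "0.5".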
std::string getPtrLoad(const Value* Ptr);
/// Given a pointer to memory, returns the HEAP object and the index into that object used to access that memory.
/// @param Ptr [in] The pointer to the memory to access.
/// @param HeapName [out] Receives the name of the HEAP object used to perform the memory access.
/// @return The index into the heap HeapName for the memory access.
std::string getHeapNameAndIndex(const Value *Ptr, const char **HeapName);
// Like getHeapNameAndIndex(), but uses the given memory operation size instead of the one from Ptr.
std::string getHeapNameAndIndex(const Value *Ptr, const char **HeapName, unsigned Bytes);
/// Like getHeapNameAndIndex(), but for global variables only.
std::string getHeapNameAndIndexToGlobal(const GlobalVariable *GV, const char **HeapName);
/// Like getHeapNameAndIndex(), but for pointers represented in string expression form.
static std::string getHeapNameAndIndexToPtr(const std::string& Ptr, unsigned Bytes, bool Integer, const char **HeapName);
std::string getShiftedPtr(const Value *Ptr, unsigned Bytes);
/// Returns a string expression for accessing the given memory address.
std::string getPtrUse(const Value* Ptr);
/// Like getPtrUse(), but for pointers represented in string expression form.
static std::string getHeapAccess(const std::string& Name, unsigned Bytes, bool Integer=true);
std::string getConstant(const Constant*, AsmCast sign=ASM_SIGNED);
std::string getConstantVector(const ConstantVector *C);
std::string getConstantVector(const ConstantDataVector *C);
std::string getValueAsStr(const Value*, AsmCast sign=ASM_SIGNED);
std::string getValueAsCastStr(const Value*, AsmCast sign=ASM_SIGNED);
std::string getValueAsParenStr(const Value*);
std::string getValueAsCastParenStr(const Value*, AsmCast sign=ASM_SIGNED);
const std::string &getJSName(const Value* val);
std::string getPhiCode(const BasicBlock *From, const BasicBlock *To);
void printAttributes(const AttributeSet &PAL, const std::string &name);
void printType(Type* Ty);
void printTypes(const Module* M);
std::string getAdHocAssign(const StringRef &, Type *);
std::string getAssign(const Instruction *I);
std::string getAssignIfNeeded(const Value *V);
std::string getCast(const StringRef &, Type *, AsmCast sign=ASM_SIGNED);
std::string getParenCast(const StringRef &, Type *, AsmCast sign=ASM_SIGNED);
std::string getDoubleToInt(const StringRef &);
std::string getIMul(const Value *, const Value *);
std::string getLoad(const Instruction *I, const Value *P, Type *T, unsigned Alignment, char sep=';');
std::string getStore(const Instruction *I, const Value *P, Type *T, const std::string& VS, unsigned Alignment, char sep=';');
std::string getStackBump(unsigned Size);
std::string getStackBump(const std::string &Size);
void addBlock(const BasicBlock *BB, Relooper& R, LLVMToRelooperMap& LLVMToRelooper);
void printFunctionBody(const Function *F);
void generateInsertElementExpression(const InsertElementInst *III, raw_string_ostream& Code);
void generateExtractElementExpression(const ExtractElementInst *EEI, raw_string_ostream& Code);
std::string getSIMDCast(VectorType *fromType, VectorType *toType, const std::string &valueStr);
void generateShuffleVectorExpression(const ShuffleVectorInst *SVI, raw_string_ostream& Code);
void generateICmpExpression(const ICmpInst *I, raw_string_ostream& Code);
void generateFCmpExpression(const FCmpInst *I, raw_string_ostream& Code);
void generateShiftExpression(const BinaryOperator *I, raw_string_ostream& Code);
void generateUnrolledExpression(const User *I, raw_string_ostream& Code);
bool generateSIMDExpression(const User *I, raw_string_ostream& Code);
void generateExpression(const User *I, raw_string_ostream& Code);
std::string getOpName(const Value*);
void processConstants();
// nativization
typedef std::set<const Value*> NativizedVarsMap;
NativizedVarsMap NativizedVars;
void calculateNativizedVars(const Function *F);
// special analyses
bool canReloop(const Function *F);
// main entry point
void printModuleBody();
};
} // end anonymous namespace.
raw_pwrite_stream &JSWriter::nl(raw_pwrite_stream &Out, int delta) {
Out << '\n';
return Out;
}
static inline char halfCharToHex(unsigned char half) {
assert(half <= 15);
if (half <= 9) {
return '0' + half;
} else {
return 'A' + half - 10;
}
}
static inline void sanitizeGlobal(std::string& str) {
// Global names are prefixed with "_" to prevent them from colliding with
// names of things in normal JS.
str = "_" + str;
// Function and global names should already be in C-style format, aside
// from '.' in llvm intrinsics and possibly '$' and so forth. We lower all
// such invalid characters to '_'; there is a risk of collisions, but that
// should not happen in practice.
// TODO: in debug mode, check for such collisions.
size_t OriginalSize = str.size();
for (size_t i = 1; i < OriginalSize; ++i) {
unsigned char c = str[i];
if (!isalnum(c) && c != '_') str[i] = '_';
}
}
static inline void sanitizeLocal(std::string& str) {
// Local names are prefixed with "$" to prevent them from colliding with
// global names.
str = "$" + str;
// We need to convert every string that is not a valid JS identifier into
// a valid one, without collisions - we cannot turn "x.a" into "x_a" while
// also leaving "x_a" as is, for example.
//
// We leave valid characters 0-9a-zA-Z and _ unchanged. Anything else
// we replace with $ and append a hex representation of that value,
// so for example x.a turns into x$a2e, x..a turns into x$$a2e2e.
//
// As an optimization, we replace . with $ without appending anything,
// unless there is another illegal character. The reason is that . is a
// common illegal character, and we want to avoid resizing strings for
// perf reasons. If we do see that we need to append something, then for
// . we just append Z (one character, instead of the hex code).
//
size_t OriginalSize = str.size();
int Queued = 0;
for (size_t i = 1; i < OriginalSize; ++i) {
unsigned char c = str[i];
if (!isalnum(c) && c != '_') {
str[i] = '$';
if (c == '.') {
Queued++;
} else {
size_t s = str.size();
str.resize(s+2+Queued);
for (int i = 0; i < Queued; i++) {
str[s++] = 'Z';
}
Queued = 0;
str[s] = halfCharToHex(c >> 4);
str[s+1] = halfCharToHex(c & 0xf);
}
}
}
}
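// For example, sanitizeLocal turns "x.y-z" into "$x$y$zZ2D": both illegal
// characters become '$', then a 'Z' is appended for the queued '.' and
// "2D" (the hex code of '-') for the dash.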
static inline std::string ensureFloat(const std::string &S, Type *T) {
if (PreciseF32 && T->isFloatTy()) {
return "Math_fround(" + S + ')';
}
return S;
}
static inline std::string ensureFloat(const std::string &value, bool wrap) {
if (wrap) {
return "Math_fround(" + value + ')';
}
return value;
}
static void emitDebugInfo(raw_ostream& Code, const Instruction *I) {
auto &Loc = I->getDebugLoc();
if (Loc) {
unsigned Line = Loc.getLine();
auto *Scope = cast_or_null<MDScope>(Loc.getScope());
if (Scope) {
StringRef File = Scope->getFilename();
if (Line > 0)
Code << " //@line " << utostr(Line) << " \"" << (File.size() > 0 ? File.str() : "?") << "\"";
}
}
}
void JSWriter::error(const std::string& msg) {
report_fatal_error(msg);
}
std::string JSWriter::getPhiCode(const BasicBlock *From, const BasicBlock *To) {
// FIXME: this is all quite inefficient, and is also done once per incoming edge to each phi
// Find the phis, and generate assignments and dependencies
std::set<std::string> PhiVars;
for (BasicBlock::const_iterator I = To->begin(), E = To->end();
I != E; ++I) {
const PHINode* P = dyn_cast<PHINode>(I);
if (!P) break;
PhiVars.insert(getJSName(P));
}
typedef std::map<std::string, std::string> StringMap;
StringMap assigns; // variable -> assign statement
std::map<std::string, const Value*> values; // variable -> Value
StringMap deps; // variable -> dependency
StringMap undeps; // reverse: dependency -> variable
for (BasicBlock::const_iterator I = To->begin(), E = To->end();
I != E; ++I) {
const PHINode* P = dyn_cast<PHINode>(I);
if (!P) break;
int index = P->getBasicBlockIndex(From);
if (index < 0) continue;
// we found it
const std::string &name = getJSName(P);
assigns[name] = getAssign(P);
// Get the operand, and strip pointer casts, since normal expression
// translation also strips pointer casts, and we want to see the same
// thing so that we can detect any resulting dependencies.
const Value *V = P->getIncomingValue(index)->stripPointerCasts();
values[name] = V;
std::string vname = getValueAsStr(V);
if (const Instruction *VI = dyn_cast<const Instruction>(V)) {
if (VI->getParent() == To && PhiVars.find(vname) != PhiVars.end()) {
deps[name] = vname;
undeps[vname] = name;
}
}
}
// Emit assignments+values, taking into account dependencies, and breaking cycles
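// For example, the parallel copy x = phi(..., y), y = phi(..., x) cannot be
// emitted as two plain sequential assignments; the cycle is broken with a
// temporary such as x$phi that holds the old value.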
std::string pre = "", post = "";
while (assigns.size() > 0) {
bool emitted = false;
for (StringMap::iterator I = assigns.begin(); I != assigns.end();) {
StringMap::iterator last = I;
std::string curr = last->first;
const Value *V = values[curr];
std::string CV = getValueAsStr(V);
I++; // advance now, as we may erase
// if we have no dependencies, or we found none to emit and are at the end (so there is a cycle), emit
StringMap::const_iterator dep = deps.find(curr);
if (dep == deps.end() || (!emitted && I == assigns.end())) {
if (dep != deps.end()) {
// break a cycle
std::string depString = dep->second;
std::string temp = curr + "$phi";
pre += getAdHocAssign(temp, V->getType()) + CV + ';';
CV = temp;
deps.erase(curr);
undeps.erase(depString);
}
post += assigns[curr] + CV + ';';
assigns.erase(last);
emitted = true;
}
}
}
return pre + post;
}
const std::string &JSWriter::getJSName(const Value* val) {
ValueMap::const_iterator I = ValueNames.find(val);
if (I != ValueNames.end() && I->first == val)
return I->second;
// If this is an alloca we've replaced with another, use the other name.
if (const AllocaInst *AI = dyn_cast<AllocaInst>(val)) {
if (AI->isStaticAlloca()) {
const AllocaInst *Rep = Allocas.getRepresentative(AI);
if (Rep != AI) {
return getJSName(Rep);
}
}
}
std::string name;
if (val->hasName()) {
name = val->getName().str();
} else {
name = utostr(UniqueNum++);
}
if (isa<Constant>(val)) {
sanitizeGlobal(name);
} else {
sanitizeLocal(name);
}
return ValueNames[val] = name;
}
std::string JSWriter::getAdHocAssign(const StringRef &s, Type *t) {
UsedVars[s] = t;
return (s + " = ").str();
}
std::string JSWriter::getAssign(const Instruction *I) {
return getAdHocAssign(getJSName(I), I->getType());
}
std::string JSWriter::getAssignIfNeeded(const Value *V) {
if (const Instruction *I = dyn_cast<Instruction>(V)) {
if (!I->use_empty()) return getAssign(I);
}
return std::string();
}
std::string SIMDType(VectorType *t) {
bool isInt = t->getElementType()->isIntegerTy();
int primSize = t->getElementType()->getPrimitiveSizeInBits();
int numElems = t->getNumElements();
if (isInt && primSize == 1) primSize = 128 / numElems; // Always treat bit vectors as integer vectors of the base width.
return (isInt ? "Int" : "Float") + std::to_string(primSize) + 'x' + std::to_string(numElems);
}
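// For example, <4 x i32> maps to "Int32x4" and <4 x float> to "Float32x4";
// a <4 x i1> comparison result is treated as "Int32x4" (128/4 == 32 bits).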
std::string JSWriter::getCast(const StringRef &s, Type *t, AsmCast sign) {
switch (t->getTypeID()) {
default: {
errs() << *t << "\n";
assert(false && "Unsupported type");
}
case Type::VectorTyID:
return std::string("SIMD_") + SIMDType(cast<VectorType>(t)) + "_check(" + s.str() + ")";
case Type::FloatTyID: {
if (PreciseF32 && !(sign & ASM_FFI_OUT)) {
if (sign & ASM_FFI_IN) {
return ("Math_fround(+(" + s + "))").str();
} else {
return ("Math_fround(" + s + ")").str();
}
}
// otherwise fall through to double
}
case Type::DoubleTyID: return ("+" + s).str();
case Type::IntegerTyID: {
// fall through to the end for nonspecific
switch (t->getIntegerBitWidth()) {
case 1: if (!(sign & ASM_NONSPECIFIC)) return sign == ASM_UNSIGNED ? (s + "&1").str() : (s + "<<31>>31").str();
case 8: if (!(sign & ASM_NONSPECIFIC)) return sign == ASM_UNSIGNED ? (s + "&255").str() : (s + "<<24>>24").str();
case 16: if (!(sign & ASM_NONSPECIFIC)) return sign == ASM_UNSIGNED ? (s + "&65535").str() : (s + "<<16>>16").str();
case 32: return (sign == ASM_SIGNED || (sign & ASM_NONSPECIFIC) ? s + "|0" : s + ">>>0").str();
default: llvm_unreachable("Unsupported integer cast bitwidth");
}
}
case Type::PointerTyID:
return (sign == ASM_SIGNED || (sign & ASM_NONSPECIFIC) ? s + "|0" : s + ">>>0").str();
}
}
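// For example, getCast of "x" to i32 yields "x|0", to unsigned i8 yields
// "x&255", and to float with PreciseF32 yields "Math_fround(x)".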
std::string JSWriter::getParenCast(const StringRef &s, Type *t, AsmCast sign) {
return getCast(("(" + s + ")").str(), t, sign);
}
std::string JSWriter::getDoubleToInt(const StringRef &s) {
return ("~~(" + s + ")").str();
}
std::string JSWriter::getIMul(const Value *V1, const Value *V2) {
const ConstantInt *CI = NULL;
const Value *Other = NULL;
if ((CI = dyn_cast<ConstantInt>(V1))) {
Other = V2;
} else if ((CI = dyn_cast<ConstantInt>(V2))) {
Other = V1;
}
// we don't bother optimizing a multiply of two constants; the optimizer would have removed those
if (CI) {
std::string OtherStr = getValueAsStr(Other);
unsigned C = CI->getZExtValue();
if (C == 0) return "0";
if (C == 1) return OtherStr;
unsigned Orig = C, Shifts = 0;
while (C) {
if ((C & 1) && (C != 1)) break; // not power of 2
C >>= 1;
Shifts++;
if (C == 0) return OtherStr + "<<" + utostr(Shifts-1); // power of 2, emit shift
}
if (Orig < (1<<20)) return "(" + OtherStr + "*" + utostr(Orig) + ")|0"; // small enough, avoid imul
}
return "Math_imul(" + getValueAsStr(V1) + ", " + getValueAsStr(V2) + ")|0"; // unknown or too large, emit imul
}
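// For example, a multiply by 8 becomes "x<<3", by 10 becomes "(x*10)|0",
// and two non-constant operands become "Math_imul(x, y)|0".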
static inline const char *getHeapName(int Bytes, int Integer)
{
switch (Bytes) {
default: llvm_unreachable("Unsupported type");
case 8: return "HEAPF64";
case 4: return Integer ? "HEAP32" : "HEAPF32";
case 2: return "HEAP16";
case 1: return "HEAP8";
}
}
static inline int getHeapShift(int Bytes)
{
switch (Bytes) {
default: llvm_unreachable("Unsupported type");
case 8: return 3;
case 4: return 2;
case 2: return 1;
case 1: return 0;
}
}
static inline const char *getHeapShiftStr(int Bytes)
{
switch (Bytes) {
default: llvm_unreachable("Unsupported type");
case 8: return ">>3";
case 4: return ">>2";
case 2: return ">>1";
case 1: return ">>0";
}
}
std::string JSWriter::getHeapNameAndIndexToGlobal(const GlobalVariable *GV, const char **HeapName)
{
Type *t = cast<PointerType>(GV->getType())->getElementType();
unsigned Bytes = DL->getTypeAllocSize(t);
unsigned Addr = getGlobalAddress(GV->getName().str());
*HeapName = getHeapName(Bytes, t->isIntegerTy() || t->isPointerTy());
if (!Relocatable) {
return utostr(Addr >> getHeapShift(Bytes));
} else {
return relocateGlobal(utostr(Addr)) + getHeapShiftStr(Bytes);
}
}
std::string JSWriter::getHeapNameAndIndexToPtr(const std::string& Ptr, unsigned Bytes, bool Integer, const char **HeapName)
{
*HeapName = getHeapName(Bytes, Integer);
return Ptr + getHeapShiftStr(Bytes);
}
std::string JSWriter::getHeapNameAndIndex(const Value *Ptr, const char **HeapName, unsigned Bytes)
{
Type *t = cast<PointerType>(Ptr->getType())->getElementType();
if (const GlobalVariable *GV = dyn_cast<GlobalVariable>(Ptr)) {
return getHeapNameAndIndexToGlobal(GV, HeapName);
} else {
return getHeapNameAndIndexToPtr(getValueAsStr(Ptr), Bytes, t->isIntegerTy() || t->isPointerTy(), HeapName);
}
}
std::string JSWriter::getHeapNameAndIndex(const Value *Ptr, const char **HeapName)
{
Type *t = cast<PointerType>(Ptr->getType())->getElementType();
unsigned Bytes = DL->getTypeAllocSize(t);
return getHeapNameAndIndex(Ptr, HeapName, Bytes);
}
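// For example, for an i32 pointer $p these produce HeapName "HEAP32" and
// index "$p>>2", which callers combine into "HEAP32[$p>>2]".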
static const char *heapNameToAtomicTypeName(const char *HeapName)
{
if (!strcmp(HeapName, "HEAPF32")) return "f32";
if (!strcmp(HeapName, "HEAPF64")) return "f64";
return "";
}
std::string JSWriter::getLoad(const Instruction *I, const Value *P, Type *T, unsigned Alignment, char sep) {
std::string Assign = getAssign(I);
unsigned Bytes = DL->getTypeAllocSize(T);
std::string text;
if (Bytes <= Alignment || Alignment == 0) {
if (EnablePthreads && cast<LoadInst>(I)->isVolatile()) {
const char *HeapName;
std::string Index = getHeapNameAndIndex(P, &HeapName);
if (!strcmp(HeapName, "HEAPF32") || !strcmp(HeapName, "HEAPF64")) {
bool fround = PreciseF32 && !strcmp(HeapName, "HEAPF32");
// TODO: If https://bugzilla.mozilla.org/show_bug.cgi?id=1131613 and https://bugzilla.mozilla.org/show_bug.cgi?id=1131624 are
// implemented, we could remove the emulation, but until then we must emulate manually.
text = Assign + (fround ? "Math_fround(" : "+") + "_emscripten_atomic_load_" + heapNameToAtomicTypeName(HeapName) + "(" + getValueAsStr(P) + (fround ? "))" : ")");
} else {
text = Assign + "Atomics_load(" + HeapName + ',' + Index + ')';
}
} else {
text = Assign + getPtrLoad(P);
}
if (isAbsolute(P)) {
// loads from absolute constant addresses are either intentional segfaults (int x = *((int*)0)) or code problems
text += "; abort() /* segfault, load from absolute addr */";
}
} else {
// unaligned in some manner
if (EnablePthreads && cast<LoadInst>(I)->isVolatile()) {
errs() << "emcc: warning: unable to implement unaligned volatile load as atomic in " << I->getParent()->getParent()->getName() << ":" << *I << " | ";
emitDebugInfo(errs(), I);
errs() << "\n";
}
if (WarnOnUnaligned) {
errs() << "emcc: warning: unaligned load in " << I->getParent()->getParent()->getName() << ":" << *I << " | ";
emitDebugInfo(errs(), I);
errs() << "\n";
}
std::string PS = getValueAsStr(P);
switch (Bytes) {
case 8: {
switch (Alignment) {
case 4: {
text = "HEAP32[tempDoublePtr>>2]=HEAP32[" + PS + ">>2]" + sep +
"HEAP32[tempDoublePtr+4>>2]=HEAP32[" + PS + "+4>>2]";
break;
}
case 2: {
text = "HEAP16[tempDoublePtr>>1]=HEAP16[" + PS + ">>1]" + sep +
"HEAP16[tempDoublePtr+2>>1]=HEAP16[" + PS + "+2>>1]" + sep +
"HEAP16[tempDoublePtr+4>>1]=HEAP16[" + PS + "+4>>1]" + sep +
"HEAP16[tempDoublePtr+6>>1]=HEAP16[" + PS + "+6>>1]";
break;
}
case 1: {
text = "HEAP8[tempDoublePtr>>0]=HEAP8[" + PS + ">>0]" + sep +
"HEAP8[tempDoublePtr+1>>0]=HEAP8[" + PS + "+1>>0]" + sep +
"HEAP8[tempDoublePtr+2>>0]=HEAP8[" + PS + "+2>>0]" + sep +
"HEAP8[tempDoublePtr+3>>0]=HEAP8[" + PS + "+3>>0]" + sep +
"HEAP8[tempDoublePtr+4>>0]=HEAP8[" + PS + "+4>>0]" + sep +
"HEAP8[tempDoublePtr+5>>0]=HEAP8[" + PS + "+5>>0]" + sep +
"HEAP8[tempDoublePtr+6>>0]=HEAP8[" + PS + "+6>>0]" + sep +
"HEAP8[tempDoublePtr+7>>0]=HEAP8[" + PS + "+7>>0]";
break;
}
default: assert(0 && "bad 8 store");
}
text += sep + Assign + "+HEAPF64[tempDoublePtr>>3]";
break;
}
case 4: {
if (T->isIntegerTy() || T->isPointerTy()) {
switch (Alignment) {
case 2: {
text = Assign + "HEAPU16[" + PS + ">>1]|" +
"(HEAPU16[" + PS + "+2>>1]<<16)";
break;
}
case 1: {
text = Assign + "HEAPU8[" + PS + ">>0]|" +
"(HEAPU8[" + PS + "+1>>0]<<8)|" +
"(HEAPU8[" + PS + "+2>>0]<<16)|" +
"(HEAPU8[" + PS + "+3>>0]<<24)";
break;
}
default: assert(0 && "bad 4i store");
}
} else { // float
assert(T->isFloatingPointTy());
switch (Alignment) {
case 2: {
text = "HEAP16[tempDoublePtr>>1]=HEAP16[" + PS + ">>1]" + sep +
"HEAP16[tempDoublePtr+2>>1]=HEAP16[" + PS + "+2>>1]";
break;
}
case 1: {
text = "HEAP8[tempDoublePtr>>0]=HEAP8[" + PS + ">>0]" + sep +
"HEAP8[tempDoublePtr+1>>0]=HEAP8[" + PS + "+1>>0]" + sep +
"HEAP8[tempDoublePtr+2>>0]=HEAP8[" + PS + "+2>>0]" + sep +
"HEAP8[tempDoublePtr+3>>0]=HEAP8[" + PS + "+3>>0]";
break;
}
default: assert(0 && "bad 4f store");
}
text += sep + Assign + getCast("HEAPF32[tempDoublePtr>>2]", Type::getFloatTy(TheModule->getContext()));
}
break;
}
case 2: {
text = Assign + "HEAPU8[" + PS + ">>0]|" +
"(HEAPU8[" + PS + "+1>>0]<<8)";
break;
}
default: assert(0 && "bad store");
}
}
return text;
}
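// For example, an aligned i32 load assigns "HEAP32[$p>>2]|0", while a
// 2-aligned i32 load is split into
// "HEAPU16[$p>>1]|(HEAPU16[$p+2>>1]<<16)".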
std::string JSWriter::getStore(const Instruction *I, const Value *P, Type *T, const std::string& VS, unsigned Alignment, char sep) {
assert(sep == ';'); // FIXME when we need that
unsigned Bytes = DL->getTypeAllocSize(T);
std::string text;
if (Bytes <= Alignment || Alignment == 0) {
if (EnablePthreads && cast<StoreInst>(I)->isVolatile()) {
const char *HeapName;
std::string Index = getHeapNameAndIndex(P, &HeapName);
if (!strcmp(HeapName, "HEAPF32") || !strcmp(HeapName, "HEAPF64")) {
// TODO: If https://bugzilla.mozilla.org/show_bug.cgi?id=1131613 and https://bugzilla.mozilla.org/show_bug.cgi?id=1131624 are
// implemented, we could remove the emulation, but until then we must emulate manually.
text = std::string("_emscripten_atomic_store_") + heapNameToAtomicTypeName(HeapName) + "(" + getValueAsStr(P) + ',' + VS + ')';
if (PreciseF32 && !strcmp(HeapName, "HEAPF32"))
text = "Math_fround(" + text + ")";
else
text = "+" + text;
} else {
text = std::string("Atomics_store(") + HeapName + ',' + Index + ',' + VS + ')';
}
} else {
text = getPtrUse(P) + " = " + VS;
}
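// 536870912 == 1<<29; this oversized alignment marks an intentional
// segfault, matching the absolute-address load case above.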
if (Alignment == 536870912) text += "; abort() /* segfault */";
} else {
// unaligned in some manner
if (EnablePthreads && cast<StoreInst>(I)->isVolatile()) {
errs() << "emcc: warning: unable to implement unaligned volatile store as atomic in " << I->getParent()->getParent()->getName() << ":" << *I << " | ";
emitDebugInfo(errs(), I);
errs() << "\n";
}
if (WarnOnUnaligned) {
errs() << "emcc: warning: unaligned store in " << I->getParent()->getParent()->getName() << ":" << *I << " | ";
emitDebugInfo(errs(), I);
errs() << "\n";
}
std::string PS = getValueAsStr(P);
switch (Bytes) {
case 8: {
text = "HEAPF64[tempDoublePtr>>3]=" + VS + ';';
switch (Alignment) {
case 4: {
text += "HEAP32[" + PS + ">>2]=HEAP32[tempDoublePtr>>2];" +
"HEAP32[" + PS + "+4>>2]=HEAP32[tempDoublePtr+4>>2]";
break;
}
case 2: {
text += "HEAP16[" + PS + ">>1]=HEAP16[tempDoublePtr>>1];" +
"HEAP16[" + PS + "+2>>1]=HEAP16[tempDoublePtr+2>>1];" +
"HEAP16[" + PS + "+4>>1]=HEAP16[tempDoublePtr+4>>1];" +
"HEAP16[" + PS + "+6>>1]=HEAP16[tempDoublePtr+6>>1]";
break;
}
case 1: {
text += "HEAP8[" + PS + ">>0]=HEAP8[tempDoublePtr>>0];" +
"HEAP8[" + PS + "+1>>0]=HEAP8[tempDoublePtr+1>>0];" +
"HEAP8[" + PS + "+2>>0]=HEAP8[tempDoublePtr+2>>0];" +
"HEAP8[" + PS + "+3>>0]=HEAP8[tempDoublePtr+3>>0];" +
"HEAP8[" + PS + "+4>>0]=HEAP8[tempDoublePtr+4>>0];" +
"HEAP8[" + PS + "+5>>0]=HEAP8[tempDoublePtr+5>>0];" +
"HEAP8[" + PS + "+6>>0]=HEAP8[tempDoublePtr+6>>0];" +
"HEAP8[" + PS + "+7>>0]=HEAP8[tempDoublePtr+7>>0]";
break;
}
default: assert(0 && "bad 8 store");
}
break;
}
case 4: {
if (T->isIntegerTy() || T->isPointerTy()) {
switch (Alignment) {
case 2: {
text = "HEAP16[" + PS + ">>1]=" + VS + "&65535;" +
"HEAP16[" + PS + "+2>>1]=" + VS + ">>>16";
break;
}
case 1: {
text = "HEAP8[" + PS + ">>0]=" + VS + "&255;" +
"HEAP8[" + PS + "+1>>0]=(" + VS + ">>8)&255;" +
"HEAP8[" + PS + "+2>>0]=(" + VS + ">>16)&255;" +
"HEAP8[" + PS + "+3>>0]=" + VS + ">>24";
break;
}
default: assert(0 && "bad 4i store");
}
} else { // float
assert(T->isFloatingPointTy());
text = "HEAPF32[tempDoublePtr>>2]=" + VS + ';';
switch (Alignment) {
case 2: {
text += "HEAP16[" + PS + ">>1]=HEAP16[tempDoublePtr>>1];" +
"HEAP16[" + PS + "+2>>1]=HEAP16[tempDoublePtr+2>>1]";
break;
}
case 1: {
text += "HEAP8[" + PS + ">>0]=HEAP8[tempDoublePtr>>0];" +
"HEAP8[" + PS + "+1>>0]=HEAP8[tempDoublePtr+1>>0];" +
"HEAP8[" + PS + "+2>>0]=HEAP8[tempDoublePtr+2>>0];" +
"HEAP8[" + PS + "+3>>0]=HEAP8[tempDoublePtr+3>>0]";
break;
}
default: assert(0 && "bad 4f store");
}
}
break;
}
case 2: {
text = "HEAP8[" + PS + ">>0]=" + VS + "&255;" +
"HEAP8[" + PS + "+1>>0]=" + VS + ">>8";
break;
}
default: assert(0 && "bad store");
}
}
return text;
}
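// For example, an aligned i32 store emits "HEAP32[$p>>2] = $v", while a
// 2-aligned i32 store is split into
// "HEAP16[$p>>1]=$v&65535;HEAP16[$p+2>>1]=$v>>>16".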
std::string JSWriter::getStackBump(unsigned Size) {
return getStackBump(utostr(Size));
}
std::string JSWriter::getStackBump(const std::string &Size) {
std::string ret = "STACKTOP = STACKTOP + " + Size + "|0;";
if (EmscriptenAssertions) {
ret += " if ((STACKTOP|0) >= (STACK_MAX|0)) abort();";
}
return ret;
}
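// For example, getStackBump(16) yields "STACKTOP = STACKTOP + 16|0;",
// followed by "if ((STACKTOP|0) >= (STACK_MAX|0)) abort();" when
// EmscriptenAssertions is enabled.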
std::string JSWriter::getOpName(const Value* V) { // TODO: remove this
return getJSName(V);
}
std::string JSWriter::getPtrLoad(const Value* Ptr) {
Type *t = cast<PointerType>(Ptr->getType())->getElementType();
return getCast(getPtrUse(Ptr), t, ASM_NONSPECIFIC);
}
std::string JSWriter::getHeapAccess(const std::string& Name, unsigned Bytes, bool Integer) {
const char *HeapName = 0;
std::string Index = getHeapNameAndIndexToPtr(Name, Bytes, Integer, &HeapName);
return std::string(HeapName) + '[' + Index + ']';
}
std::string JSWriter::getShiftedPtr(const Value *Ptr, unsigned Bytes) {
const char *HeapName = 0; // unused
return getHeapNameAndIndex(Ptr, &HeapName, Bytes);
}
std::string JSWriter::getPtrUse(const Value* Ptr) {
const char *HeapName = 0;
std::string Index = getHeapNameAndIndex(Ptr, &HeapName);
return std::string(HeapName) + '[' + Index + ']';
}
std::string JSWriter::getConstant(const Constant* CV, AsmCast sign) {
if (isa<ConstantPointerNull>(CV)) return "0";
if (const Function *F = dyn_cast<Function>(CV)) {
return relocateFunctionPointer(utostr(getFunctionIndex(F)));
}
if (const GlobalValue *GV = dyn_cast<GlobalValue>(CV)) {
if (GV->isDeclaration()) {
std::string Name = getOpName(GV);
Externals.insert(Name);
if (Relocatable) {
// we access linked externs through calls, which we load at the beginning of basic blocks
FuncRelocatableExterns.insert(Name);
Name = "t$" + Name;
UsedVars[Name] = Type::getInt32Ty(CV->getContext());
}
return Name;
}
if (const GlobalAlias *GA = dyn_cast<GlobalAlias>(CV)) {
// Since we don't currently support linking of our output, we don't need
// to worry about weak or other kinds of aliases.
return getConstant(GA->getAliasee()->stripPointerCasts(), sign);
}
return relocateGlobal(utostr(getGlobalAddress(GV->getName().str())));
}
if (const ConstantFP *CFP = dyn_cast<ConstantFP>(CV)) {
std::string S = ftostr(CFP, sign);
if (PreciseF32 && CV->getType()->isFloatTy() && !(sign & ASM_FFI_OUT)) {
S = "Math_fround(" + S + ")";
}
return S;
} else if (const ConstantInt *CI = dyn_cast<ConstantInt>(CV)) {
if (sign != ASM_UNSIGNED && CI->getValue().getBitWidth() == 1) {
sign = ASM_UNSIGNED; // bools must always be unsigned: either 0 or 1
}
return CI->getValue().toString(10, sign != ASM_UNSIGNED);
} else if (isa<UndefValue>(CV)) {
std::string S;
if (VectorType *VT = dyn_cast<VectorType>(CV->getType())) {
checkVectorType(VT);
S = std::string("SIMD_") + SIMDType(VT) + "_splat(" + ensureFloat("0", !VT->getElementType()->isIntegerTy()) + ')';
} else {
S = CV->getType()->isFloatingPointTy() ? "+0" : "0"; // XXX refactor this
if (PreciseF32 && CV->getType()->isFloatTy() && !(sign & ASM_FFI_OUT)) {
S = "Math_fround(" + S + ")";
}
}
return S;
} else if (isa<ConstantAggregateZero>(CV)) {
if (VectorType *VT = dyn_cast<VectorType>(CV->getType())) {
checkVectorType(VT);
return std::string("SIMD_") + SIMDType(VT) + "_splat(" + ensureFloat("0", !VT->getElementType()->isIntegerTy()) + ')';
} else {
// something like [0 x i8*] zeroinitializer, which clang can emit for landingpads
return "0";
}
} else if (const ConstantDataVector *DV = dyn_cast<ConstantDataVector>(CV)) {
return getConstantVector(DV);
} else if (const ConstantVector *V = dyn_cast<ConstantVector>(CV)) {
return getConstantVector(V);
} else if (const ConstantArray *CA = dyn_cast<const ConstantArray>(CV)) {
// handle things like [i8* bitcast (<{ i32, i32, i32 }>* @_ZTISt9bad_alloc to i8*)] which clang can emit for landingpads
assert(CA->getNumOperands() == 1);
CV = CA->getOperand(0);
const ConstantExpr *CE = cast<ConstantExpr>(CV);
CV = CE->getOperand(0); // ignore bitcast
return getConstant(CV);
} else if (const BlockAddress *BA = dyn_cast<const BlockAddress>(CV)) {
return utostr(getBlockAddress(BA));
} else if (const ConstantExpr *CE = dyn_cast<ConstantExpr>(CV)) {
std::string Code;
raw_string_ostream CodeStream(Code);
CodeStream << '(';
generateExpression(CE, CodeStream);
CodeStream << ')';
return CodeStream.str();
} else {
CV->dump();
llvm_unreachable("Unsupported constant kind");
}
}
std::string JSWriter::getConstantVector(const ConstantVector *C) {
checkVectorType(C->getType());
unsigned NumElts = cast<VectorType>(C->getType())->getNumElements();
bool isInt = C->getType()->getElementType()->isIntegerTy();
// Check for a splat.
bool allEqual = true;
std::string op0 = getConstant(C->getOperand(0));
for (unsigned i = 0; i < NumElts; ++i) {
if (getConstant(C->getOperand(i)) != op0) {
allEqual = false;
break;
}
}
if (allEqual) {
return std::string("SIMD_") + SIMDType(C->getType()) + "_splat(" + ensureFloat(op0, !isInt) + ')';
}
std::string c = std::string("SIMD_") + SIMDType(C->getType()) + '(' + ensureFloat(op0, !isInt);
for (unsigned i = 1; i < NumElts; ++i) {
c += ',' + ensureFloat(getConstant(C->getOperand(i)), !isInt);
}
return c + ')';
}
std::string JSWriter::getConstantVector(const ConstantDataVector *C) {
checkVectorType(C->getType());
unsigned NumElts = cast<VectorType>(C->getType())->getNumElements();
bool isInt = C->getType()->getElementType()->isIntegerTy();
// Check for a splat.
bool allEqual = true;
std::string op0 = getConstant(C->getElementAsConstant(0));
for (unsigned i = 0; i < NumElts; ++i) {
if (getConstant(C->getElementAsConstant(i)) != op0) {
allEqual = false;
break;
}
}
if (allEqual) {
return std::string("SIMD_") + SIMDType(C->getType()) + "_splat(" + ensureFloat(op0, !isInt) + ')';
}
std::string c = std::string("SIMD_") + SIMDType(C->getType()) + '(' + ensureFloat(op0, !isInt);
for (unsigned i = 1; i < NumElts; ++i) {
c += ',' + ensureFloat(getConstant(C->getElementAsConstant(i)), !isInt);
}
return c + ')';
}
std::string JSWriter::getValueAsStr(const Value* V, AsmCast sign) {
// Skip past no-op bitcasts and zero-index geps.
V = V->stripPointerCasts();
if (const Constant *CV = dyn_cast<Constant>(V)) {
return getConstant(CV, sign);
} else {
return getJSName(V);
}
}
std::string JSWriter::getValueAsCastStr(const Value* V, AsmCast sign) {
// Skip past no-op bitcasts and zero-index geps.
V = V->stripPointerCasts();
if (isa<ConstantInt>(V) || isa<ConstantFP>(V)) {
return getConstant(cast<Constant>(V), sign);
} else {
return getCast(getValueAsStr(V), V->getType(), sign);
}
}
std::string JSWriter::getValueAsParenStr(const Value* V) {
// Skip past no-op bitcasts and zero-index geps.
V = V->stripPointerCasts();
if (const Constant *CV = dyn_cast<Constant>(V)) {
return getConstant(CV);
} else {
return "(" + getValueAsStr(V) + ")";
}
}
std::string JSWriter::getValueAsCastParenStr(const Value* V, AsmCast sign) {
// Skip past no-op bitcasts and zero-index geps.
V = V->stripPointerCasts();
if (isa<ConstantInt>(V) || isa<ConstantFP>(V) || isa<UndefValue>(V)) {
return getConstant(cast<Constant>(V), sign);
} else {
return "(" + getCast(getValueAsStr(V), V->getType(), sign) + ")";
}
}
void JSWriter::generateInsertElementExpression(const InsertElementInst *III, raw_string_ostream& Code) {
// LLVM has no vector type constructor operator; it uses chains of
// insertelement instructions instead. It also has no splat operator; it
// uses an insertelement followed by a shuffle instead. If this insertelement
// is part of either such sequence, skip it for now; we'll process it when we
// reach the end.
if (III->hasOneUse()) {
const User *U = *III->user_begin();
if (isa<InsertElementInst>(U))
return;
if (isa<ShuffleVectorInst>(U) &&
isa<ConstantAggregateZero>(cast<ShuffleVectorInst>(U)->getMask()) &&
!isa<InsertElementInst>(III->getOperand(0)) &&
isa<ConstantInt>(III->getOperand(2)) &&
cast<ConstantInt>(III->getOperand(2))->isZero())
{
return;
}
}
// This insertelement is at the base of a chain of single-user insertelement
// instructions. Collect all the inserted elements so that we can categorize
// the chain as either a splat, a constructor, or an actual series of inserts.
VectorType *VT = III->getType();
checkVectorType(VT);
unsigned NumElems = VT->getNumElements();
unsigned NumInserted = 0;
SmallVector<const Value *, 8> Operands(NumElems, NULL);
const Value *Splat = III->getOperand(1);
const Value *Base = III;
do {
const InsertElementInst *BaseIII = cast<InsertElementInst>(Base);
const ConstantInt *IndexInt = cast<ConstantInt>(BaseIII->getOperand(2));
unsigned Index = IndexInt->getZExtValue();
if (Operands[Index] == NULL)
++NumInserted;
Value *Op = BaseIII->getOperand(1);
if (Operands[Index] == NULL) {
Operands[Index] = Op;
if (Op != Splat)
Splat = NULL;
}
Base = BaseIII->getOperand(0);
} while (Base->hasOneUse() && isa<InsertElementInst>(Base));
// Emit code for the chain.
Code << getAssignIfNeeded(III);
if (NumInserted == NumElems) {
if (Splat) {
// Emit splat code.
if (VT->getElementType()->isIntegerTy()) {
Code << std::string("SIMD_") + SIMDType(VT) + "_splat(" << getValueAsStr(Splat) << ")";
} else {
std::string operand = getValueAsStr(Splat);
if (!PreciseF32) {
// SIMD_Float32x4_splat requires an actual float32 even if we're
// otherwise not being precise about it.
operand = "Math_fround(" + operand + ")";
}
Code << std::string("SIMD_") + SIMDType(VT) + "_splat(" << operand << ")";
}
} else {
// Emit constructor code.
Code << std::string("SIMD_") + SIMDType(VT) + '(';
for (unsigned Index = 0; Index < NumElems; ++Index) {
if (Index != 0)
Code << ", ";
std::string operand = getValueAsStr(Operands[Index]);
if (!PreciseF32 && VT->getElementType()->isFloatTy()) {
// SIMD_Float32x4_splat requires an actual float32 even if we're
// otherwise not being precise about it.
operand = "Math_fround(" + operand + ")";
}
Code << operand;
}
Code << ")";
}
} else {
// Emit a series of inserts.
std::string Result = getValueAsStr(Base);
for (unsigned Index = 0; Index < NumElems; ++Index) {
if (!Operands[Index])
continue;
std::string operand = getValueAsStr(Operands[Index]);
// As in the constructor case above, only float lanes need the Math_fround wrapper.
if (!PreciseF32 && VT->getElementType()->isFloatTy()) {
operand = "Math_fround(" + operand + ")";
}
Result = "SIMD_" + SIMDType(VT) + "_replaceLane(" + Result + ',' + utostr(Index) + ',' + operand + ')';
}
Code << Result;
}
}
void JSWriter::generateExtractElementExpression(const ExtractElementInst *EEI, raw_string_ostream& Code) {
VectorType *VT = cast<VectorType>(EEI->getVectorOperand()->getType());
checkVectorType(VT);
const ConstantInt *IndexInt = dyn_cast<const ConstantInt>(EEI->getIndexOperand());
if (IndexInt) {
unsigned Index = IndexInt->getZExtValue();
Code << getAssignIfNeeded(EEI);
std::string OperandCode;
raw_string_ostream CodeStream(OperandCode);
CodeStream << std::string("SIMD_") << SIMDType(VT) << "_extractLane(" << getValueAsStr(EEI->getVectorOperand()) << ',' << std::to_string(Index) << ')';
Code << getCast(CodeStream.str(), EEI->getType());
return;
}
error("SIMD extract element with non-constant index not implemented yet");
}
std::string castBoolVecToIntVec(int numElems, const std::string &str)
{
int elemWidth = 128 / numElems;
std::string simdType = "SIMD_Int" + std::to_string(elemWidth) + "x" + std::to_string(numElems);
return simdType + "_select(" + str + ", " + simdType + "_splat(-1), " + simdType + "_splat(0))";
}
std::string castIntVecToBoolVec(int numElems, const std::string &str)
{
int elemWidth = 128 / numElems;
std::string simdType = "SIMD_Int" + std::to_string(elemWidth) + "x" + std::to_string(numElems);
return simdType + "_notEqual(" + str + ", " + simdType + "_splat(0))";
}
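// For example, with numElems == 4 these expand around SIMD_Int32x4_select
// and SIMD_Int32x4_notEqual, mapping Bool32x4 lanes to -1/0 and back.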
std::string JSWriter::getSIMDCast(VectorType *fromType, VectorType *toType, const std::string &valueStr)
{
bool toInt = toType->getElementType()->isIntegerTy();
bool fromInt = fromType->getElementType()->isIntegerTy();
int fromPrimSize = fromType->getElementType()->getPrimitiveSizeInBits();
int toPrimSize = toType->getElementType()->getPrimitiveSizeInBits();
if (fromInt == toInt && fromPrimSize == toPrimSize) {
// To and from are the same types, no cast needed.
return valueStr;
}
bool fromIsBool = (fromInt && fromPrimSize == 1);
bool toIsBool = (toInt && toPrimSize == 1);
if (fromIsBool && !toIsBool) { // Casting from bool vector to a bit vector looks more complicated (e.g. Bool32x4 to Int32x4)
return castBoolVecToIntVec(toType->getNumElements(), valueStr);
}
if (fromType->getBitWidth() != toType->getBitWidth() && !fromIsBool && !toIsBool) {
error("Invalid SIMD cast between items of different bit sizes!");
}
return std::string("SIMD_") + SIMDType(toType) + "_from" + SIMDType(fromType) + "Bits(" + valueStr + ")";
}
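// For example, a bitcast of <4 x float> to <4 x i32> yields
// "SIMD_Int32x4_fromFloat32x4Bits(v)".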
void JSWriter::generateShuffleVectorExpression(const ShuffleVectorInst *SVI, raw_string_ostream& Code) {
Code << getAssignIfNeeded(SVI);
// LLVM has no splat operator, so it makes do by using an insert and a
// shuffle. If that's what this shuffle is doing, the code in
// generateInsertElementExpression will have also detected it and skipped
// emitting the insert, so we can just emit a splat here.
if (isa<ConstantAggregateZero>(SVI->getMask()) &&
isa<InsertElementInst>(SVI->getOperand(0)))
{
InsertElementInst *IEI = cast<InsertElementInst>(SVI->getOperand(0));
if (ConstantInt *CI = dyn_cast<ConstantInt>(IEI->getOperand(2))) {
if (CI->isZero()) {
std::string operand = getValueAsStr(IEI->getOperand(1));
if (!PreciseF32 && SVI->getType()->getElementType()->isFloatTy()) {
// SIMD_Float32x4_splat requires an actual float32 even if we're
// otherwise not being precise about it.
operand = "Math_fround(" + operand + ")";
}
Code << "SIMD_" + SIMDType(SVI->getType()) + "_splat(" << operand << ')';
return;
}
}
}
// Check whether we can generate a SIMD.js swizzle or shuffle.
std::string A = getValueAsStr(SVI->getOperand(0));
std::string B = getValueAsStr(SVI->getOperand(1));
int OpNumElements = cast<VectorType>(SVI->getOperand(0)->getType())->getNumElements();
int ResultNumElements = SVI->getType()->getNumElements();
bool swizzleA = true;
bool swizzleB = true;
for(int i = 0; i < ResultNumElements; ++i) {
if (SVI->getMaskValue(i) >= OpNumElements) swizzleA = false;
if (SVI->getMaskValue(i) < OpNumElements) swizzleB = false;
}
assert(!(swizzleA && swizzleB));
if (swizzleA || swizzleB) {
std::string T = (swizzleA ? A : B);
Code << "SIMD_" << SIMDType(SVI->getType()) << "_swizzle(" << T;
int i = 0;
for (; i < ResultNumElements; ++i) {
Code << ", ";
int Mask = SVI->getMaskValue(i);
if (Mask < 0) {
Code << 0;
} else if (Mask < OpNumElements) {
Code << Mask;
} else {
assert(Mask < OpNumElements * 2);
Code << (Mask-OpNumElements);
}
}
Code << ")";
return;
}
// Emit a fully-general shuffle.
Code << "SIMD_" << SIMDType(SVI->getType()) << "_shuffle(";
Code << getSIMDCast(cast<VectorType>(SVI->getOperand(0)->getType()), SVI->getType(), A) << ", "
<< getSIMDCast(cast<VectorType>(SVI->getOperand(1)->getType()), SVI->getType(), B) << ", ";
SmallVector<int, 16> Indices;
SVI->getShuffleMask(Indices);
for (unsigned int i = 0; i < Indices.size(); ++i) {
if (i != 0)
Code << ", ";
int Mask = Indices[i];
if (Mask < 0)
Code << 0;
else
Code << Mask;
}
Code << ')';
}
void JSWriter::generateICmpExpression(const ICmpInst *I, raw_string_ostream& Code) {
bool Invert = false;
const char *Name;
switch (I->getPredicate()) {
case ICmpInst::ICMP_EQ: Name = "equal"; break;
case ICmpInst::ICMP_NE: Name = "equal"; Invert = true; break;
case ICmpInst::ICMP_SLE: Name = "greaterThan"; Invert = true; break;
case ICmpInst::ICMP_SGE: Name = "lessThan"; Invert = true; break;
case ICmpInst::ICMP_ULE: Name = "unsignedLessThanOrEqual"; break;
case ICmpInst::ICMP_UGE: Name = "unsignedGreaterThanOrEqual"; break;
case ICmpInst::ICMP_ULT: Name = "unsignedLessThan"; break;
case ICmpInst::ICMP_SLT: Name = "lessThan"; break;
case ICmpInst::ICMP_UGT: Name = "unsignedGreaterThan"; break;
case ICmpInst::ICMP_SGT: Name = "greaterThan"; break;
default: I->dump(); error("invalid vector icmp"); break;
}
if (Invert)
Code << "SIMD_" << SIMDType(cast<VectorType>(I->getType())) << "_not(";
Code << getAssignIfNeeded(I) << "SIMD_" << SIMDType(cast<VectorType>(I->getOperand(0)->getType())) << '_' << Name << '('
<< getValueAsStr(I->getOperand(0)) << ',' << getValueAsStr(I->getOperand(1)) << ')';
if (Invert)
Code << ')';
}
void JSWriter::generateFCmpExpression(const FCmpInst *I, raw_string_ostream& Code) {
const char *Name;
bool Invert = false;
VectorType *VT = cast<VectorType>(I->getType());
checkVectorType(VT);
switch (I->getPredicate()) {
case FCmpInst::FCMP_FALSE:
Code << getAssignIfNeeded(I) << "SIMD_" << SIMDType(cast<VectorType>(I->getType())) << "_splat(" << ensureFloat("0", true) << ')';
return;
case FCmpInst::FCMP_TRUE:
Code << getAssignIfNeeded(I) << "SIMD_" << SIMDType(cast<VectorType>(I->getType())) << "_splat(" << ensureFloat("-1", true) << ')';
return;
case FCmpInst::FCMP_ONE:
checkVectorType(I->getOperand(0)->getType());
checkVectorType(I->getOperand(1)->getType());
Code << getAssignIfNeeded(I)
<< castIntVecToBoolVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getType())) + "_and(SIMD_" + SIMDType(cast<VectorType>(I->getType())) + "_and("
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(0)->getType())) + "_equal(" + getValueAsStr(I->getOperand(0)) + ',' + getValueAsStr(I->getOperand(0)) + ')') + ','
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(1)->getType())) + "_equal(" + getValueAsStr(I->getOperand(1)) + ',' + getValueAsStr(I->getOperand(1)) + ')') + ','
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(0)->getType())) + "_notEqual(" + getValueAsStr(I->getOperand(0)) + ',' + getValueAsStr(I->getOperand(1)) + ')') + ')');
return;
case FCmpInst::FCMP_UEQ:
checkVectorType(I->getOperand(0)->getType());
checkVectorType(I->getOperand(1)->getType());
Code << getAssignIfNeeded(I)
<< castIntVecToBoolVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getType())) + "_or(SIMD_" + SIMDType(cast<VectorType>(I->getType())) + "_or("
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(0)->getType())) + "_notEqual(" + getValueAsStr(I->getOperand(0)) + ',' + getValueAsStr(I->getOperand(0)) + ')') + ','
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(1)->getType())) + "_notEqual(" + getValueAsStr(I->getOperand(1)) + ',' + getValueAsStr(I->getOperand(1)) + ')') + ','
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(0)->getType())) + "_equal(" + getValueAsStr(I->getOperand(0)) + ',' + getValueAsStr(I->getOperand(1)) + ')') + ')');
return;
case FCmpInst::FCMP_ORD:
checkVectorType(I->getOperand(0)->getType());
checkVectorType(I->getOperand(1)->getType());
Code << getAssignIfNeeded(I)
<< castIntVecToBoolVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getType())) + "_and("
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(0)->getType())) + "_equal(" + getValueAsStr(I->getOperand(0)) + ',' + getValueAsStr(I->getOperand(0)) + ')') + ','
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(1)->getType())) + "_equal(" + getValueAsStr(I->getOperand(1)) + ',' + getValueAsStr(I->getOperand(1)) + ')') + ')');
return;
case FCmpInst::FCMP_UNO:
checkVectorType(I->getOperand(0)->getType());
checkVectorType(I->getOperand(1)->getType());
Code << getAssignIfNeeded(I)
<< castIntVecToBoolVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getType())) + "_or("
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(0)->getType())) + "_notEqual(" + getValueAsStr(I->getOperand(0)) + ',' + getValueAsStr(I->getOperand(0)) + ')') + ','
+ castBoolVecToIntVec(VT->getNumElements(), "SIMD_" + SIMDType(cast<VectorType>(I->getOperand(1)->getType())) + "_notEqual(" + getValueAsStr(I->getOperand(1)) + ',' + getValueAsStr(I->getOperand(1)) + ')') + ')');
return;
case FCmpInst::FCMP_OEQ: Name = "equal"; break;
case FCmpInst::FCMP_OGT: Name = "greaterThan"; break;
case FCmpInst::FCMP_OGE: Name = "greaterThanOrEqual"; break;
case FCmpInst::FCMP_OLT: Name = "lessThan"; break;
case FCmpInst::FCMP_OLE: Name = "lessThanOrEqual"; break;
case FCmpInst::FCMP_UGT: Name = "lessThanOrEqual"; Invert = true; break;
case FCmpInst::FCMP_UGE: Name = "lessThan"; Invert = true; break;
case FCmpInst::FCMP_ULT: Name = "greaterThanOrEqual"; Invert = true; break;
case FCmpInst::FCMP_ULE: Name = "greaterThan"; Invert = true; break;
case FCmpInst::FCMP_UNE: Name = "notEqual"; break;
default: I->dump(); error("invalid vector fcmp"); break;
}
if (Invert)
Code << "SIMD_" << SIMDType(cast<VectorType>(I->getType())) << "_not(";
checkVectorType(I->getOperand(0)->getType());
checkVectorType(I->getOperand(1)->getType());
Code << getAssignIfNeeded(I) << "SIMD_" << SIMDType(cast<VectorType>(I->getOperand(0)->getType())) << "_" << Name << "("
<< getValueAsStr(I->getOperand(0)) << ", " << getValueAsStr(I->getOperand(1)) << ")";
if (Invert)
Code << ")";
}
static const Value *getElement(const Value *V, unsigned i) {
if (const InsertElementInst *II = dyn_cast<InsertElementInst>(V)) {
if (ConstantInt *CI = dyn_cast<ConstantInt>(II->getOperand(2))) {
if (CI->equalsInt(i))
return II->getOperand(1);
}
return getElement(II->getOperand(0), i);
}
return NULL;
}
static const Value *getSplatValue(const Value *V) {
if (const Constant *C = dyn_cast<Constant>(V))
return C->getSplatValue();
VectorType *VTy = cast<VectorType>(V->getType());
const Value *Result = NULL;
for (unsigned i = 0; i < VTy->getNumElements(); ++i) {
const Value *E = getElement(V, i);
if (!E)
return NULL;
if (!Result)
Result = E;
else if (Result != E)
return NULL;
}
return Result;
}
void JSWriter::generateShiftExpression(const BinaryOperator *I, raw_string_ostream& Code) {
// If we're shifting every lane by the same amount (i.e. shifting by a splat
// value), then we can use a ByScalar shift.
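// For example, an ashr of an Int32x4 by a splatted constant 2 is emitted as
// SIMD_Int32x4_shiftRightArithmeticByScalar(v, 2).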
const Value *Count = I->getOperand(1);
if (const Value *Splat = getSplatValue(Count)) {
Code << getAssignIfNeeded(I) << "SIMD_" << SIMDType(cast<VectorType>(I->getType())) << '_';
if (I->getOpcode() == Instruction::AShr)
Code << "shiftRightArithmeticByScalar";
else if (I->getOpcode() == Instruction::LShr)
Code << "shiftRightLogicalByScalar";
else
Code << "shiftLeftByScalar";
Code << "(" << getValueAsStr(I->getOperand(0)) << ", " << getValueAsStr(Splat) << ")";
return;
}
// SIMD.js does not currently have vector-vector shifts.
generateUnrolledExpression(I, Code);
}
void JSWriter::generateUnrolledExpression(const User *I, raw_string_ostream& Code) {
VectorType *VT = cast<VectorType>(I->getType());
Code << getAssignIfNeeded(I);
Code << "SIMD_" << SIMDType(VT) << '(';
for (unsigned Index = 0; Index < VT->getNumElements(); ++Index) {
if (Index != 0)
Code << ", ";
if (!PreciseF32 && VT->getElementType()->isFloatTy()) {
Code << "Math_fround(";
}
std::string Extract;
if (VT->getElementType()->isIntegerTy()) {
Extract = "SIMD_Int32x4_extractLane(";
UsesSIMDInt32x4 = true;
} else {
Extract = "SIMD_Float32x4_extractLane(";
UsesSIMDFloat32x4 = true;
}
switch (Operator::getOpcode(I)) {
case Instruction::SDiv:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")|0)"
" / "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")|0)"
"|0";
break;
case Instruction::UDiv:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")>>>0)"
" / "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")>>>0)"
">>>0";
break;
case Instruction::SRem:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")|0)"
" % "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")|0)"
"|0";
break;
case Instruction::URem:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")>>>0)"
" % "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")>>>0)"
">>>0";
break;
case Instruction::AShr:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")|0)"
" >> "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")|0)"
"|0";
break;
case Instruction::LShr:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")|0)"
" >>> "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")|0)"
"|0";
break;
case Instruction::Shl:
Code << "(" << Extract << getValueAsStr(I->getOperand(0)) << "," << Index << ")|0)"
" << "
"(" << Extract << getValueAsStr(I->getOperand(1)) << "," << Index << ")|0)"
"|0";
break;
default: I->dump(); error("invalid unrolled vector instr"); break;
}
if (!PreciseF32 && VT->getElementType()->isFloatTy()) {
Code << ")";
}
}
Code << ")";
}
bool JSWriter::generateSIMDExpression(const User *I, raw_string_ostream& Code) {
VectorType *VT;
if ((VT = dyn_cast<VectorType>(I->getType()))) {
// vector-producing instructions
checkVectorType(VT);
std::string simdType = SIMDType(VT);
switch (Operator::getOpcode(I)) {
default: I->dump(); error("invalid vector instr"); break;
case Instruction::Call: // return value is just a SIMD value, no special handling
return false;
case Instruction::PHI: // handled separately - we push them back into the relooper branchings
break;
case Instruction::ICmp:
generateICmpExpression(cast<ICmpInst>(I), Code);
break;
case Instruction::FCmp:
generateFCmpExpression(cast<FCmpInst>(I), Code);
break;
case Instruction::SExt:
assert(cast<VectorType>(I->getOperand(0)->getType())->getElementType()->isIntegerTy(1) &&
"sign-extension from vector of other than i1 not yet supported");
Code << getAssignIfNeeded(I) << getSIMDCast(cast<VectorType>(I->getOperand(0)->getType()), VT, getValueAsStr(I->getOperand(0)));
break;
case Instruction::Select:
// Since we represent vectors of i1 as vectors of sign extended wider integers,
// selecting on them is just an elementwise select.
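// For example, "select <4 x i1> %m, <4 x i32> %a, <4 x i32> %b" is emitted as
// SIMD_Int32x4_select(m, a, b).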
if (isa<VectorType>(I->getOperand(0)->getType())) {
// The integer and floating-point element cases emit identical code, so
// there is no need to branch on the element type here.
Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_select(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << "," << getValueAsStr(I->getOperand(2)) << ")";
break;
}
// Otherwise we have a scalar condition, so it's a ?: operator.
return false;
case Instruction::FAdd: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_add(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::FMul: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_mul(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::FDiv: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_div(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::Add: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_add(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::Sub: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_sub(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::Mul: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_mul(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::And: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_and(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::Or: Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_or(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
case Instruction::Xor:
// LLVM represents a not(x) as -1 ^ x
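// e.g. "xor <4 x i32> %v, <i32 -1, i32 -1, i32 -1, i32 -1>" is recognized as
// a not and emitted as SIMD_Int32x4_not(v) rather than an explicit xor.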
Code << getAssignIfNeeded(I);
if (BinaryOperator::isNot(I)) {
Code << "SIMD_" << simdType << "_not(" << getValueAsStr(BinaryOperator::getNotArgument(I)) << ")"; break;
} else {
Code << "SIMD_" << simdType << "_xor(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")"; break;
}
break;
case Instruction::FSub:
// LLVM represents an fneg(x) as -0.0 - x.
Code << getAssignIfNeeded(I);
if (BinaryOperator::isFNeg(I)) {
Code << "SIMD_" << simdType << "_neg(" << getValueAsStr(BinaryOperator::getFNegArgument(I)) << ")";
} else {
Code << "SIMD_" << simdType << "_sub(" << getValueAsStr(I->getOperand(0)) << "," << getValueAsStr(I->getOperand(1)) << ")";
}
break;
case Instruction::BitCast:
case Instruction::SIToFP:
Code << getAssignIfNeeded(I);
Code << getSIMDCast(cast<VectorType>(I->getOperand(0)->getType()), cast<VectorType>(I->getType()), getValueAsStr(I->getOperand(0)));
break;
case Instruction::Load: {
const LoadInst *LI = cast<LoadInst>(I);
const Value *P = LI->getPointerOperand();
std::string PS = getValueAsStr(P);
Code << getAssignIfNeeded(I) << "SIMD_" << simdType << "_load" << "(HEAPU8, " << PS << ")";
break;
}
case Instruction::InsertElement:
generateInsertElementExpression(cast<InsertElementInst>(I), Code);
break;
case Instruction::ShuffleVector:
generateShuffleVectorExpression(cast<ShuffleVectorInst>(I), Code);
break;
case Instruction::SDiv:
case Instruction::UDiv:
case Instruction::SRem:
case Instruction::URem:
// The SIMD API does not currently support these operations directly.
// Emulate them using scalar operations (which is essentially the same
// as what would happen if the API did support them, since hardware
// doesn't support them).
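// For example, a <4 x i32> sdiv is emitted lane by lane, roughly:
//   SIMD_Int32x4((SIMD_Int32x4_extractLane(a,0)|0) / (SIMD_Int32x4_extractLane(b,0)|0)|0, ...)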
generateUnrolledExpression(I, Code);
break;
case Instruction::AShr:
case Instruction::LShr:
case Instruction::Shl:
generateShiftExpression(cast<BinaryOperator>(I), Code);
break;
}
return true;
} else {
// vector-consuming instructions
if (Operator::getOpcode(I) == Instruction::Store && (VT = dyn_cast<VectorType>(I->getOperand(0)->getType()))) { // a successful dyn_cast already guarantees a vector type
checkVectorType(VT);
std::string simdType = SIMDType(VT);
const StoreInst *SI = cast<StoreInst>(I);
const Value *P = SI->getPointerOperand();
std::string PS = getOpName(P);
std::string VS = getValueAsStr(SI->getValueOperand());
Code << getAdHocAssign(PS, P->getType()) << getValueAsStr(P) << ';';
Code << "SIMD_" << simdType << "_store" << "(HEAPU8, " << PS << ", " << VS << ")";
return true;
} else if (Operator::getOpcode(I) == Instruction::ExtractElement) {
generateExtractElementExpression(cast<ExtractElementInst>(I), Code);
return true;
}
}
return false;
}
static uint64_t LSBMask(unsigned numBits) {
return numBits >= 64 ? 0xFFFFFFFFFFFFFFFFULL : (1ULL << numBits) - 1;
}
// Given a string which contains a printed base address, print a new string
// which contains that address plus the given offset.
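// For example, AddOffset("ptr", 8) returns "((ptr) + 8|0)", AddOffset("ptr", 0)
// returns "ptr" unchanged, and AddOffset("", 8) returns just "8".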
static std::string AddOffset(const std::string &base, int32_t Offset) {
if (base.empty())
return itostr(Offset);
if (Offset == 0)
return base;
return "((" + base + ") + " + itostr(Offset) + "|0)";
}
// Generate code for an operator, either an Instruction or a ConstantExpr.
void JSWriter::generateExpression(const User *I, raw_string_ostream& Code) {
// To avoid emitting code and variables for the no-op pointer bitcasts
// and all-zero-index geps that LLVM needs to satisfy its type system, we
// call stripPointerCasts() on all values before translating them. This
// includes bitcasts whose only use is lifetime marker intrinsics.
assert(I == I->stripPointerCasts());
Type *T = I->getType();
if (T->isIntegerTy() && T->getIntegerBitWidth() > 32) {
errs() << *I << "\n";
report_fatal_error("legalization problem");
}
if (!generateSIMDExpression(I, Code)) switch (Operator::getOpcode(I)) {
default: {
I->dump();
error("Invalid instruction in JSWriter::generateExpression");
break;
}
case Instruction::Ret: {
const ReturnInst* ret = cast<ReturnInst>(I);
const Value *RV = ret->getReturnValue();
if (StackBumped) {
Code << "STACKTOP = sp;";
}
Code << "return";
if (RV != NULL) {
Code << " " << getValueAsCastParenStr(RV, ASM_NONSPECIFIC | ASM_MUST_CAST);
}
break;
}
case Instruction::Br:
case Instruction::IndirectBr:
case Instruction::Switch: return; // handled while relooping
case Instruction::Unreachable: {
// Typically there should be an abort right before these, so we don't emit any code.
// TODO: when ASSERTIONS are on, emit abort(0).
Code << "// unreachable";
break;
}
case Instruction::Add:
case Instruction::FAdd:
case Instruction::Sub:
case Instruction::FSub:
case Instruction::Mul:
case Instruction::FMul:
case Instruction::UDiv:
case Instruction::SDiv:
case Instruction::FDiv:
case Instruction::URem:
case Instruction::SRem:
case Instruction::FRem:
case Instruction::And:
case Instruction::Or:
case Instruction::Xor:
case Instruction::Shl:
case Instruction::LShr:
case Instruction::AShr:{
Code << getAssignIfNeeded(I);
unsigned opcode = Operator::getOpcode(I);
switch (opcode) {
case Instruction::Add: Code << getParenCast(
getValueAsParenStr(I->getOperand(0)) +
" + " +
getValueAsParenStr(I->getOperand(1)),
I->getType()
); break;
case Instruction::Sub: Code << getParenCast(
getValueAsParenStr(I->getOperand(0)) +
" - " +
getValueAsParenStr(I->getOperand(1)),
I->getType()
); break;
case Instruction::Mul: Code << getIMul(I->getOperand(0), I->getOperand(1)); break;
case Instruction::UDiv:
case Instruction::SDiv:
case Instruction::URem:
case Instruction::SRem: Code << "(" <<
getValueAsCastParenStr(I->getOperand(0), (opcode == Instruction::SDiv || opcode == Instruction::SRem) ? ASM_SIGNED : ASM_UNSIGNED) <<
((opcode == Instruction::UDiv || opcode == Instruction::SDiv) ? " / " : " % ") <<
getValueAsCastParenStr(I->getOperand(1), (opcode == Instruction::SDiv || opcode == Instruction::SRem) ? ASM_SIGNED : ASM_UNSIGNED) <<
")&-1"; break;
case Instruction::And: Code << getValueAsStr(I->getOperand(0)) << " & " << getValueAsStr(I->getOperand(1)); break;
case Instruction::Or: Code << getValueAsStr(I->getOperand(0)) << " | " << getValueAsStr(I->getOperand(1)); break;
case Instruction::Xor: Code << getValueAsStr(I->getOperand(0)) << " ^ " << getValueAsStr(I->getOperand(1)); break;
case Instruction::Shl: {
std::string Shifted = getValueAsStr(I->getOperand(0)) + " << " + getValueAsStr(I->getOperand(1));
if (I->getType()->getIntegerBitWidth() < 32) {
Shifted = getParenCast(Shifted, I->getType(), ASM_UNSIGNED); // remove bits that are shifted beyond the size of this value
}
Code << Shifted;
break;
}
case Instruction::AShr:
case Instruction::LShr: {
std::string Input = getValueAsStr(I->getOperand(0));
if (I->getType()->getIntegerBitWidth() < 32) {
Input = '(' + getCast(Input, I->getType(), opcode == Instruction::AShr ? ASM_SIGNED : ASM_UNSIGNED) + ')'; // fill in high bits, as shift needs those and is done in 32-bit
}
Code << Input << (opcode == Instruction::AShr ? " >> " : " >>> ") << getValueAsStr(I->getOperand(1));
break;
}
case Instruction::FAdd: Code << ensureFloat(getValueAsStr(I->getOperand(0)) + " + " + getValueAsStr(I->getOperand(1)), I->getType()); break;
case Instruction::FMul: Code << ensureFloat(getValueAsStr(I->getOperand(0)) + " * " + getValueAsStr(I->getOperand(1)), I->getType()); break;
case Instruction::FDiv: Code << ensureFloat(getValueAsStr(I->getOperand(0)) + " / " + getValueAsStr(I->getOperand(1)), I->getType()); break;
case Instruction::FRem: Code << ensureFloat(getValueAsStr(I->getOperand(0)) + " % " + getValueAsStr(I->getOperand(1)), I->getType()); break;
case Instruction::FSub:
// LLVM represents an fneg(x) as -0.0 - x.
if (BinaryOperator::isFNeg(I)) {
Code << ensureFloat("-" + getValueAsStr(BinaryOperator::getFNegArgument(I)), I->getType());
} else {
Code << ensureFloat(getValueAsStr(I->getOperand(0)) + " - " + getValueAsStr(I->getOperand(1)), I->getType());
}
break;
default: error("bad binary opcode"); break;
}
break;
}
case Instruction::FCmp: {
unsigned predicate = isa<ConstantExpr>(I) ?
cast<ConstantExpr>(I)->getPredicate() :
cast<FCmpInst>(I)->getPredicate();
Code << getAssignIfNeeded(I);
switch (predicate) {
// Comparisons which are simple JS operators.
case FCmpInst::FCMP_OEQ: Code << getValueAsStr(I->getOperand(0)) << " == " << getValueAsStr(I->getOperand(1)); break;
case FCmpInst::FCMP_UNE: Code << getValueAsStr(I->getOperand(0)) << " != " << getValueAsStr(I->getOperand(1)); break;
case FCmpInst::FCMP_OGT: Code << getValueAsStr(I->getOperand(0)) << " > " << getValueAsStr(I->getOperand(1)); break;
case FCmpInst::FCMP_OGE: Code << getValueAsStr(I->getOperand(0)) << " >= " << getValueAsStr(I->getOperand(1)); break;
case FCmpInst::FCMP_OLT: Code << getValueAsStr(I->getOperand(0)) << " < " << getValueAsStr(I->getOperand(1)); break;
case FCmpInst::FCMP_OLE: Code << getValueAsStr(I->getOperand(0)) << " <= " << getValueAsStr(I->getOperand(1)); break;
// Comparisons which are inverses of JS operators.
case FCmpInst::FCMP_UGT:
Code << "!(" << getValueAsStr(I->getOperand(0)) << " <= " << getValueAsStr(I->getOperand(1)) << ")";
break;
case FCmpInst::FCMP_UGE:
Code << "!(" << getValueAsStr(I->getOperand(0)) << " < " << getValueAsStr(I->getOperand(1)) << ")";
break;
case FCmpInst::FCMP_ULT:
Code << "!(" << getValueAsStr(I->getOperand(0)) << " >= " << getValueAsStr(I->getOperand(1)) << ")";
break;
case FCmpInst::FCMP_ULE:
Code << "!(" << getValueAsStr(I->getOperand(0)) << " > " << getValueAsStr(I->getOperand(1)) << ")";
break;
// Comparisons which require explicit NaN checks.
case FCmpInst::FCMP_UEQ:
Code << "(" << getValueAsStr(I->getOperand(0)) << " != " << getValueAsStr(I->getOperand(0)) << ") | " <<
"(" << getValueAsStr(I->getOperand(1)) << " != " << getValueAsStr(I->getOperand(1)) << ") |" <<
"(" << getValueAsStr(I->getOperand(0)) << " == " << getValueAsStr(I->getOperand(1)) << ")";
break;
case FCmpInst::FCMP_ONE:
Code << "(" << getValueAsStr(I->getOperand(0)) << " == " << getValueAsStr(I->getOperand(0)) << ") & " <<
"(" << getValueAsStr(I->getOperand(1)) << " == " << getValueAsStr(I->getOperand(1)) << ") &" <<
"(" << getValueAsStr(I->getOperand(0)) << " != " << getValueAsStr(I->getOperand(1)) << ")";
break;
// Simple NaN checks.
case FCmpInst::FCMP_ORD: Code << "(" << getValueAsStr(I->getOperand(0)) << " == " << getValueAsStr(I->getOperand(0)) << ") & " <<
"(" << getValueAsStr(I->getOperand(1)) << " == " << getValueAsStr(I->getOperand(1)) << ")"; break;
case FCmpInst::FCMP_UNO: Code << "(" << getValueAsStr(I->getOperand(0)) << " != " << getValueAsStr(I->getOperand(0)) << ") | " <<
"(" << getValueAsStr(I->getOperand(1)) << " != " << getValueAsStr(I->getOperand(1)) << ")"; break;
// Simple constants.
case FCmpInst::FCMP_FALSE: Code << "0"; break;
case FCmpInst::FCMP_TRUE : Code << "1"; break;
default: error("bad fcmp"); break;
}
break;
}
case Instruction::ICmp: {
unsigned predicate = isa<ConstantExpr>(I) ?
cast<ConstantExpr>(I)->getPredicate() :
cast<ICmpInst>(I)->getPredicate();
AsmCast sign = CmpInst::isUnsigned(predicate) ? ASM_UNSIGNED : ASM_SIGNED;
Code << getAssignIfNeeded(I) << "(" <<
getValueAsCastStr(I->getOperand(0), sign) <<
")";
switch (predicate) {
case ICmpInst::ICMP_EQ: Code << "=="; break;
case ICmpInst::ICMP_NE: Code << "!="; break;
case ICmpInst::ICMP_ULE: Code << "<="; break;
case ICmpInst::ICMP_SLE: Code << "<="; break;
case ICmpInst::ICMP_UGE: Code << ">="; break;
case ICmpInst::ICMP_SGE: Code << ">="; break;
case ICmpInst::ICMP_ULT: Code << "<"; break;
case ICmpInst::ICMP_SLT: Code << "<"; break;
case ICmpInst::ICMP_UGT: Code << ">"; break;
case ICmpInst::ICMP_SGT: Code << ">"; break;
default: llvm_unreachable("Invalid ICmp predicate");
}
Code << "(" <<
getValueAsCastStr(I->getOperand(1), sign) <<
")";
break;
}
case Instruction::Alloca: {
const AllocaInst* AI = cast<AllocaInst>(I);
// We've done an alloca, so we'll have bumped the stack and will
// need to restore it.
// Yes, we shouldn't have to bump it for nativized vars, however
// they are included in the frame offset, so the restore is still
// needed until that is fixed.
StackBumped = true;
if (NativizedVars.count(AI)) {
// nativized stack variable, we just need a 'var' definition
UsedVars[getJSName(AI)] = AI->getType()->getElementType();
return;
}
// Fixed-size entry-block allocations are allocated all at once in the
// function prologue.
if (AI->isStaticAlloca()) {
uint64_t Offset;
if (Allocas.getFrameOffset(AI, &Offset)) {
Code << getAssign(AI);
if (Allocas.getMaxAlignment() <= STACK_ALIGN) {
Code << "sp";
} else {
Code << "sp_a"; // aligned base of stack is different, use that
}
if (Offset != 0) {
Code << " + " << Offset << "|0";
}
break;
}
// Otherwise, this alloca is being represented by another alloca, so
// there's nothing to print.
return;
}
assert(AI->getAlignment() <= STACK_ALIGN); // TODO
Type *T = AI->getAllocatedType();
std::string Size;
uint64_t BaseSize = DL->getTypeAllocSize(T);
const Value *AS = AI->getArraySize();
if (const ConstantInt *CI = dyn_cast<ConstantInt>(AS)) {
Size = Twine(stackAlign(BaseSize * CI->getZExtValue())).str();
} else {
Size = stackAlignStr("((" + utostr(BaseSize) + '*' + getValueAsStr(AS) + ")|0)");
}
Code << getAssign(AI) << "STACKTOP; " << getStackBump(Size);
break;
}
case Instruction::Load: {
const LoadInst *LI = cast<LoadInst>(I);
const Value *P = LI->getPointerOperand();
unsigned Alignment = LI->getAlignment();
if (NativizedVars.count(P)) {
Code << getAssign(LI) << getValueAsStr(P);
} else {
Code << getLoad(LI, P, LI->getType(), Alignment);
}
break;
}
case Instruction::Store: {
const StoreInst *SI = cast<StoreInst>(I);
const Value *P = SI->getPointerOperand();
const Value *V = SI->getValueOperand();
unsigned Alignment = SI->getAlignment();
std::string VS = getValueAsStr(V);
if (NativizedVars.count(P)) {
Code << getValueAsStr(P) << " = " << VS;
} else {
Code << getStore(SI, P, V->getType(), VS, Alignment);
}
Type *T = V->getType();
if (T->isIntegerTy() && T->getIntegerBitWidth() > 32) {
errs() << *I << "\n";
report_fatal_error("legalization problem");
}
break;
}
case Instruction::GetElementPtr: {
Code << getAssignIfNeeded(I);
const GEPOperator *GEP = cast<GEPOperator>(I);
gep_type_iterator GTI = gep_type_begin(GEP);
int32_t ConstantOffset = 0;
std::string text;
// If the base is an initialized global variable, the address is just an
// integer constant, so we can fold it into the ConstantOffset directly.
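// For example, a GEP to field 1 of a global struct placed at address 1024,
// with a field offset of 4, folds to the single constant 1028, so no address
// arithmetic is emitted at all.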
const Value *Ptr = GEP->getPointerOperand()->stripPointerCasts();
if (isa<GlobalVariable>(Ptr) && cast<GlobalVariable>(Ptr)->hasInitializer() && !Relocatable) {
ConstantOffset = getGlobalAddress(Ptr->getName().str());
} else {
text = getValueAsParenStr(Ptr);
}
GetElementPtrInst::const_op_iterator OI = GEP->op_begin();
++OI; // skip the pointer operand (and avoid shadowing the function parameter I)
for (GetElementPtrInst::const_op_iterator E = GEP->op_end();
OI != E; ++OI) {
const Value *Index = *OI;
if (StructType *STy = dyn_cast<StructType>(*GTI++)) {
// For a struct, add the member offset.
unsigned FieldNo = cast<ConstantInt>(Index)->getZExtValue();
uint32_t Offset = DL->getStructLayout(STy)->getElementOffset(FieldNo);
ConstantOffset = (uint32_t)ConstantOffset + Offset;
} else {
// For an array, add the element offset, explicitly scaled.
uint32_t ElementSize = DL->getTypeAllocSize(*GTI);
if (const ConstantInt *CI = dyn_cast<ConstantInt>(Index)) {
// The index is constant. Add it to the accumulating offset.
ConstantOffset = (uint32_t)ConstantOffset + (uint32_t)CI->getSExtValue() * ElementSize;
} else {
// The index is non-constant. To avoid reassociating, which increases
// the risk of slow wraparounds, add the accumulated offset first.
text = AddOffset(text, ConstantOffset);
ConstantOffset = 0;
// Now add the scaled dynamic index.
std::string Mul = getIMul(Index, ConstantInt::get(Type::getInt32Ty(GEP->getContext()), ElementSize));
text = text.empty() ? Mul : ("(" + text + " + (" + Mul + ")|0)");
}
}
}
// Add in the final accumulated offset.
Code << AddOffset(text, ConstantOffset);
break;
}
case Instruction::PHI: {
// handled separately - we push them back into the relooper branchings
return;
}
case Instruction::PtrToInt:
case Instruction::IntToPtr:
Code << getAssignIfNeeded(I) << getValueAsStr(I->getOperand(0));
break;
case Instruction::Trunc:
case Instruction::ZExt:
case Instruction::SExt:
case Instruction::FPTrunc:
case Instruction::FPExt:
case Instruction::FPToUI:
case Instruction::FPToSI:
case Instruction::UIToFP:
case Instruction::SIToFP: {
Code << getAssignIfNeeded(I);
switch (Operator::getOpcode(I)) {
case Instruction::Trunc: {
unsigned outBits = I->getType()->getIntegerBitWidth();
Code << getValueAsStr(I->getOperand(0)) << "&" << utostr(LSBMask(outBits));
break;
}
case Instruction::SExt: {
std::string bits = utostr(32 - I->getOperand(0)->getType()->getIntegerBitWidth());
Code << getValueAsStr(I->getOperand(0)) << " << " << bits << " >> " << bits;
break;
}
case Instruction::ZExt: {
Code << getValueAsCastStr(I->getOperand(0), ASM_UNSIGNED);
break;
}
case Instruction::FPExt: {
if (PreciseF32) {
Code << "+" << getValueAsStr(I->getOperand(0)); break;
} else {
Code << getValueAsStr(I->getOperand(0)); break;
}
break;
}
case Instruction::FPTrunc: {
Code << ensureFloat(getValueAsStr(I->getOperand(0)), I->getType());
break;
}
case Instruction::SIToFP: Code << '(' << getCast(getValueAsCastParenStr(I->getOperand(0), ASM_SIGNED), I->getType()) << ')'; break;
case Instruction::UIToFP: Code << '(' << getCast(getValueAsCastParenStr(I->getOperand(0), ASM_UNSIGNED), I->getType()) << ')'; break;
case Instruction::FPToSI: Code << '(' << getDoubleToInt(getValueAsParenStr(I->getOperand(0))) << ')'; break;
case Instruction::FPToUI: Code << '(' << getCast(getDoubleToInt(getValueAsParenStr(I->getOperand(0))), I->getType(), ASM_UNSIGNED) << ')'; break;
case Instruction::PtrToInt: Code << '(' << getValueAsStr(I->getOperand(0)) << ')'; break;
case Instruction::IntToPtr: Code << '(' << getValueAsStr(I->getOperand(0)) << ')'; break;
default: llvm_unreachable("Unreachable");
}
break;
}
case Instruction::BitCast: {
Code << getAssignIfNeeded(I);
// Most bitcasts are no-ops for us. However, the exceptions are int-to-float and float-to-int, which must be reinterpreted through memory.
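// For example, a float-to-i32 bitcast is emitted as
// "(HEAPF32[tempDoublePtr>>2]=v, HEAP32[tempDoublePtr>>2]|0)": the value is
// stored through one typed-array view and read back through the other.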
Type *InType = I->getOperand(0)->getType();
Type *OutType = I->getType();
std::string V = getValueAsStr(I->getOperand(0));
if (InType->isIntegerTy() && OutType->isFloatingPointTy()) {
assert(InType->getIntegerBitWidth() == 32);
Code << "(HEAP32[tempDoublePtr>>2]=" << V << "," << getCast("HEAPF32[tempDoublePtr>>2]", Type::getFloatTy(TheModule->getContext())) << ")";
} else if (OutType->isIntegerTy() && InType->isFloatingPointTy()) {
assert(OutType->getIntegerBitWidth() == 32);
Code << "(HEAPF32[tempDoublePtr>>2]=" << V << "," "HEAP32[tempDoublePtr>>2]|0)";
} else {
Code << V;
}
break;
}
case Instruction::Call: {
const CallInst *CI = cast<CallInst>(I);
std::string Call = handleCall(CI);
if (Call.empty()) return;
Code << Call;
break;
}
case Instruction::Select: {
Code << getAssignIfNeeded(I) << getValueAsStr(I->getOperand(0)) << " ? " <<
getValueAsStr(I->getOperand(1)) << " : " <<
getValueAsStr(I->getOperand(2));
break;
}
case Instruction::AtomicRMW: {
const AtomicRMWInst *rmwi = cast<AtomicRMWInst>(I);
const Value *P = rmwi->getOperand(0);
const Value *V = rmwi->getOperand(1);
std::string VS = getValueAsStr(V);
if (EnablePthreads) {
std::string Assign = getAssign(rmwi);
std::string text;
const char *HeapName;
std::string Index = getHeapNameAndIndex(P, &HeapName);
const char *atomicFunc = 0;
switch (rmwi->getOperation()) {
case AtomicRMWInst::Xchg: atomicFunc = "exchange"; break;
case AtomicRMWInst::Add: atomicFunc = "add"; break;
case AtomicRMWInst::Sub: atomicFunc = "sub"; break;
case AtomicRMWInst::And: atomicFunc = "and"; break;
case AtomicRMWInst::Or: atomicFunc = "or"; break;
case AtomicRMWInst::Xor: atomicFunc = "xor"; break;
case AtomicRMWInst::Nand: // TODO
case AtomicRMWInst::Max:
case AtomicRMWInst::Min:
case AtomicRMWInst::UMax:
case AtomicRMWInst::UMin:
case AtomicRMWInst::BAD_BINOP: llvm_unreachable("Bad atomic operation");
}
if (!strcmp(HeapName, "HEAPF32") || !strcmp(HeapName, "HEAPF64")) {
// TODO: If https://bugzilla.mozilla.org/show_bug.cgi?id=1131613 and https://bugzilla.mozilla.org/show_bug.cgi?id=1131624 are
// implemented, we could remove the emulation, but until then we must emulate manually.
bool fround = PreciseF32 && !strcmp(HeapName, "HEAPF32");
Code << Assign << (fround ? "Math_fround(" : "+") << "_emscripten_atomic_" << atomicFunc << "_" << heapNameToAtomicTypeName(HeapName) << "(" << getValueAsStr(P) << ", " << VS << (fround ? "))" : ")"); break;
// TODO: Remove the following two lines once https://bugzilla.mozilla.org/show_bug.cgi?id=1141986 is implemented!
} else if (rmwi->getOperation() == AtomicRMWInst::Xchg && !strcmp(HeapName, "HEAP32")) {
Code << Assign << "_emscripten_atomic_exchange_u32(" << getValueAsStr(P) << ", " << VS << ")|0"; break;
} else {
Code << Assign << "Atomics_" << atomicFunc << "(" << HeapName << ", " << Index << ", " << VS << ")"; break;
}
} else {
Code << getLoad(rmwi, P, I->getType(), 0) << ';';
// Without pthreads there is no concurrent access, so emulate the atomic read-modify-write with a plain load followed by a store.
switch (rmwi->getOperation()) {
case AtomicRMWInst::Xchg: Code << getStore(rmwi, P, I->getType(), VS, 0); break;
case AtomicRMWInst::Add: Code << getStore(rmwi, P, I->getType(), "((" + getJSName(I) + '+' + VS + ")|0)", 0); break;
case AtomicRMWInst::Sub: Code << getStore(rmwi, P, I->getType(), "((" + getJSName(I) + '-' + VS + ")|0)", 0); break;
case AtomicRMWInst::And: Code << getStore(rmwi, P, I->getType(), "(" + getJSName(I) + '&' + VS + ")", 0); break;
case AtomicRMWInst::Nand: Code << getStore(rmwi, P, I->getType(), "(~(" + getJSName(I) + '&' + VS + "))", 0); break;
case AtomicRMWInst::Or: Code << getStore(rmwi, P, I->getType(), "(" + getJSName(I) + '|' + VS + ")", 0); break;
case AtomicRMWInst::Xor: Code << getStore(rmwi, P, I->getType(), "(" + getJSName(I) + '^' + VS + ")", 0); break;
case AtomicRMWInst::Max:
case AtomicRMWInst::Min:
case AtomicRMWInst::UMax:
case AtomicRMWInst::UMin:
case AtomicRMWInst::BAD_BINOP: llvm_unreachable("Bad atomic operation");
}
}
break;
}
case Instruction::Fence:
if (EnablePthreads) {
Code << "Atomics_fence()";
} else {
Code << "/* fence */"; // no threads, so nothing to do here
}
break;
}
if (const Instruction *Inst = dyn_cast<Instruction>(I)) {
Code << ';';
// append debug info
emitDebugInfo(Code, Inst);
Code << '\n';
}
}
// Checks whether to use a condition variable. We do so for switches and for indirectbrs.
static const Value *considerConditionVar(const Instruction *I) {
if (const IndirectBrInst *IB = dyn_cast<const IndirectBrInst>(I)) {
return IB->getAddress();
}
const SwitchInst *SI = dyn_cast<SwitchInst>(I);
if (!SI) return NULL;
// Otherwise, we trust LLVM switches; if they were too big or sparse, the switch expansion pass should have fixed that.
return SI->getCondition();
}
void JSWriter::addBlock(const BasicBlock *BB, Relooper& R, LLVMToRelooperMap& LLVMToRelooper) {
std::string Code;
raw_string_ostream CodeStream(Code);
for (BasicBlock::const_iterator I = BB->begin(), E = BB->end();
I != E; ++I) {
if (I->stripPointerCasts() == I) {
generateExpression(I, CodeStream);
}
}
CodeStream.flush();
const Value* Condition = considerConditionVar(BB->getTerminator());
Block *Curr = new Block(Code.c_str(), Condition ? getValueAsCastStr(Condition).c_str() : NULL);
LLVMToRelooper[BB] = Curr;
R.AddBlock(Curr);
}
void JSWriter::printFunctionBody(const Function *F) {
assert(!F->isDeclaration());
// Prepare relooper
Relooper::MakeOutputBuffer(1024*1024);
Relooper R;
//if (!canReloop(F)) R.SetEmulate(true);
if (F->getAttributes().hasAttribute(AttributeSet::FunctionIndex, Attribute::MinSize) ||
F->getAttributes().hasAttribute(AttributeSet::FunctionIndex, Attribute::OptimizeForSize)) {
R.SetMinSize(true);
}
R.SetAsmJSMode(1);
Block *Entry = NULL;
LLVMToRelooperMap LLVMToRelooper;
// Create relooper blocks with their contents. TODO: We could optimize
// indirectbr by emitting indexed blocks first, so their indexes
// match up with the label index.
for (Function::const_iterator BI = F->begin(), BE = F->end();
BI != BE; ++BI) {
InvokeState = 0; // each basic block begins in state 0; the previous may not have cleared it, if e.g. it had a throw in the middle and the rest of it was decapitated
addBlock(BI, R, LLVMToRelooper);
if (!Entry) Entry = LLVMToRelooper[BI];
}
assert(Entry);
// Create branchings
for (Function::const_iterator BI = F->begin(), BE = F->end();
BI != BE; ++BI) {
const TerminatorInst *TI = BI->getTerminator();
switch (TI->getOpcode()) {
default: {
report_fatal_error("invalid branch instr " + Twine(TI->getOpcodeName()));
break;
}
case Instruction::Br: {
const BranchInst* br = cast<BranchInst>(TI);
if (br->getNumOperands() == 3) {
BasicBlock *S0 = br->getSuccessor(0);
BasicBlock *S1 = br->getSuccessor(1);
std::string P0 = getPhiCode(&*BI, S0);
std::string P1 = getPhiCode(&*BI, S1);
LLVMToRelooper[&*BI]->AddBranchTo(LLVMToRelooper[&*S0], getValueAsStr(TI->getOperand(0)).c_str(), P0.size() > 0 ? P0.c_str() : NULL);
LLVMToRelooper[&*BI]->AddBranchTo(LLVMToRelooper[&*S1], NULL, P1.size() > 0 ? P1.c_str() : NULL);
} else if (br->getNumOperands() == 1) {
BasicBlock *S = br->getSuccessor(0);
std::string P = getPhiCode(&*BI, S);
LLVMToRelooper[&*BI]->AddBranchTo(LLVMToRelooper[&*S], NULL, P.size() > 0 ? P.c_str() : NULL);
} else {
error("Branch with 2 operands?");
}
break;
}
case Instruction::IndirectBr: {
const IndirectBrInst* br = cast<IndirectBrInst>(TI);
unsigned Num = br->getNumDestinations();
std::set<const BasicBlock*> Seen; // sadly llvm allows the same block to appear multiple times
bool SetDefault = false; // pick the first and make it the default, llvm gives no reasonable default here
for (unsigned i = 0; i < Num; i++) {
const BasicBlock *S = br->getDestination(i);
if (Seen.find(S) != Seen.end()) continue;
Seen.insert(S);
std::string P = getPhiCode(&*BI, S);
std::string Target;
if (!SetDefault) {
SetDefault = true;
} else {
Target = "case " + utostr(getBlockAddress(F, S)) + ": ";
}
LLVMToRelooper[&*BI]->AddBranchTo(LLVMToRelooper[&*S], Target.size() > 0 ? Target.c_str() : NULL, P.size() > 0 ? P.c_str() : NULL);
}
break;
}
case Instruction::Switch: {
const SwitchInst* SI = cast<SwitchInst>(TI);
bool UseSwitch = !!considerConditionVar(SI);
BasicBlock *DD = SI->getDefaultDest();
std::string P = getPhiCode(&*BI, DD);
LLVMToRelooper[&*BI]->AddBranchTo(LLVMToRelooper[&*DD], NULL, P.size() > 0 ? P.c_str() : NULL);
typedef std::map<const BasicBlock*, std::string> BlockCondMap;
BlockCondMap BlocksToConditions;
for (SwitchInst::ConstCaseIt i = SI->case_begin(), e = SI->case_end(); i != e; ++i) {
const BasicBlock *BB = i.getCaseSuccessor();
std::string Curr = i.getCaseValue()->getValue().toString(10, true);
std::string Condition;
if (UseSwitch) {
Condition = "case " + Curr + ": ";
} else {
Condition = "(" + getValueAsCastParenStr(SI->getCondition()) + " == " + Curr + ")";
}
BlocksToConditions[BB] = Condition + (!UseSwitch && BlocksToConditions[BB].size() > 0 ? " | " : "") + BlocksToConditions[BB];
}
std::set<const BasicBlock *> alreadyProcessed;
for (SwitchInst::ConstCaseIt i = SI->case_begin(), e = SI->case_end(); i != e; ++i) {
const BasicBlock *BB = i.getCaseSuccessor();
if (!alreadyProcessed.insert(BB).second) continue;
if (BB == DD) continue; // ok to eliminate this, default dest will get there anyhow
std::string P = getPhiCode(&*BI, BB);
LLVMToRelooper[&*BI]->AddBranchTo(LLVMToRelooper[&*BB], BlocksToConditions[BB].c_str(), P.size() > 0 ? P.c_str() : NULL);
}
break;
}
case Instruction::Ret:
case Instruction::Unreachable: break;
}
}
// Calculate relooping and print
R.Calculate(Entry);
R.Render();
// Emit local variables
UsedVars["sp"] = Type::getInt32Ty(F->getContext());
unsigned MaxAlignment = Allocas.getMaxAlignment();
if (MaxAlignment > STACK_ALIGN) {
UsedVars["sp_a"] = Type::getInt32Ty(F->getContext());
}
UsedVars["label"] = Type::getInt32Ty(F->getContext());
if (!UsedVars.empty()) {
unsigned Count = 0;
for (VarMap::const_iterator VI = UsedVars.begin(); VI != UsedVars.end(); ++VI) {
if (Count == 20) {
Out << ";\n";
Count = 0;
}
if (Count == 0) Out << " var ";
if (Count > 0) {
Out << ", ";
}
Count++;
Out << VI->first << " = ";
switch (VI->second->getTypeID()) {
default:
llvm_unreachable("unsupported variable initializer type");
case Type::PointerTyID:
case Type::IntegerTyID:
Out << "0";
break;
case Type::FloatTyID:
if (PreciseF32) {
Out << "Math_fround(0)";
break;
}
// otherwise fall through to double
case Type::DoubleTyID:
Out << "+0";
break;
case Type::VectorTyID:
Out << "SIMD_" << SIMDType(cast<VectorType>(VI->second)) << "(0";
for (unsigned i = 1; i < cast<VectorType>(VI->second)->getNumElements(); ++i) {
Out << ",0";
}
Out << ')';
break;
}
}
Out << ";";
nl(Out);
}
{
static bool Warned = false;
if (!Warned && OptLevel < 2 && UsedVars.size() > 2000) {
prettyWarning() << "emitted code will contain very large numbers of local variables, which is bad for performance (build to JS with -O2 or above to avoid this - make sure to do so both on source files, and during 'linking')\n";
Warned = true;
}
}
// Emit stack entry
Out << " " << getAdHocAssign("sp", Type::getInt32Ty(F->getContext())) << "STACKTOP;";
if (uint64_t FrameSize = Allocas.getFrameSize()) {
if (MaxAlignment > STACK_ALIGN) {
// We must align this entire stack frame to something higher than the default
Out << "\n ";
Out << "sp_a = STACKTOP = (STACKTOP + " << utostr(MaxAlignment-1) << ")&-" << utostr(MaxAlignment) << ";";
}
Out << "\n ";
Out << getStackBump(FrameSize);
}
// Emit extern loads, if we have any
if (Relocatable) {
if (FuncRelocatableExterns.size() > 0) {
for (auto& RE : FuncRelocatableExterns) {
std::string Temp = "t$" + RE;
std::string Call = "g$" + RE;
Out << Temp + " = " + Call + "() | 0;\n";
}
FuncRelocatableExterns.clear();
}
}
// Emit (relooped) code
char *buffer = Relooper::GetOutputBuffer();
nl(Out) << buffer;
// Ensure a final return if necessary
Type *RT = F->getFunctionType()->getReturnType();
if (!RT->isVoidTy()) {
char *LastCurly = strrchr(buffer, '}');
if (!LastCurly) LastCurly = buffer;
char *FinalReturn = strstr(LastCurly, "return ");
if (!FinalReturn) {
Out << " return " << getParenCast(getConstant(UndefValue::get(RT)), RT, ASM_NONSPECIFIC) << ";\n";
}
}
if (Relocatable) {
if (!F->hasInternalLinkage()) {
Exports.push_back(getJSName(F));
}
}
}
void JSWriter::processConstants() {
// Ensure a name for each global
for (Module::global_iterator I = TheModule->global_begin(),
E = TheModule->global_end(); I != E; ++I) {
if (I->hasInitializer()) {
if (!I->hasName()) {
// ensure a unique name
static int id = 1;
std::string newName;
while (1) {
newName = std::string("glb_") + utostr(id);
if (!TheModule->getGlobalVariable("glb_" + utostr(id))) break;
id++;
assert(id != 0);
}
I->setName(Twine(newName));
}
}
}
// First, calculate the address of each constant
for (Module::const_global_iterator I = TheModule->global_begin(),
E = TheModule->global_end(); I != E; ++I) {
if (I->hasInitializer()) {
parseConstant(I->getName().str(), I->getInitializer(), I->getAlignment(), true);
}
}
// Calculate MaxGlobalAlign, adjust final paddings, and adjust GlobalBasePadding
assert(MaxGlobalAlign == 0);
for (auto& GI : GlobalDataMap) {
int Alignment = GI.first;
if (Alignment > MaxGlobalAlign) MaxGlobalAlign = Alignment;
ensureAligned(Alignment, &GlobalDataMap[Alignment]);
}
if (!Relocatable && MaxGlobalAlign > 0) {
while ((GlobalBase+GlobalBasePadding) % MaxGlobalAlign != 0) GlobalBasePadding++;
}
while (AlignedHeapStarts.size() <= (unsigned)MaxGlobalAlign) AlignedHeapStarts.push_back(0);
for (auto& GI : GlobalDataMap) {
int Alignment = GI.first;
int Curr = GlobalBase + GlobalBasePadding;
for (auto& GJ : GlobalDataMap) { // bigger alignments show up first, smaller later
if (GJ.first > Alignment) {
Curr += GJ.second.size();
}
}
AlignedHeapStarts[Alignment] = Curr;
}
// Second, allocate their contents
for (Module::const_global_iterator I = TheModule->global_begin(),
E = TheModule->global_end(); I != E; ++I) {
if (I->hasInitializer()) {
parseConstant(I->getName().str(), I->getInitializer(), I->getAlignment(), false);
}
}
if (Relocatable) {
for (Module::const_global_iterator I = TheModule->global_begin(),
E = TheModule->global_end(); I != E; ++I) {
if (I->hasInitializer() && !I->hasInternalLinkage()) {
std::string Name = I->getName().str();
if (GlobalAddresses.find(Name) != GlobalAddresses.end()) {
std::string JSName = getJSName(I).substr(1);
if (Name == JSName) { // don't export things that have weird internal names, that C can't dlsym anyhow
NamedGlobals[Name] = getGlobalAddress(Name);
}
}
}
}
}
}
void JSWriter::printFunction(const Function *F) {
ValueNames.clear();
// Prepare and analyze function
UsedVars.clear();
UniqueNum = 0;
// When optimizing, the regular optimizer (mem2reg, SROA, GVN, and others)
// will have already taken all the opportunities for nativization.
if (OptLevel == CodeGenOpt::None)
calculateNativizedVars(F);
// Do alloca coloring at -O1 and higher.
Allocas.analyze(*F, *DL, OptLevel != CodeGenOpt::None);
// Emit the function
std::string Name = F->getName();
sanitizeGlobal(Name);
Out << "function " << Name << "(";
for (Function::const_arg_iterator AI = F->arg_begin(), AE = F->arg_end();
AI != AE; ++AI) {
if (AI != F->arg_begin()) Out << ",";
Out << getJSName(AI);
}
Out << ") {";
nl(Out);
for (Function::const_arg_iterator AI = F->arg_begin(), AE = F->arg_end();
AI != AE; ++AI) {
std::string name = getJSName(AI);
Out << " " << name << " = " << getCast(name, AI->getType(), ASM_NONSPECIFIC) << ";";
nl(Out);
}
printFunctionBody(F);
Out << "}";
nl(Out);
Allocas.clear();
StackBumped = false;
}
void JSWriter::printModuleBody() {
processConstants();
if (Relocatable) {
for (Module::const_alias_iterator I = TheModule->alias_begin(), E = TheModule->alias_end();
I != E; ++I) {
if (const GlobalAlias *GA = dyn_cast<GlobalAlias>(I)) {
const Value* Target = resolveFully(GA);
Aliases[getJSName(GA)] = getJSName(Target);
}
}
}
// Emit function bodies.
nl(Out) << "// EMSCRIPTEN_START_FUNCTIONS"; nl(Out);
for (Module::const_iterator I = TheModule->begin(), E = TheModule->end();
I != E; ++I) {
if (!I->isDeclaration()) printFunction(I);
}
// Emit postSets, split into smaller functions to avoid one massive function that is slow to compile (more likely with dynamic linking, which produces more postSets)
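// With CHUNK = 100, e.g. 250 postSets produce runPostSets() (entries 0..99),
// which calls runPostSets1() (100..199), which calls runPostSets2() (200..249).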
{
const int CHUNK = 100;
int i = 0;
int chunk = 0;
int num = PostSets.size();
do {
if (chunk == 0) {
Out << "function runPostSets() {\n";
} else {
Out << "function runPostSets" << chunk << "() {\n";
}
if (Relocatable) Out << " var temp = 0;\n"; // need a temp var for relocation calls, for proper validation in heap growth
int j = i + CHUNK;
if (j > num) j = num;
while (i < j) {
Out << PostSets[i] << "\n";
i++;
}
// call the next chunk, if there is one
chunk++;
if (i < num) {
Out << " runPostSets" << chunk << "();\n";
}
Out << "}\n";
} while (i < num);
PostSets.clear();
}
Out << "// EMSCRIPTEN_END_FUNCTIONS\n\n";
if (EnablePthreads) {
Out << "if (!ENVIRONMENT_IS_PTHREAD) {\n";
}
Out << "/* memory initializer */ allocate([";
if (MaxGlobalAlign > 0) {
bool First = true;
for (int i = 0; i < GlobalBasePadding; i++) {
if (First) {
First = false;
} else {
Out << ",";
}
Out << "0";
}
int Curr = MaxGlobalAlign;
while (Curr > 0) {
if (GlobalDataMap.find(Curr) == GlobalDataMap.end()) {
Curr = Curr/2;
continue;
}
HeapData* GlobalData = &GlobalDataMap[Curr];
if (GlobalData->size() > 0) {
if (First) {
First = false;
} else {
Out << ",";
}
printCommaSeparated(*GlobalData);
}
Curr = Curr/2;
}
}
Out << "], \"i8\", ALLOC_NONE, Runtime.GLOBAL_BASE);\n";
if (EnablePthreads) {
Out << "}\n";
}
// Emit metadata for emcc driver
Out << "\n\n// EMSCRIPTEN_METADATA\n";
Out << "{\n";
Out << "\"declares\": [";
bool first = true;
for (Module::const_iterator I = TheModule->begin(), E = TheModule->end();
I != E; ++I) {
if (I->isDeclaration() && !I->use_empty()) {
// Ignore intrinsics that are always no-ops or expanded into other code
// which doesn't require the intrinsic function itself to be declared.
if (I->isIntrinsic()) {
switch (I->getIntrinsicID()) {
case Intrinsic::dbg_declare:
case Intrinsic::dbg_value:
case Intrinsic::lifetime_start:
case Intrinsic::lifetime_end:
case Intrinsic::invariant_start:
case Intrinsic::invariant_end:
case Intrinsic::prefetch:
case Intrinsic::memcpy:
case Intrinsic::memset:
case Intrinsic::memmove:
case Intrinsic::expect:
case Intrinsic::flt_rounds:
continue;
}
}
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << I->getName() << "\"";
}
}
for (NameSet::const_iterator I = Declares.begin(), E = Declares.end();
I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << *I << "\"";
}
Out << "],";
Out << "\"redirects\": {";
first = true;
for (StringMap::const_iterator I = Redirects.begin(), E = Redirects.end();
I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"_" << I->first << "\": \"" << I->second << "\"";
}
Out << "},";
Out << "\"externs\": [";
first = true;
for (NameSet::const_iterator I = Externals.begin(), E = Externals.end();
I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << *I << "\"";
}
Out << "],";
Out << "\"implementedFunctions\": [";
first = true;
for (Module::const_iterator I = TheModule->begin(), E = TheModule->end();
I != E; ++I) {
if (!I->isDeclaration()) {
if (first) {
first = false;
} else {
Out << ", ";
}
std::string name = I->getName();
sanitizeGlobal(name);
Out << "\"" << name << '"';
}
}
Out << "],";
Out << "\"tables\": {";
unsigned Num = FunctionTables.size();
for (FunctionTableMap::iterator I = FunctionTables.begin(), E = FunctionTables.end(); I != E; ++I) {
Out << " \"" << I->first << "\": \"var FUNCTION_TABLE_" << I->first << " = [";
FunctionTable &Table = I->second;
// ensure power of two
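// e.g. a table with 5 entries is padded with "0" entries up to size 8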
unsigned Size = 1;
while (Size < Table.size()) Size <<= 1;
while (Table.size() < Size) Table.push_back("0");
for (unsigned i = 0; i < Table.size(); i++) {
Out << Table[i];
if (i < Table.size()-1) Out << ",";
}
Out << "];\"";
if (--Num > 0) Out << ",";
Out << "\n";
}
Out << "},";
Out << "\"initializers\": [";
first = true;
for (unsigned i = 0; i < GlobalInitializers.size(); i++) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << GlobalInitializers[i] << "\"";
}
Out << "],";
Out << "\"exports\": [";
first = true;
for (unsigned i = 0; i < Exports.size(); i++) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << Exports[i] << "\"";
}
Out << "],";
Out << "\"aliases\": {";
first = true;
for (StringMap::const_iterator I = Aliases.begin(), E = Aliases.end();
I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << I->first << "\": \"" << I->second << "\"";
}
Out << "},";
Out << "\"cantValidate\": \"" << CantValidate << "\",";
Out << "\"simd\": " << (UsesSIMDInt8x16 || UsesSIMDInt8x16 || UsesSIMDInt32x4 || UsesSIMDFloat32x4 || UsesSIMDFloat64x2 ? "1" : "0") << ",";
Out << "\"simdInt8x16\": " << (UsesSIMDInt8x16 ? "1" : "0") << ",";
Out << "\"simdInt16x8\": " << (UsesSIMDInt16x8 ? "1" : "0") << ",";
Out << "\"simdInt32x4\": " << (UsesSIMDInt32x4 ? "1" : "0") << ",";
Out << "\"simdFloat32x4\": " << (UsesSIMDFloat32x4 ? "1" : "0") << ",";
Out << "\"simdFloat64x2\": " << (UsesSIMDFloat64x2 ? "1" : "0") << ",";
Out << "\"maxGlobalAlign\": " << utostr(MaxGlobalAlign) << ",";
Out << "\"namedGlobals\": {";
first = true;
for (NameIntMap::const_iterator I = NamedGlobals.begin(), E = NamedGlobals.end(); I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << I->first << "\": \"" << utostr(I->second) << "\"";
}
Out << "},";
Out << "\"asmConsts\": {";
first = true;
for (NameIntMap::const_iterator I = AsmConsts.begin(), E = AsmConsts.end(); I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << utostr(I->second) << "\": \"" << I->first.c_str() << "\"";
}
Out << "},";
Out << "\"asmConstArities\": {";
first = true;
for (IntIntMap::const_iterator I = AsmConstArities.begin(), E = AsmConstArities.end();
I != E; ++I) {
if (first) {
first = false;
} else {
Out << ", ";
}
Out << "\"" << utostr(I->first) << "\": " << utostr(I->second) << "";
}
Out << "}";
Out << "\n}\n";
}
void JSWriter::parseConstant(const std::string& name, const Constant* CV, int Alignment, bool calculate) {
if (isa<GlobalValue>(CV))
return;
if (Alignment == 0) Alignment = DEFAULT_MEM_ALIGN;
//errs() << "parsing constant " << name << " : " << Alignment << "\n";
// TODO: we repeat some work in both calculate and emit phases here
// FIXME: use the proper optimal alignments
if (const ConstantDataSequential *CDS =
dyn_cast<ConstantDataSequential>(CV)) {
assert(CDS->isString());
if (calculate) {
HeapData *GlobalData = allocateAddress(name, Alignment);
StringRef Str = CDS->getAsString();
ensureAligned(Alignment, GlobalData);
for (unsigned int i = 0; i < Str.size(); i++) {
GlobalData->push_back(Str.data()[i]);
}
}
} else if (const ConstantFP *CFP = dyn_cast<ConstantFP>(CV)) {
APFloat APF = CFP->getValueAPF();
if (CFP->getType() == Type::getFloatTy(CFP->getContext())) {
if (calculate) {
HeapData *GlobalData = allocateAddress(name, Alignment);
union flt { float f; unsigned char b[sizeof(float)]; } flt;
flt.f = APF.convertToFloat();
ensureAligned(Alignment, GlobalData);
for (unsigned i = 0; i < sizeof(float); ++i) {
GlobalData->push_back(flt.b[i]);
}
}
} else if (CFP->getType() == Type::getDoubleTy(CFP->getContext())) {
if (calculate) {
HeapData *GlobalData = allocateAddress(name, Alignment);
union dbl { double d; unsigned char b[sizeof(double)]; } dbl;
dbl.d = APF.convertToDouble();
ensureAligned(Alignment, GlobalData);
for (unsigned i = 0; i < sizeof(double); ++i) {
GlobalData->push_back(dbl.b[i]);
}
}
} else {
assert(false && "Unsupported floating-point type");
}
} else if (const ConstantInt *CI = dyn_cast<ConstantInt>(CV)) {
if (calculate) {
union { uint64_t i; unsigned char b[sizeof(uint64_t)]; } integer;
integer.i = *CI->getValue().getRawData();
unsigned BitWidth = 64; // CI->getValue().getBitWidth();
assert(BitWidth == 32 || BitWidth == 64);
HeapData *GlobalData = allocateAddress(name, Alignment);
// assuming compiler is little endian
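// e.g. the 32-bit value 0x12345678 is pushed as the bytes 0x78, 0x56, 0x34, 0x12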
ensureAligned(Alignment, GlobalData);
for (unsigned i = 0; i < BitWidth / 8; ++i) {
GlobalData->push_back(integer.b[i]);
}
}
} else if (isa<ConstantPointerNull>(CV)) {
assert(false && "Unlowered ConstantPointerNull");
} else if (isa<ConstantAggregateZero>(CV)) {
if (calculate) {
unsigned Bytes = DL->getTypeStoreSize(CV->getType());
HeapData *GlobalData = allocateAddress(name, Alignment);
ensureAligned(Alignment, GlobalData);
for (unsigned i = 0; i < Bytes; ++i) {
GlobalData->push_back(0);
}
// FIXME: create a zero section at the end, avoid filling meminit with zeros
}
  } else if (const ConstantArray *CA = dyn_cast<ConstantArray>(CV)) {
    if (calculate) {
      for (Constant::const_user_iterator UI = CV->user_begin(), UE = CV->user_end(); UI != UE; ++UI) {
        if ((*UI)->getName() == "llvm.used") {
          // export the kept-alive functions
          for (unsigned i = 0; i < CA->getNumOperands(); i++) {
            const Constant *C = CA->getOperand(i);
            if (const ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
              C = CE->getOperand(0); // ignore bitcasts
            }
            if (isa<Function>(C)) Exports.push_back(getJSName(C));
          }
        } else if ((*UI)->getName() == "llvm.global.annotations") {
          // llvm.global.annotations can be ignored.
        } else {
          llvm_unreachable("Unexpected constant array");
        }
        break; // we assume a single use here
      }
    }
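    // For example (assumed IR), keeping a function alive via
    //   @llvm.used = appending global [1 x i8*] [i8* bitcast (void ()* @foo to i8*)]
    // adds @foo to the list of exported functions.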
  } else if (const ConstantStruct *CS = dyn_cast<ConstantStruct>(CV)) {
    if (name == "__init_array_start") {
      // this is the list of global static initializers
      if (calculate) {
        unsigned Num = CS->getNumOperands();
        for (unsigned i = 0; i < Num; i++) {
          const Value* C = CS->getOperand(i);
          if (const ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
            C = CE->getOperand(0); // ignore bitcasts
          }
          GlobalInitializers.push_back(getJSName(C));
        }
      }
    } else if (calculate) {
      HeapData *GlobalData = allocateAddress(name, Alignment);
      unsigned Bytes = DL->getTypeStoreSize(CV->getType());
      ensureAligned(Alignment, GlobalData);
      for (unsigned i = 0; i < Bytes; ++i) {
        GlobalData->push_back(0);
      }
    } else {
      // Per the PNaCl ABI, this must be a packed struct of a very specific type:
      // https://chromium.googlesource.com/native_client/pnacl-llvm/+/7287c45c13dc887cebe3db6abfa2f1080186bb97/lib/Transforms/NaCl/FlattenGlobals.cpp
      assert(CS->getType()->isPacked());
      // This is the only kind of constant we cannot emit entirely during the
      // first ('calculate') phase, because its fields may refer to the
      // addresses of other globals, which are only known once that phase ends.
      unsigned Num = CS->getNumOperands();
      unsigned Offset = getRelativeGlobalAddress(name);
      unsigned OffsetStart = Offset;
      unsigned Absolute = getGlobalAddress(name);
      for (unsigned i = 0; i < Num; i++) {
        const Constant* C = CS->getOperand(i);
        if (isa<ConstantAggregateZero>(C)) {
          unsigned Bytes = DL->getTypeStoreSize(C->getType());
          Offset += Bytes; // zeros, so just skip
        } else if (const ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
          const Value *V = CE->getOperand(0);
          unsigned Data = 0;
          if (CE->getOpcode() == Instruction::PtrToInt) {
            Data = getConstAsOffset(V, Absolute + Offset - OffsetStart);
          } else if (CE->getOpcode() == Instruction::Add) {
            V = cast<ConstantExpr>(V)->getOperand(0);
            Data = getConstAsOffset(V, Absolute + Offset - OffsetStart);
            ConstantInt *CI = cast<ConstantInt>(CE->getOperand(1));
            Data += *CI->getValue().getRawData();
          } else {
            CE->dump();
            llvm_unreachable("Unexpected constant expr kind");
          }
          union { unsigned i; unsigned char b[sizeof(unsigned)]; } integer;
          integer.i = Data;
          HeapData& GlobalData = GlobalDataMap[Alignment];
          assert(Offset+4 <= GlobalData.size());
          ensureAligned(Alignment, GlobalData);
          for (unsigned i = 0; i < 4; ++i) {
            GlobalData[Offset++] = integer.b[i];
          }
        } else if (const ConstantDataSequential *CDS = dyn_cast<ConstantDataSequential>(C)) {
          assert(CDS->isString());
          StringRef Str = CDS->getAsString();
          HeapData& GlobalData = GlobalDataMap[Alignment];
          assert(Offset+Str.size() <= GlobalData.size());
          ensureAligned(Alignment, GlobalData);
          for (unsigned int i = 0; i < Str.size(); i++) {
            GlobalData[Offset++] = Str.data()[i];
          }
        } else {
          C->dump();
          llvm_unreachable("Unexpected constant kind");
        }
      }
    }
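    // Illustration (assumed IR): after FlattenGlobals, a pointer-holding global
    // typically looks like a packed struct such as
    //   @table = global <{ i32, [4 x i8] }>
    //            <{ i32 ptrtoint (void ()* @f to i32), [4 x i8] zeroinitializer }>
    // The ptrtoint field is filled in here, in the second phase, once @f's
    // final address (or function table index) is known.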
  } else if (isa<ConstantVector>(CV)) {
    assert(false && "Unlowered ConstantVector");
  } else if (isa<BlockAddress>(CV)) {
    assert(false && "Unlowered BlockAddress");
  } else if (const ConstantExpr *CE = dyn_cast<ConstantExpr>(CV)) {
    if (name == "__init_array_start") {
      // this is the global static initializer
      if (calculate) {
        const Value *V = CE->getOperand(0);
        GlobalInitializers.push_back(getJSName(V)); // the operand is the initializer function itself
      }
    } else if (name == "__fini_array_start") {
      // nothing to do
    } else {
      // a global initialized to a ptrtoint (possibly plus an offset), i.e. a 32-bit integer for us
      if (calculate) {
        HeapData *GlobalData = allocateAddress(name, Alignment);
        ensureAligned(Alignment, GlobalData);
        for (unsigned i = 0; i < 4; ++i) {
          GlobalData->push_back(0);
        }
      } else {
        unsigned Data = 0;
        // Deconstruct lowered getelementptrs.
        if (CE->getOpcode() == Instruction::Add) {
          Data = cast<ConstantInt>(CE->getOperand(1))->getZExtValue();
          CE = cast<ConstantExpr>(CE->getOperand(0));
        }
        const Value *V = CE;
        if (CE->getOpcode() == Instruction::PtrToInt) {
          V = CE->getOperand(0);
        }
        // Deconstruct getelementptrs.
        int64_t BaseOffset;
        V = GetPointerBaseWithConstantOffset(V, BaseOffset, *DL);
        Data += (uint64_t)BaseOffset;
        Data += getConstAsOffset(V, getGlobalAddress(name));
        union { unsigned i; unsigned char b[sizeof(unsigned)]; } integer;
        integer.i = Data;
        unsigned Offset = getRelativeGlobalAddress(name);
        HeapData& GlobalData = GlobalDataMap[Alignment];
        assert(Offset+4 <= GlobalData.size());
        ensureAligned(Alignment, GlobalData);
        for (unsigned i = 0; i < 4; ++i) {
          GlobalData[Offset++] = integer.b[i];
        }
      }
    }
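    // For example (assumed IR), a lowered function-pointer global like
    //   @fp = global i32 add (i32 ptrtoint (void ()* @f to i32), i32 8)
    // is emitted as a 32-bit slot holding @f's address plus 8.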
  } else if (isa<UndefValue>(CV)) {
    assert(false && "Unlowered UndefValue");
  } else {
    CV->dump();
    assert(false && "Unsupported constant kind");
  }
}

// nativization

void JSWriter::calculateNativizedVars(const Function *F) {
  NativizedVars.clear();

  for (Function::const_iterator BI = F->begin(), BE = F->end(); BI != BE; ++BI) {
    for (BasicBlock::const_iterator II = BI->begin(), E = BI->end(); II != E; ++II) {
      const Instruction *I = &*II;
      if (const AllocaInst *AI = dyn_cast<const AllocaInst>(I)) {
        if (AI->getAllocatedType()->isVectorTy()) continue; // we do not nativize vectors; we rely on the LLVM optimizer to avoid loads/stores on them
        if (AI->getAllocatedType()->isAggregateType()) continue; // we do not nativize aggregates either
        // this alloca is on the stack; if its address is never taken and never escapes, we can nativize it
        bool Fail = false;
        for (Instruction::const_user_iterator UI = I->user_begin(), UE = I->user_end(); UI != UE && !Fail; ++UI) {
          const Instruction *U = dyn_cast<Instruction>(*UI);
          if (!U) { Fail = true; break; } // not an instruction, not cool
          switch (U->getOpcode()) {
            case Instruction::Load: break; // load is cool
            case Instruction::Store: {
              if (U->getOperand(0) == I) Fail = true; // a store *of* it is not cool; a store *to* it is fine
              break;
            }
            default: { Fail = true; break; } // anything else is not cool
          }
        }
        if (!Fail) NativizedVars.insert(I);
      }
    }
  }
}
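
// For example (assumed IR), in
//   %x = alloca i32
//   store i32 1, i32* %x
//   %v = load i32, i32* %x
// %x is only loaded from and stored to, so it can be nativized into a plain
// local JS variable; if %x itself were passed to a call or stored to memory,
// its address would escape and it would have to stay in the heap.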

// special analyses

bool JSWriter::canReloop(const Function *F) {
  return true; // we never bail out of relooping; the Relooper handles all the control flow we emit
}

// main entry

void JSWriter::printCommaSeparated(const HeapData data) {
  for (HeapData::const_iterator I = data.begin();
       I != data.end(); ++I) {
    if (I != data.begin()) {
      Out << ",";
    }
    Out << (int)*I;
  }
}
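
// For example, a heap image holding the bytes {104, 105, 0} prints as
// "104,105,0", e.g. for embedding in a JS array literal in the output.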

void JSWriter::printProgram(const std::string& fname,
                            const std::string& mName) {
  printModule(fname, mName);
}

void JSWriter::printModule(const std::string& fname,
                           const std::string& mName) {
  printModuleBody();
}

bool JSWriter::runOnModule(Module &M) {
  TheModule = &M;
  DL = &M.getDataLayout();

  // sanity-check the options
  assert(!Relocatable || GlobalBase == 0);
  assert(!Relocatable || EmulatedFunctionPointers);

  setupCallHandlers();
  printProgram("", "");
  return false;
}

char JSWriter::ID = 0;

class CheckTriple : public ModulePass {
public:
  static char ID;
  CheckTriple() : ModulePass(ID) {}
  bool runOnModule(Module &M) override {
    if (M.getTargetTriple() != "asmjs-unknown-emscripten") {
      prettyWarning() << "incorrect target triple '" << M.getTargetTriple()
                      << "' (did you use emcc/em++ on all source files and not clang directly?)\n";
    }
    return false;
  }
};
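
// For example, linking in a file compiled with plain clang (say, with triple
// x86_64-unknown-linux-gnu) produces a warning along the lines of:
//   warning: incorrect target triple 'x86_64-unknown-linux-gnu' (did you use
//   emcc/em++ on all source files and not clang directly?)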

char CheckTriple::ID;

Pass *createCheckTriplePass() {
  return new CheckTriple();
}

//===----------------------------------------------------------------------===//
//                       External Interface declaration
//===----------------------------------------------------------------------===//

bool JSTargetMachine::addPassesToEmitFile(PassManagerBase &PM,
                                          raw_pwrite_stream &o,
                                          CodeGenFileType FileType,
                                          bool DisableVerify,
                                          AnalysisID StartAfter,
                                          AnalysisID StopAfter) {
  assert(FileType == TargetMachine::CGFT_AssemblyFile);

  PM.add(createCheckTriplePass());

  PM.add(createExpandInsertExtractElementPass());
  PM.add(createExpandI64Pass());

  CodeGenOpt::Level OptLevel = getOptLevel();
  // When optimizing, there shouldn't be any opportunities for SimplifyAllocas,
  // because the regular optimizer should already have taken them all (GVN, and
  // possibly also SROA).
  if (OptLevel == CodeGenOpt::None)
    PM.add(createEmscriptenSimplifyAllocasPass());
  PM.add(createEmscriptenRemoveLLVMAssumePass());
  PM.add(createEmscriptenExpandBigSwitchesPass());

  PM.add(new JSWriter(o, OptLevel));

  return false;
}
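
// A minimal sketch of how a driver reaches this entry point (hypothetical
// driver code, assuming the usual llc-style setup; not part of this backend):
//
//   legacy::PassManager PM;
//   std::error_code EC;
//   raw_fd_ostream OS("out.js", EC, sys::fs::F_None);
//   if (TM->addPassesToEmitFile(PM, OS, TargetMachine::CGFT_AssemblyFile,
//                               /*DisableVerify=*/false, nullptr, nullptr))
//     report_fatal_error("JS backend cannot emit this file type");
//   PM.run(*M); // runs the lowering passes above, then JSWriter prints the JS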