mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-10-30 16:17:05 +00:00 
			
		
		
		
	For PR1284:
Implement the "part_set" intrinsic. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@35938 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
		| @@ -203,12 +203,15 @@ def int_siglongjmp : Intrinsic<[llvm_void_ty, llvm_ptr_ty, llvm_i32_ty]>; | |||||||
|  |  | ||||||
| // None of these intrinsics accesses memory at all. | // None of these intrinsics accesses memory at all. | ||||||
| let Properties = [IntrNoMem] in { | let Properties = [IntrNoMem] in { | ||||||
|   def int_part_select :  |  | ||||||
|      Intrinsic<[llvm_int_ty, llvm_int_ty, llvm_i32_ty, llvm_i32_ty]>; |  | ||||||
|   def int_bswap: Intrinsic<[llvm_int_ty, llvm_int_ty]>; |   def int_bswap: Intrinsic<[llvm_int_ty, llvm_int_ty]>; | ||||||
|   def int_ctpop: Intrinsic<[llvm_i32_ty, llvm_int_ty]>; |   def int_ctpop: Intrinsic<[llvm_i32_ty, llvm_int_ty]>; | ||||||
|   def int_ctlz : Intrinsic<[llvm_i32_ty, llvm_int_ty]>; |   def int_ctlz : Intrinsic<[llvm_i32_ty, llvm_int_ty]>; | ||||||
|   def int_cttz : Intrinsic<[llvm_i32_ty, llvm_int_ty]>; |   def int_cttz : Intrinsic<[llvm_i32_ty, llvm_int_ty]>; | ||||||
|  |   def int_part_select :  | ||||||
|  |      Intrinsic<[llvm_int_ty, llvm_int_ty, llvm_i32_ty, llvm_i32_ty]>; | ||||||
|  |   def int_part_set : | ||||||
|  |      Intrinsic<[llvm_int_ty, llvm_int_ty, llvm_int_ty, llvm_i32_ty,  | ||||||
|  |                 llvm_i32_ty]>; | ||||||
| } | } | ||||||
|  |  | ||||||
| //===------------------------ Debugger Intrinsics -------------------------===// | //===------------------------ Debugger Intrinsics -------------------------===// | ||||||
|   | |||||||
| @@ -236,14 +236,17 @@ static Value *LowerCTLZ(Value *V, Instruction *IP) { | |||||||
|   return LowerCTPOP(V, IP); |   return LowerCTPOP(V, IP); | ||||||
| } | } | ||||||
|  |  | ||||||
| /// Convert the llvm.bit.part_select.iX.iY.iZ intrinsic. This intrinsic takes  | /// Convert the llvm.part.select.iX.iY intrinsic. This intrinsic takes  | ||||||
| /// three integer operands of arbitrary bit width. The first operand is the  | /// three integer arguments. The first argument is the Value from which the | ||||||
| /// value from which to select the bits. The second and third operands define a  | /// bits will be selected. It may be of any bit width. The second and third | ||||||
| /// range of bits to select.  The result is the bits selected and has a  | /// arguments specify a range of bits to select with the second argument  | ||||||
| /// corresponding width of Left-Right (second operand - third operand). | /// specifying the low bit and the third argument specifying the high bit. Both | ||||||
| /// @see IEEE 1666-2005, System C, Section 7.2.6, pg 175.  | /// must be type i32. The result is the corresponding selected bits from the | ||||||
| /// @brief Lowering of llvm.bit.part_select intrinsic. | /// Value in the same width as the Value (first argument). If the low bit index | ||||||
| static Instruction *LowerBitPartSelect(CallInst *CI) { | /// is higher than the high bit index then the inverse selection is done and  | ||||||
|  | /// the bits are returned in inverse order.  | ||||||
|  | /// @brief Lowering of llvm.part.select intrinsic. | ||||||
|  | static Instruction *LowerPartSelect(CallInst *CI) { | ||||||
|   // Make sure we're dealing with a part select intrinsic here |   // Make sure we're dealing with a part select intrinsic here | ||||||
|   Function *F = CI->getCalledFunction(); |   Function *F = CI->getCalledFunction(); | ||||||
|   const FunctionType *FT = F->getFunctionType(); |   const FunctionType *FT = F->getFunctionType(); | ||||||
| @@ -268,8 +271,8 @@ static Instruction *LowerBitPartSelect(CallInst *CI) { | |||||||
|  |  | ||||||
|     // Get the arguments to the function |     // Get the arguments to the function | ||||||
|     Value* Val = F->getOperand(0); |     Value* Val = F->getOperand(0); | ||||||
|     Value* Left = F->getOperand(1); |     Value* Right = F->getOperand(1); | ||||||
|     Value* Right = F->getOperand(2); |     Value* Left = F->getOperand(2); | ||||||
|  |  | ||||||
|     // We want to select a range of bits here such that [Left, Right] is shifted |     // We want to select a range of bits here such that [Left, Right] is shifted | ||||||
|     // down to the low bits. However, it is quite possible that Left is smaller |     // down to the low bits. However, it is quite possible that Left is smaller | ||||||
| @@ -406,6 +409,181 @@ static Instruction *LowerBitPartSelect(CallInst *CI) { | |||||||
|   return new CallInst(F, Args, 3, CI->getName(), CI); |   return new CallInst(F, Args, 3, CI->getName(), CI); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | /// Convert the llvm.part.set.iX.iY.iZ intrinsic. This intrinsic takes  | ||||||
|  | /// four integer arguments (iAny %Value, iAny %Replacement, i32 %Low, i32 %High) | ||||||
|  | /// The first two arguments can be any bit width. The result is the same width | ||||||
|  | /// as %Value. The operation replaces bits between %Low and %High with the value | ||||||
|  | /// in %Replacement. If %Replacement is not the same width, it is truncated or | ||||||
|  | /// zero extended as appropriate to fit the bits being replaced. If %Low is | ||||||
|  | /// greater than %High then the inverse set of bits are replaced. | ||||||
|  | /// @brief Lowering of llvm.bit.part.set intrinsic. | ||||||
|  | static Instruction *LowerPartSet(CallInst *CI) { | ||||||
|  |   // Make sure we're dealing with a part select intrinsic here | ||||||
|  |   Function *F = CI->getCalledFunction(); | ||||||
|  |   const FunctionType *FT = F->getFunctionType(); | ||||||
|  |   if (!F->isDeclaration() || !FT->getReturnType()->isInteger() || | ||||||
|  |       FT->getNumParams() != 4 || !FT->getParamType(0)->isInteger() || | ||||||
|  |       !FT->getParamType(1)->isInteger() || !FT->getParamType(2)->isInteger() || | ||||||
|  |       !FT->getParamType(3)->isInteger()) | ||||||
|  |     return CI; | ||||||
|  |  | ||||||
|  |   // Get the intrinsic implementation function by converting all the . to _ | ||||||
|  |   // in the intrinsic's function name and then reconstructing the function | ||||||
|  |   // declaration. | ||||||
|  |   std::string Name(F->getName()); | ||||||
|  |   for (unsigned i = 4; i < Name.length(); ++i) | ||||||
|  |     if (Name[i] == '.') | ||||||
|  |       Name[i] = '_'; | ||||||
|  |   Module* M = F->getParent(); | ||||||
|  |   F = cast<Function>(M->getOrInsertFunction(Name, FT)); | ||||||
|  |   F->setLinkage(GlobalValue::InternalLinkage); | ||||||
|  |  | ||||||
|  |   // If we haven't defined the impl function yet, do so now | ||||||
|  |   if (F->isDeclaration()) { | ||||||
|  |     // Note: the following code is based on code generated by llvm2cpp with  | ||||||
|  |     // the following input. This is just *one* example of a generated function. | ||||||
|  |     // The functions vary by bit width of result and first two arguments. | ||||||
|  |     // The generated code has been changed to deal with any bit width not just | ||||||
|  |     // the 32/64 bitwidths used in the above sample. | ||||||
|  |     // | ||||||
|  |     // define i64 @part_set(i64 %Val, i32 %Rep, i32 %Lo, i32 %Hi) { | ||||||
|  |     // entry: | ||||||
|  |     //   %is_forward = icmp ult i32 %Lo, %Hi | ||||||
|  |     //   %Lo.pn = select i1 %is_forward, i32 %Hi, i32 %Lo | ||||||
|  |     //   %Hi.pn = select i1 %is_forward, i32 %Lo, i32 %Hi | ||||||
|  |     //   %iftmp.16.0 = sub i32 %Lo.pn, %Hi.pn | ||||||
|  |     //   icmp ult i32 %iftmp.16.0, 32 | ||||||
|  |     //   br i1 %1, label %cond_true11, label %cond_next19 | ||||||
|  |     // cond_true11: | ||||||
|  |     //   %tmp13 = sub i32 32, %iftmp.16.0 | ||||||
|  |     //   %tmp14 = lshr i32 -1, %tmp13 | ||||||
|  |     //   %tmp16 = and i32 %tmp14, %Rep | ||||||
|  |     //   br label %cond_next19 | ||||||
|  |     // cond_next19: | ||||||
|  |     //   %iftmp.17.0 = phi i32 [ %tmp16, %cond_true11 ], [ %Rep, %entry ] | ||||||
|  |     //   %tmp2021 = zext i32 %iftmp.17.0 to i64 | ||||||
|  |     //   icmp ugt i32 %Lo, %Hi | ||||||
|  |     //   br i1 %2, label %cond_next60, label %cond_true24 | ||||||
|  |     // cond_true24: | ||||||
|  |     //   %tmp25.cast = zext i32 %Hi to i64 | ||||||
|  |     //   %tmp26 = lshr i64 -1, %tmp25.cast | ||||||
|  |     //   %tmp27.cast = zext i32 %Lo to i64 | ||||||
|  |     //   %tmp28 = shl i64 %tmp26, %tmp27.cast | ||||||
|  |     //   %tmp28not = xor i64 %tmp28, -1 | ||||||
|  |     //   %tmp31 = shl i64 %tmp2021, %tmp27.cast | ||||||
|  |     //   %tmp34 = and i64 %tmp28not, %Val | ||||||
|  |     //   %Val_addr.064 = or i64 %tmp31, %tmp34 | ||||||
|  |     //   ret i64 %Val_addr.064 | ||||||
|  |     // cond_next60: | ||||||
|  |     //   %tmp39.cast = zext i32 %Lo to i64 | ||||||
|  |     //   %tmp40 = shl i64 -1, %tmp39.cast | ||||||
|  |     //   %tmp41.cast = zext i32 %Hi to i64 | ||||||
|  |     //   %tmp42 = shl i64 -1, %tmp41.cast | ||||||
|  |     //   %tmp45.demorgan = or i64 %tmp42, %tmp40 | ||||||
|  |     //   %tmp45 = xor i64 %tmp45.demorgan, -1 | ||||||
|  |     //   %tmp47 = and i64 %tmp45, %Val | ||||||
|  |     //   %tmp50 = shl i64 %tmp2021, %tmp39.cast | ||||||
|  |     //   %tmp52 = sub i32 32, %Hi | ||||||
|  |     //   %tmp52.cast = zext i32 %tmp52 to i64 | ||||||
|  |     //   %tmp54 = lshr i64 %tmp2021, %tmp52.cast | ||||||
|  |     //   %tmp57 = or i64 %tmp50, %tmp47 | ||||||
|  |     //   %Val_addr.0 = or i64 %tmp57, %tmp54 | ||||||
|  |     //   ret i64 %Val_addr.0 | ||||||
|  |     // } | ||||||
|  |  | ||||||
|  |     // Get the arguments for the function. | ||||||
|  |     Function::arg_iterator args = F->arg_begin(); | ||||||
|  |     Value* Val = args++; Val->setName("Val"); | ||||||
|  |     Value* Rep = args++; Rep->setName("Rep"); | ||||||
|  |     Value* Lo  = args++; Lo->setName("Lo"); | ||||||
|  |     Value* Hi  = args++; Hi->setName("Hi"); | ||||||
|  |  | ||||||
|  |     // Get some types we need | ||||||
|  |     const IntegerType* ValTy = cast<IntegerType>(Val->getType()); | ||||||
|  |     const IntegerType* RepTy = cast<IntegerType>(Rep->getType()); | ||||||
|  |     uint32_t ValBits = ValTy->getBitWidth(); | ||||||
|  |     uint32_t RepBits = RepTy->getBitWidth(); | ||||||
|  |  | ||||||
|  |     // Constant Definitions | ||||||
|  |     ConstantInt* RepBitWidth = ConstantInt::get(Type::Int32Ty, RepBits); | ||||||
|  |     ConstantInt* RepMask = ConstantInt::getAllOnesValue(RepTy); | ||||||
|  |     ConstantInt* ValMask = ConstantInt::getAllOnesValue(ValTy); | ||||||
|  |  | ||||||
|  |     BasicBlock* entry = new BasicBlock("entry",F,0); | ||||||
|  |     BasicBlock* large = new BasicBlock("large",F,0); | ||||||
|  |     BasicBlock* small = new BasicBlock("small",F,0); | ||||||
|  |     BasicBlock* forward = new BasicBlock("cond_true24",F,0); | ||||||
|  |     BasicBlock* reverse = new BasicBlock("cond_next60",F,0); | ||||||
|  |  | ||||||
|  |     // Block entry (entry) | ||||||
|  |     // First, convert Lo and Hi to ValTy bit width | ||||||
|  |     if (ValBits > 32) { | ||||||
|  |       Hi = new ZExtInst(Hi, ValTy, "", entry); | ||||||
|  |       Lo = new ZExtInst(Lo, ValTy, "", entry); | ||||||
|  |     } else if (ValBits < 32) { | ||||||
|  |       Hi = new TruncInst(Hi, ValTy, "", entry); | ||||||
|  |       Lo = new TruncInst(Lo, ValTy, "", entry); | ||||||
|  |     } | ||||||
|  |     ICmpInst* is_forward =  | ||||||
|  |       new ICmpInst(ICmpInst::ICMP_ULT, Lo, Hi, "", entry); | ||||||
|  |     SelectInst* Lo_pn = new SelectInst(is_forward, Hi, Lo, "", entry); | ||||||
|  |     SelectInst* Hi_pn = new SelectInst(is_forward, Lo, Hi, "", entry); | ||||||
|  |     BinaryOperator* NumBits = BinaryOperator::createSub(Lo_pn, Hi_pn, "",entry); | ||||||
|  |     ICmpInst* is_large =  | ||||||
|  |       new ICmpInst(ICmpInst::ICMP_ULT, NumBits, RepBitWidth, "", entry); | ||||||
|  |     new BranchInst(large, small, is_large, entry); | ||||||
|  |  | ||||||
|  |     // Block "large" | ||||||
|  |     BinaryOperator* MaskBits =  | ||||||
|  |       BinaryOperator::createSub(RepBitWidth, NumBits, "", large); | ||||||
|  |     BinaryOperator* Mask1 =  | ||||||
|  |       BinaryOperator::createLShr(RepMask, MaskBits, "", large); | ||||||
|  |     BinaryOperator* Rep2 = BinaryOperator::createAnd(Mask1, Rep, "", large); | ||||||
|  |     new BranchInst(small, large); | ||||||
|  |  | ||||||
|  |     // Block "small" | ||||||
|  |     PHINode* Rep3 = new PHINode(RepTy, "", small); | ||||||
|  |     Rep3->reserveOperandSpace(2); | ||||||
|  |     Rep3->addIncoming(Rep2, small); | ||||||
|  |     Rep3->addIncoming(Rep, entry); | ||||||
|  |     CastInst* Rep4 = new ZExtInst(Rep3, ValTy, "", small); | ||||||
|  |     ICmpInst* is_reverse =  | ||||||
|  |       new ICmpInst(ICmpInst::ICMP_UGT, Lo, Hi, "", small); | ||||||
|  |     new BranchInst(reverse, forward, is_reverse, small); | ||||||
|  |  | ||||||
|  |     // Block "forward" | ||||||
|  |     Value* t1    = BinaryOperator::createLShr(ValMask, Hi, "", forward); | ||||||
|  |     Value* t2    = BinaryOperator::createShl(t1, Lo, "", forward); | ||||||
|  |     Value* nott2 = BinaryOperator::createXor(t2, ValMask, "", forward); | ||||||
|  |     Value* t3    = BinaryOperator::createShl(Rep4, Lo, "", forward); | ||||||
|  |     Value* t4    = BinaryOperator::createAnd(nott2, Val, "", forward); | ||||||
|  |     Value* FRslt = BinaryOperator::createOr(t3, t4, "", forward); | ||||||
|  |     new ReturnInst(FRslt, forward); | ||||||
|  |  | ||||||
|  |     // Block "reverse" | ||||||
|  |     Value* t5    = BinaryOperator::createShl(ValMask, Lo, "", reverse); | ||||||
|  |     Value* t6    = BinaryOperator::createShl(ValMask, Hi, "", reverse); | ||||||
|  |     Value* t7    = BinaryOperator::createOr(t6, t5, "", reverse); | ||||||
|  |     Value* t8    = BinaryOperator::createXor(t7, ValMask, "", reverse); | ||||||
|  |     Value* t9    = BinaryOperator::createAnd(t8, Val, "", reverse); | ||||||
|  |     Value* t10   = BinaryOperator::createShl(Rep4, Lo, "", reverse); | ||||||
|  |     Value* t11   = BinaryOperator::createSub(RepBitWidth, Hi, "", reverse); | ||||||
|  |     Value* t12   = new ZExtInst(t11, ValTy, "", reverse); | ||||||
|  |     Value* t13   = BinaryOperator::createLShr(Rep4, t12, "",reverse); | ||||||
|  |     Value* t14   = BinaryOperator::createOr(t10, t9, "", reverse); | ||||||
|  |     Value* RRslt = BinaryOperator::createOr(t14, t13, "", reverse); | ||||||
|  |     new ReturnInst(RRslt, reverse); | ||||||
|  |   } | ||||||
|  |  | ||||||
|  |   // Return a call to the implementation function | ||||||
|  |   Value *Args[3]; | ||||||
|  |   Args[0] = CI->getOperand(0); | ||||||
|  |   Args[1] = CI->getOperand(1); | ||||||
|  |   Args[2] = CI->getOperand(2); | ||||||
|  |   Args[3] = CI->getOperand(3); | ||||||
|  |   return new CallInst(F, Args, 4, CI->getName(), CI); | ||||||
|  | } | ||||||
|  |  | ||||||
|  |  | ||||||
| void IntrinsicLowering::LowerIntrinsicCall(CallInst *CI) { | void IntrinsicLowering::LowerIntrinsicCall(CallInst *CI) { | ||||||
|   Function *Callee = CI->getCalledFunction(); |   Function *Callee = CI->getCalledFunction(); | ||||||
| @@ -476,7 +654,11 @@ void IntrinsicLowering::LowerIntrinsicCall(CallInst *CI) { | |||||||
|   } |   } | ||||||
|  |  | ||||||
|   case Intrinsic::part_select: |   case Intrinsic::part_select: | ||||||
|     CI->replaceAllUsesWith(LowerBitPartSelect(CI)); |     CI->replaceAllUsesWith(LowerPartSelect(CI)); | ||||||
|  |     break; | ||||||
|  |  | ||||||
|  |   case Intrinsic::part_set: | ||||||
|  |     CI->replaceAllUsesWith(LowerPartSet(CI)); | ||||||
|     break; |     break; | ||||||
|  |  | ||||||
|   case Intrinsic::stacksave: |   case Intrinsic::stacksave: | ||||||
|   | |||||||
| @@ -2691,7 +2691,12 @@ SelectionDAGLowering::visitIntrinsicCall(CallInst &I, unsigned Intrinsic) { | |||||||
|   } |   } | ||||||
|   case Intrinsic::part_select: { |   case Intrinsic::part_select: { | ||||||
|     // Currently not implemented: just abort |     // Currently not implemented: just abort | ||||||
|     assert(0 && "bit_part_select intrinsic not implemented"); |     assert(0 && "part_select intrinsic not implemented"); | ||||||
|  |     abort(); | ||||||
|  |   } | ||||||
|  |   case Intrinsic::part_set: { | ||||||
|  |     // Currently not implemented: just abort | ||||||
|  |     assert(0 && "part_set intrinsic not implemented"); | ||||||
|     abort(); |     abort(); | ||||||
|   } |   } | ||||||
|   case Intrinsic::bswap: |   case Intrinsic::bswap: | ||||||
|   | |||||||
| @@ -1028,13 +1028,14 @@ void Verifier::VerifyIntrinsicPrototype(Intrinsic::ID ID, Function *F, ...) { | |||||||
|           if (GotBits < 16 || GotBits % 16 != 0) |           if (GotBits < 16 || GotBits % 16 != 0) | ||||||
|             CheckFailed("Intrinsic requires even byte width argument", F); |             CheckFailed("Intrinsic requires even byte width argument", F); | ||||||
|           /* FALL THROUGH */ |           /* FALL THROUGH */ | ||||||
|  |         case Intrinsic::part_set: | ||||||
|         case Intrinsic::part_select: |         case Intrinsic::part_select: | ||||||
|           if (ArgNo == 1) { |           if (ArgNo == 1) { | ||||||
|             unsigned ResultBits =  |             unsigned ResultBits =  | ||||||
|               cast<IntegerType>(FTy->getReturnType())->getBitWidth(); |               cast<IntegerType>(FTy->getReturnType())->getBitWidth(); | ||||||
|             if (GotBits != ResultBits) |             if (GotBits != ResultBits) | ||||||
|               CheckFailed("Intrinsic requires parameter and result bit " |               CheckFailed("Intrinsic requires the bit widths of the first " | ||||||
|                           "widths to match", F); |                           "parameter and the result to match", F); | ||||||
|           } |           } | ||||||
|           break; |           break; | ||||||
|       } |       } | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user