mirror of
https://github.com/c64scene-ar/llvm-6502.git
synced 2025-01-28 06:32:09 +00:00
NEON support for _lane ops, and multiplies by scalar.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@105769 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
db03adb346
commit
4b425a8caa
@ -137,6 +137,7 @@ static char ModType(const char mod, char type, bool &quad, bool &poly,
|
||||
usgn = true;
|
||||
break;
|
||||
case 's':
|
||||
case 'a':
|
||||
scal = true;
|
||||
break;
|
||||
case 'k':
|
||||
@ -442,14 +443,7 @@ static std::string GenArgs(const std::string &proto, StringRef typestr) {
|
||||
return s;
|
||||
}
|
||||
|
||||
// Generate the definition for this intrinsic, e.g. "a + b" for OpAdd.
|
||||
// If structTypes is true, the NEON types are structs of vector types rather
|
||||
// than vector types, and the call becomes "a.val + b.val"
|
||||
static std::string GenOpString(OpKind op, const std::string &proto,
|
||||
StringRef typestr, bool structTypes = true) {
|
||||
std::string ts = TypeString(proto[0], typestr);
|
||||
std::string s = ts + " r; r";
|
||||
|
||||
static std::string Duplicate(StringRef typestr, const std::string &a) {
|
||||
bool dummy, quad = false;
|
||||
char type = ClassifyType(typestr, quad, dummy, dummy);
|
||||
unsigned nElts = 0;
|
||||
@ -463,6 +457,27 @@ static std::string GenOpString(OpKind op, const std::string &proto,
|
||||
}
|
||||
nElts <<= quad;
|
||||
|
||||
std::string s;
|
||||
|
||||
s = "(__neon_" + TypeString('d', typestr) + "){ ";
|
||||
for (unsigned i = 0; i != nElts; ++i) {
|
||||
s += a;
|
||||
if ((i + 1) < nElts)
|
||||
s += ", ";
|
||||
}
|
||||
s += " }";
|
||||
|
||||
return s;
|
||||
}
|
||||
|
||||
// Generate the definition for this intrinsic, e.g. "a + b" for OpAdd.
|
||||
// If structTypes is true, the NEON types are structs of vector types rather
|
||||
// than vector types, and the call becomes "a.val + b.val"
|
||||
static std::string GenOpString(OpKind op, const std::string &proto,
|
||||
StringRef typestr, bool structTypes = true) {
|
||||
std::string ts = TypeString(proto[0], typestr);
|
||||
std::string s = ts + " r; r";
|
||||
|
||||
if (structTypes)
|
||||
s += ".val";
|
||||
|
||||
@ -481,12 +496,18 @@ static std::string GenOpString(OpKind op, const std::string &proto,
|
||||
case OpSub:
|
||||
s += a + " - " + b;
|
||||
break;
|
||||
case OpMulN:
|
||||
b = Duplicate(typestr, "b");
|
||||
case OpMul:
|
||||
s += a + " * " + b;
|
||||
break;
|
||||
case OpMlaN:
|
||||
c = Duplicate(typestr, "c");
|
||||
case OpMla:
|
||||
s += a + " + ( " + b + " * " + c + " )";
|
||||
break;
|
||||
case OpMlsN:
|
||||
c = Duplicate(typestr, "c");
|
||||
case OpMls:
|
||||
s += a + " - ( " + b + " * " + c + " )";
|
||||
break;
|
||||
@ -540,13 +561,7 @@ static std::string GenOpString(OpKind op, const std::string &proto,
|
||||
s += "(__neon_int64x1_t)(((__neon_int64x2_t)" + a + ")[0])";
|
||||
break;
|
||||
case OpDup:
|
||||
s += "(__neon_" + ts + "){ ";
|
||||
for (unsigned i = 0; i != nElts; ++i) {
|
||||
s += a;
|
||||
if ((i + 1) < nElts)
|
||||
s += ", ";
|
||||
}
|
||||
s += " }";
|
||||
s += Duplicate(typestr, a);
|
||||
break;
|
||||
default:
|
||||
throw "unknown OpKind!";
|
||||
@ -649,8 +664,15 @@ static std::string GenBuiltin(const std::string &name, const std::string &proto,
|
||||
}
|
||||
}
|
||||
|
||||
bool splat = proto.find('a') != std::string::npos;
|
||||
|
||||
s += "__builtin_neon_";
|
||||
if (splat) {
|
||||
std::string vname(name, 0, name.size()-2);
|
||||
s += MangleName(vname, typestr, ck);
|
||||
} else {
|
||||
s += MangleName(name, typestr, ck);
|
||||
}
|
||||
s += "(";
|
||||
|
||||
for (unsigned i = 1, e = proto.size(); i != e; ++i, ++arg) {
|
||||
@ -672,12 +694,18 @@ static std::string GenBuiltin(const std::string &name, const std::string &proto,
|
||||
// Parenthesize the args from the macro.
|
||||
if (define)
|
||||
s.push_back('(');
|
||||
|
||||
if (splat && (i + 1) == e)
|
||||
s += Duplicate(typestr, std::string(&arg, 1));
|
||||
else
|
||||
s.push_back(arg);
|
||||
|
||||
// Parenthesize the args from the macro.
|
||||
if (define)
|
||||
s.push_back(')');
|
||||
|
||||
if (structTypes && proto[i] != 's' && proto[i] != 'i' && proto[i] != 'l' &&
|
||||
proto[i] != 'p' && proto[i] != 'c') {
|
||||
proto[i] != 'p' && proto[i] != 'c' && proto[i] != 'a') {
|
||||
s += ".val";
|
||||
}
|
||||
if ((i + 1) < e)
|
||||
@ -748,7 +776,6 @@ void NeonEmitter::run(raw_ostream &OS) {
|
||||
|
||||
// Emit NEON-specific scalar typedefs.
|
||||
// FIXME: probably need to do something better for polynomial types.
|
||||
// FIXME: is this the correct thing to do for float16?
|
||||
OS << "typedef float float32_t;\n";
|
||||
OS << "typedef uint8_t poly8_t;\n";
|
||||
OS << "typedef uint16_t poly16_t;\n";
|
||||
@ -869,6 +896,9 @@ void NeonEmitter::runHeader(raw_ostream &OS) {
|
||||
std::string Proto = R->getValueAsString("Prototype");
|
||||
std::string Types = R->getValueAsString("Types");
|
||||
|
||||
if (Proto.find('a') != std::string::npos)
|
||||
continue;
|
||||
|
||||
SmallVector<StringRef, 16> TypeVec;
|
||||
ParseTypes(R, Types, TypeVec);
|
||||
|
||||
|
@ -28,6 +28,9 @@ enum OpKind {
|
||||
OpMul,
|
||||
OpMla,
|
||||
OpMls,
|
||||
OpMulN,
|
||||
OpMlaN,
|
||||
OpMlsN,
|
||||
OpEq,
|
||||
OpGe,
|
||||
OpLe,
|
||||
@ -70,6 +73,9 @@ namespace llvm {
|
||||
OpMap["OP_MUL"] = OpMul;
|
||||
OpMap["OP_MLA"] = OpMla;
|
||||
OpMap["OP_MLS"] = OpMls;
|
||||
OpMap["OP_MUL_N"] = OpMulN;
|
||||
OpMap["OP_MLA_N"] = OpMlaN;
|
||||
OpMap["OP_MLS_N"] = OpMlsN;
|
||||
OpMap["OP_EQ"] = OpEq;
|
||||
OpMap["OP_GE"] = OpGe;
|
||||
OpMap["OP_LE"] = OpLe;
|
||||
@ -91,11 +97,9 @@ namespace llvm {
|
||||
Record *SI = R.getClass("SInst");
|
||||
Record *II = R.getClass("IInst");
|
||||
Record *WI = R.getClass("WInst");
|
||||
Record *BI = R.getClass("BInst");
|
||||
ClassMap[SI] = ClassS;
|
||||
ClassMap[II] = ClassI;
|
||||
ClassMap[WI] = ClassW;
|
||||
ClassMap[BI] = ClassB;
|
||||
}
|
||||
|
||||
// run - Emit arm_neon.h.inc
|
||||
|
Loading…
x
Reference in New Issue
Block a user