-
Notifications
You must be signed in to change notification settings - Fork 12.5k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[AArch64] Implement GCS ACLE intrinsics (#96903)
This adds intrinsics defined in ARM-software/acle#260 Doing this requires some changes to the GCS instruction definitions, as these intrinsics make use of how some instructions don't modify the input register when GCS is disabled, and they need to be correctly marked with mayLoad/mayStore/hasSideEffects for instruction selection to work.
- Loading branch information
1 parent
81cdf94
commit 3a14ffb
Showing
7 changed files
with
185 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,56 @@ | ||
// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --version 2 | ||
// RUN: %clang_cc1 -triple aarch64-eabi -target-feature +gcs -emit-llvm %s -o - | FileCheck %s | ||
|
||
#include <arm_acle.h> | ||
|
||
// CHECK-LABEL: define dso_local i64 @test_chkfeat | ||
// CHECK-SAME: () #[[ATTR0:[0-9]+]] { | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[__FEATURES_ADDR_I:%.*]] = alloca i64, align 8 | ||
// CHECK-NEXT: store i64 1, ptr [[__FEATURES_ADDR_I]], align 8 | ||
// CHECK-NEXT: [[TMP0:%.*]] = load i64, ptr [[__FEATURES_ADDR_I]], align 8 | ||
// CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.aarch64.chkfeat(i64 [[TMP0]]) | ||
// CHECK-NEXT: [[TMP2:%.*]] = load i64, ptr [[__FEATURES_ADDR_I]], align 8 | ||
// CHECK-NEXT: [[XOR_I:%.*]] = xor i64 [[TMP1]], [[TMP2]] | ||
// CHECK-NEXT: ret i64 [[XOR_I]] | ||
// | ||
uint64_t test_chkfeat() { | ||
return __chkfeat(_CHKFEAT_GCS); | ||
} | ||
|
||
// CHECK-LABEL: define dso_local ptr @test_gcspr | ||
// CHECK-SAME: () #[[ATTR0]] { | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[TMP0:%.*]] = call i64 @llvm.read_volatile_register.i64(metadata [[META2:![0-9]+]]) | ||
// CHECK-NEXT: [[TMP1:%.*]] = inttoptr i64 [[TMP0]] to ptr | ||
// CHECK-NEXT: ret ptr [[TMP1]] | ||
// | ||
void *test_gcspr() { | ||
return __gcspr(); | ||
} | ||
|
||
// CHECK-LABEL: define dso_local i64 @test_gcspopm | ||
// CHECK-SAME: () #[[ATTR0]] { | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[TMP0:%.*]] = call i64 @llvm.aarch64.gcspopm(i64 0) | ||
// CHECK-NEXT: ret i64 [[TMP0]] | ||
// | ||
uint64_t test_gcspopm() { | ||
return __gcspopm(); | ||
} | ||
|
||
// CHECK-LABEL: define dso_local ptr @test_gcsss | ||
// CHECK-SAME: (ptr noundef [[P:%.*]]) #[[ATTR0]] { | ||
// CHECK-NEXT: entry: | ||
// CHECK-NEXT: [[__STACK_ADDR_I:%.*]] = alloca ptr, align 8 | ||
// CHECK-NEXT: [[P_ADDR:%.*]] = alloca ptr, align 8 | ||
// CHECK-NEXT: store ptr [[P]], ptr [[P_ADDR]], align 8 | ||
// CHECK-NEXT: [[TMP0:%.*]] = load ptr, ptr [[P_ADDR]], align 8 | ||
// CHECK-NEXT: store ptr [[TMP0]], ptr [[__STACK_ADDR_I]], align 8 | ||
// CHECK-NEXT: [[TMP1:%.*]] = load ptr, ptr [[__STACK_ADDR_I]], align 8 | ||
// CHECK-NEXT: [[TMP2:%.*]] = call ptr @llvm.aarch64.gcsss(ptr [[TMP1]]) | ||
// CHECK-NEXT: ret ptr [[TMP2]] | ||
// | ||
const void *test_gcsss(const void *p) { | ||
return __gcsss(p); | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,54 @@ | ||
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py | ||
; RUN: llc -mtriple=aarch64 -mattr=+gcs -verify-machineinstrs -o - %s | FileCheck %s | ||
|
||
; We call each intrinsic twice, once with the result being unused and once with | ||
; it being used, to check that dead code elimination is being done correctly. | ||
; chkfeat does not have side effects so can be eliminated, but the others do and | ||
; can't be eliminated. | ||
|
||
define i64 @test_chkfeat(i64 %arg) { | ||
; CHECK-LABEL: test_chkfeat: | ||
; CHECK: // %bb.0: // %entry | ||
; CHECK-NEXT: mov x16, x0 | ||
; CHECK-NEXT: chkfeat x16 | ||
; CHECK-NEXT: mov x0, x16 | ||
; CHECK-NEXT: ret | ||
entry: | ||
%0 = call i64 @llvm.aarch64.chkfeat(i64 %arg) | ||
%1 = call i64 @llvm.aarch64.chkfeat(i64 %arg) | ||
ret i64 %1 | ||
} | ||
|
||
define i64 @test_gcspopm(i64 %arg) { | ||
; CHECK-LABEL: test_gcspopm: | ||
; CHECK: // %bb.0: // %entry | ||
; CHECK-NEXT: mov x8, x0 | ||
; CHECK-NEXT: gcspopm x8 | ||
; CHECK-NEXT: gcspopm x0 | ||
; CHECK-NEXT: ret | ||
entry: | ||
%0 = call i64 @llvm.aarch64.gcspopm(i64 %arg) | ||
%1 = call i64 @llvm.aarch64.gcspopm(i64 %arg) | ||
ret i64 %1 | ||
} | ||
|
||
define ptr @test_gcsss(ptr %p) { | ||
; CHECK-LABEL: test_gcsss: | ||
; CHECK: // %bb.0: // %entry | ||
; CHECK-NEXT: mov x9, xzr | ||
; CHECK-NEXT: gcsss1 x0 | ||
; CHECK-NEXT: mov x8, xzr | ||
; CHECK-NEXT: gcsss2 x9 | ||
; CHECK-NEXT: gcsss1 x0 | ||
; CHECK-NEXT: gcsss2 x8 | ||
; CHECK-NEXT: mov x0, x8 | ||
; CHECK-NEXT: ret | ||
entry: | ||
%0 = call ptr @llvm.aarch64.gcsss(ptr %p) | ||
%1 = call ptr @llvm.aarch64.gcsss(ptr %p) | ||
ret ptr %1 | ||
} | ||
|
||
declare i64 @llvm.aarch64.chkfeat(i64) | ||
declare i64 @llvm.aarch64.gcspopm(i64) | ||
declare ptr @llvm.aarch64.gcsss(ptr) |