88 lines
3.5 KiB
LLVM
88 lines
3.5 KiB
LLVM
; RUN: opt -passes=argpromotion -mtriple=bpf-pc-linux -S %s | FileCheck %s
|
|
; Source:
|
|
; struct t {
|
|
; int a, b, c, d, e, f, g;
|
|
; };
|
|
; __attribute__((noinline)) static int foo1(struct t *p1, struct t *p2, struct t *p3) {
|
|
; return p1->a + p1->b + p2->c + p2->e + p3->f + p3->g;
|
|
; }
|
|
; __attribute__((noinline)) static int foo2(struct t *p1, struct t *p2, struct t *p3) {
|
|
; return p1->a + p1->b + p2->c + p2->e + p3->f;
|
|
; }
|
|
; void init(void *);
|
|
; int bar(void) {
|
|
; struct t v1, v2, v3;
|
|
; init(&v1); init(&v2); init(&v3);
|
|
; return foo1(&v1, &v2, &v3) + foo2(&v1, &v2, &v3);
|
|
; }
|
|
; Compilation flag:
|
|
; clang -target bpf -O2 -S t.c -mllvm -print-before=argpromotion -mllvm -print-module-scope
|
|
; and then do some manual tailoring to remove some attributes/metadata which is not used
|
|
; by argpromotion pass.
|
|
|
|
%struct.t = type { i32, i32, i32, i32, i32, i32, i32 }
|
|
|
|
define i32 @bar() {
|
|
entry:
|
|
%v1 = alloca %struct.t, align 4
|
|
%v2 = alloca %struct.t, align 4
|
|
%v3 = alloca %struct.t, align 4
|
|
call void @init(ptr noundef nonnull %v1)
|
|
call void @init(ptr noundef nonnull %v2)
|
|
call void @init(ptr noundef nonnull %v3)
|
|
%call = call fastcc i32 @foo1(ptr noundef nonnull %v1, ptr noundef nonnull %v2, ptr noundef nonnull %v3)
|
|
%call1 = call fastcc i32 @foo2(ptr noundef nonnull %v1, ptr noundef nonnull %v2, ptr noundef nonnull %v3)
|
|
%add = add nsw i32 %call, %call1
|
|
ret i32 %add
|
|
}
|
|
|
|
declare void @init(ptr noundef)
|
|
|
|
define internal i32 @foo1(ptr nocapture noundef readonly %p1, ptr nocapture noundef readonly %p2, ptr nocapture noundef readonly %p3) {
|
|
entry:
|
|
%0 = load i32, ptr %p1, align 4
|
|
%b = getelementptr inbounds %struct.t, ptr %p1, i64 0, i32 1
|
|
%1 = load i32, ptr %b, align 4
|
|
%add = add nsw i32 %1, %0
|
|
%c = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 2
|
|
%2 = load i32, ptr %c, align 4
|
|
%add1 = add nsw i32 %add, %2
|
|
%e = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 4
|
|
%3 = load i32, ptr %e, align 4
|
|
%add2 = add nsw i32 %add1, %3
|
|
%f = getelementptr inbounds %struct.t, ptr %p3, i64 0, i32 5
|
|
%4 = load i32, ptr %f, align 4
|
|
%add3 = add nsw i32 %add2, %4
|
|
%g = getelementptr inbounds %struct.t, ptr %p3, i64 0, i32 6
|
|
%5 = load i32, ptr %g, align 4
|
|
%add4 = add nsw i32 %add3, %5
|
|
ret i32 %add4
|
|
}
|
|
|
|
; Without number-of-argument constraint, argpromotion will create a function signature with 6 arguments. Since
|
|
; bpf target only supports maximum 5 arguments, so no argpromotion here.
|
|
;
|
|
; CHECK: i32 @foo1(ptr nocapture noundef readonly %p1, ptr nocapture noundef readonly %p2, ptr nocapture noundef readonly %p3)
|
|
|
|
define internal i32 @foo2(ptr noundef %p1, ptr noundef %p2, ptr noundef %p3) {
|
|
entry:
|
|
%0 = load i32, ptr %p1, align 4
|
|
%b = getelementptr inbounds %struct.t, ptr %p1, i64 0, i32 1
|
|
%1 = load i32, ptr %b, align 4
|
|
%add = add nsw i32 %0, %1
|
|
%c = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 2
|
|
%2 = load i32, ptr %c, align 4
|
|
%add1 = add nsw i32 %add, %2
|
|
%e = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 4
|
|
%3 = load i32, ptr %e, align 4
|
|
%add2 = add nsw i32 %add1, %3
|
|
%f = getelementptr inbounds %struct.t, ptr %p3, i64 0, i32 5
|
|
%4 = load i32, ptr %f, align 4
|
|
%add3 = add nsw i32 %add2, %4
|
|
ret i32 %add3
|
|
}
|
|
|
|
; Without number-of-argument constraint, argpromotion will create a function signature with 5 arguments, which equals
|
|
; the maximum number of argument permitted by bpf backend, so argpromotion result code does work.
|
|
;
|
|
; CHECK: i32 @foo2(i32 %p1.0.val, i32 %p1.4.val, i32 %p2.8.val, i32 %p2.16.val, i32 %p3.20.val)
|