llvm/llvm/test/Transforms/ArgumentPromotion/BPF/argpromotion.ll

; RUN: opt -passes=argpromotion -mtriple=bpf-pc-linux -S %s | FileCheck %s
; Source:
;  struct t {
;    int a, b, c, d, e, f, g;
;  };
;  __attribute__((noinline)) static int foo1(struct t *p1, struct t *p2, struct t *p3) {
;    return p1->a + p1->b + p2->c + p2->e + p3->f + p3->g;
;  }
;  __attribute__((noinline)) static int foo2(struct t *p1, struct t *p2, struct t *p3) {
;    return p1->a + p1->b + p2->c + p2->e + p3->f;
;  }
;  void init(void *);
;  int bar(void) {
;    struct t v1, v2, v3;
;    init(&v1); init(&v2); init(&v3);
;    return foo1(&v1, &v2, &v3) + foo2(&v1, &v2, &v3);
;  }
; Compilation flag:
;   clang -target bpf -O2 -S t.c -mllvm -print-before=argpromotion -mllvm -print-module-scope
;   and then do some manual tailoring to remove some attributes/metadata which is not used
;   by argpromotion pass.

%struct.t = type { i32, i32, i32, i32, i32, i32, i32 }

define i32 @bar() {
entry:
  %v1 = alloca %struct.t, align 4
  %v2 = alloca %struct.t, align 4
  %v3 = alloca %struct.t, align 4
  call void @init(ptr noundef nonnull %v1)
  call void @init(ptr noundef nonnull %v2)
  call void @init(ptr noundef nonnull %v3)
  %call = call fastcc i32 @foo1(ptr noundef nonnull %v1, ptr noundef nonnull %v2, ptr noundef nonnull %v3)
  %call1 = call fastcc i32 @foo2(ptr noundef nonnull %v1, ptr noundef nonnull %v2, ptr noundef nonnull %v3)
  %add = add nsw i32 %call, %call1
  ret i32 %add
}

declare void @init(ptr noundef)

define internal i32 @foo1(ptr nocapture noundef readonly %p1, ptr nocapture noundef readonly %p2, ptr nocapture noundef readonly %p3) {
entry:
  %0 = load i32, ptr %p1, align 4
  %b = getelementptr inbounds %struct.t, ptr %p1, i64 0, i32 1
  %1 = load i32, ptr %b, align 4
  %add = add nsw i32 %1, %0
  %c = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 2
  %2 = load i32, ptr %c, align 4
  %add1 = add nsw i32 %add, %2
  %e = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 4
  %3 = load i32, ptr %e, align 4
  %add2 = add nsw i32 %add1, %3
  %f = getelementptr inbounds %struct.t, ptr %p3, i64 0, i32 5
  %4 = load i32, ptr %f, align 4
  %add3 = add nsw i32 %add2, %4
  %g = getelementptr inbounds %struct.t, ptr %p3, i64 0, i32 6
  %5 = load i32, ptr %g, align 4
  %add4 = add nsw i32 %add3, %5
  ret i32 %add4
}

; Without number-of-argument constraint, argpromotion will create a function signature with 6 arguments. Since
; bpf target only supports maximum 5 arguments, so no argpromotion here.
;
; CHECK:  i32 @foo1(ptr nocapture noundef readonly %p1, ptr nocapture noundef readonly %p2, ptr nocapture noundef readonly %p3)

define internal i32 @foo2(ptr noundef %p1, ptr noundef %p2, ptr noundef %p3) {
entry:
  %0 = load i32, ptr %p1, align 4
  %b = getelementptr inbounds %struct.t, ptr %p1, i64 0, i32 1
  %1 = load i32, ptr %b, align 4
  %add = add nsw i32 %0, %1
  %c = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 2
  %2 = load i32, ptr %c, align 4
  %add1 = add nsw i32 %add, %2
  %e = getelementptr inbounds %struct.t, ptr %p2, i64 0, i32 4
  %3 = load i32, ptr %e, align 4
  %add2 = add nsw i32 %add1, %3
  %f = getelementptr inbounds %struct.t, ptr %p3, i64 0, i32 5
  %4 = load i32, ptr %f, align 4
  %add3 = add nsw i32 %add2, %4
  ret i32 %add3
}

; Without number-of-argument constraint, argpromotion will create a function signature with 5 arguments, which equals
; the maximum number of argument permitted by bpf backend, so argpromotion result code does work.
;
; CHECK:  i32 @foo2(i32 %p1.0.val, i32 %p1.4.val, i32 %p2.8.val, i32 %p2.16.val, i32 %p3.20.val)