From 1f59a32e297041099a68e56cbfb9ddb6fad287fa Mon Sep 17 00:00:00 2001 From: "Thing-han, Lim" <15379156+potsrevennil@users.noreply.github.com> Date: Mon, 18 Nov 2024 16:20:47 +0800 Subject: [PATCH] Benchmark in CI with -flto cflags enabled Signed-off-by: Thing-han, Lim <15379156+potsrevennil@users.noreply.github.com> --- .github/workflows/bench.yml | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/.github/workflows/bench.yml b/.github/workflows/bench.yml index 407bb4afd..42d457113 100644 --- a/.github/workflows/bench.yml +++ b/.github/workflows/bench.yml @@ -26,19 +26,19 @@ jobs: name: Arm Cortex-A72 (Raspberry Pi 4) benchmarks bench_pmu: PMU archflags: -mcpu=cortex-a72 -DSYS_AARCH64_SLOW_BARREL_SHIFTER - cflags: -DFORCE_AARCH64 + cflags: "-flto -DFORCE_AARCH64" bench_extra_args: "" - system: rpi5 name: Arm Cortex-A76 (Raspberry Pi 5) benchmarks bench_pmu: PERF archflags: "-mcpu=cortex-a76 -march=armv8.2-a" - cflags: -DFORCE_AARCH64 + cflags: "-flto -DFORCE_AARCH64" bench_extra_args: "" - system: a55 name: Arm Cortex-A55 (Snapdragon 888) benchmarks bench_pmu: PERF archflags: "-mcpu=cortex-a55 -march=armv8.2-a" - cflags: "-static -DFORCE_AARCH64 -DFIPS202_NATIVE_PROFILE=\"aarch64/profiles/cortex_a55.h\"" + cflags: "-flto -static -DFORCE_AARCH64 -DFIPS202_NATIVE_PROFILE=\"aarch64/profiles/cortex_a55.h\"" bench_extra_args: -w exec-on-a55 if: github.repository_owner == 'pq-code-package' && (github.event.label.name == 'benchmark' || github.ref == 'refs/heads/main') runs-on: self-hosted-${{ matrix.target.system }} @@ -71,43 +71,43 @@ jobs: ec2_instance_type: t4g.small ec2_ami: ubuntu-latest (aarch64) archflags: -mcpu=cortex-a76 -march=armv8.2-a - cflags: -DFORCE_AARCH64 + cflags: "-flto -DFORCE_AARCH64" perf: PERF - name: Graviton3 ec2_instance_type: c7g.medium ec2_ami: ubuntu-latest (aarch64) archflags: -march=armv8.4-a+sha3 - cflags: -DFORCE_AARCH64 + cflags: "-flto -DFORCE_AARCH64" perf: PERF - name: Graviton4 ec2_instance_type: c8g.medium ec2_ami: ubuntu-latest (aarch64) archflags: -march=armv9-a+sha3 - cflags: -DFORCE_AARCH64 + cflags: "-flto -DFORCE_AARCH64" perf: PERF - name: AMD EPYC 4th gen (c7a) ec2_instance_type: c7a.medium ec2_ami: ubuntu-latest (x86_64) archflags: -mavx2 -mbmi2 -mpopcnt -maes - cflags: -DFORCE_X86_64 + cflags: "-flto -DFORCE_X86_64" perf: PMU - name: Intel Xeon 4th gen (c7i) ec2_instance_type: c7i.large ec2_ami: ubuntu-latest (x86_64) archflags: -mavx2 -mbmi2 -mpopcnt -maes - cflags: -DFORCE_X86_64 + cflags: "-flto -DFORCE_X86_64" perf: PMU - name: AMD EPYC 3rd gen (c6a) ec2_instance_type: c7a.medium ec2_ami: ubuntu-latest (x86_64) archflags: -mavx2 -mbmi2 -mpopcnt -maes - cflags: -DFORCE_X86_64 + cflags: "-flto -DFORCE_X86_64" perf: PMU - name: Intel Xeon 3rd gen (c6i) ec2_instance_type: c7i.large ec2_ami: ubuntu-latest (x86_64) archflags: -mavx2 -mbmi2 -mpopcnt -maes - cflags: -DFORCE_X86_64 + cflags: "-flto -DFORCE_X86_64" perf: PMU uses: ./.github/workflows/bench_ec2_reusable.yml if: github.repository_owner == 'pq-code-package' && (github.event.label.name == 'benchmark' || github.ref == 'refs/heads/main')