diff --git a/test/codegen/reference/sha256/avx2.json b/test/codegen/reference/sha256/avx2.json index 5a4f86f9..3f819c40 100644 --- a/test/codegen/reference/sha256/avx2.json +++ b/test/codegen/reference/sha256/avx2.json @@ -17,12 +17,12 @@ "exo_swap": "805f2a357a4709c9ad3c548d7c1225d2d630b453269190f1d6a66b765c22c5bf", "exo_symm": "3676ce1cbd96dbd378b277e26bea9514afa44dfad54e06e22d6434cf93c9b629", "exo_symv": "d84d487822d9839dd6caf34c77acc3461644facaa938a78648b3d78c1bbc48aa", - "exo_syr": "22b4c2eaa19929159563ddaf2b5d6b4e6ee0967d58e039689e3371f05792dc9a", + "exo_syr": "ec81e1b55e18367b5a941d2f4fbff18a303a432efca0752b8e540a11c2d2eb7f", "exo_syr2": "8bd9def6d6aba8be6a763a5970721c048b6e5a102c5fe1434fc740ef36636450", "exo_syrk": "1d751306796e0f091f6049dd28e48ec9fc7ecfd231a3a0072c96e8e7452a09ad", "exo_tbmv": "dc55c55ecc566cf14a3e59d28884dc900c5476f3294b5b1010f47a0c6fe2b170", "exo_tbsv": "b48649263f7dce7317c24470f7bf8c75d0cb26dbb40915d2745782976f931511", "exo_trmm": "42593a2611d0d2452c5287c81b3c636b146f035e87a77b6b30d549f94dc13d36", "exo_trmv": "e3c0bc8d5a0195df1b51a742d9a595bbdfb7e27930305896017672c7e58a2c7e", - "exo_trsv": "d2176f2046d149e9a92bc4955d8e1e1ff5c4861886f45e27e2cbb54c29eaefd9" + "exo_trsv": "b86fa2a87c49c58bdf9a905a43887b78d28a6be0318528dc0b7e9d031951bb8d" } diff --git a/test/graph.py b/test/graph.py index dda5e446..f32aef06 100644 --- a/test/graph.py +++ b/test/graph.py @@ -13,6 +13,7 @@ "syr": 3, "syr2": 3, "trmv": 2, + "trsv": 2, "gemv": 2, "gbmv": 2, "tbmv": 2, @@ -37,6 +38,7 @@ "tbmv", "sdsdot", "dsdot", + "trsv", } write_bound_kernels = { "copy", @@ -73,6 +75,7 @@ def mem_footprint(kernel_name, size, wordsize, **kwargs): "syr", "syr2", "trmv", + "trsv", "tbmv", "gemm", "syrk", @@ -116,6 +119,7 @@ def mem_ops(kernel_name, size, wordsize, **kwargs): "syr": 1, "syr2": 1, "trmv": 0.5, + "trsv": 0.5, "tbmv": 0.5, "symv": 1, }, diff --git a/test/level2/dtrsv/correctness.cpp b/test/level2/dtrsv/correctness.cpp index d2fb2130..dab81d6f 100644 --- a/test/level2/dtrsv/correctness.cpp +++ b/test/level2/dtrsv/correctness.cpp @@ -22,7 +22,7 @@ void test_dtrsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, // TODO: Figure out how to pass correct inputs for (int i = 0; i < N; ++i) { - for (int j = 0; j < N; ++j) A[i * lda + j] += 4; + for (int j = 0; j < N; ++j) A[i * lda + j] = 2.0; } for (int i = 0; i < X.size(); ++i) { X[i] = i; diff --git a/test/level2/strsv/correctness.cpp b/test/level2/strsv/correctness.cpp index b39ab600..6074a088 100644 --- a/test/level2/strsv/correctness.cpp +++ b/test/level2/strsv/correctness.cpp @@ -22,7 +22,7 @@ void test_strsv(const enum CBLAS_ORDER order, const enum CBLAS_UPLO Uplo, // TODO: Figure out how to pass correct inputs for (int i = 0; i < N; ++i) { - for (int j = 0; j < N; ++j) A[i * lda + j] += 4; + for (int j = 0; j < N; ++j) A[i * lda + j] = 2.0; } for (int i = 0; i < X.size(); ++i) { X[i] = i;