Skip to content

Commit

Permalink
added SVE reg width output in main func
Browse files Browse the repository at this point in the history
JanLJL committed Sep 3, 2024
1 parent ef00b67 commit d4d98bd
Showing 13 changed files with 144 additions and 52 deletions.
13 changes: 10 additions & 3 deletions validation/kernels/2d-5pt.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -15,7 +18,7 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsy, const
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[y*cur_elementsx+x] = 1.0234 * (
b[(y-1)*cur_elementsx+x] +
b[(y-1)*cur_elementsx+x] +
b[y*cur_elementsx+x-1] +
b[y*cur_elementsx+x+1] +
b[(y+1)*cur_elementsx+x]);
@@ -49,7 +52,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 2d-5pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -85,4 +92,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
51 changes: 29 additions & 22 deletions validation/kernels/3d-27pt.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -16,31 +19,31 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsz, const
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x] = 1.0234 * (
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[ z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1]);
}
}
@@ -76,7 +79,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 3d-27pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -115,4 +122,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
15 changes: 11 additions & 4 deletions validation/kernels/3d-7pt.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -16,8 +19,8 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsz, const
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x] = 1.0234 * (
b[(z+1)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[(z+1)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x-1] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x+1] +
b[z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x] +
@@ -56,7 +59,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 3d-7pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -95,4 +102,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
15 changes: 11 additions & 4 deletions validation/kernels/3d-r3-11pt.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -18,8 +21,8 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsz, const
a[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x] = 1.0234 * (
b[(z+3)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[(z+1)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-3)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-3)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x-1] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x+1] +
b[z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x] +
@@ -60,7 +63,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 3d-r3-11pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -99,4 +106,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
11 changes: 9 additions & 2 deletions validation/kernels/add.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: add\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -75,4 +82,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
11 changes: 9 additions & 2 deletions validation/kernels/copy.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: copy\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -73,4 +80,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
13 changes: 10 additions & 3 deletions validation/kernels/gs-2d-5pt.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -15,7 +18,7 @@ void kernel(DTYPE* a, const int repeat, const int cur_elementsy, const int cur_e
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[y*cur_elementsx+x] = 1.0234 * (
a[(y-1)*cur_elementsx+x] +
a[(y-1)*cur_elementsx+x] +
a[y*cur_elementsx+x-1] +
a[y*cur_elementsx+x+1] +
a[(y+1)*cur_elementsx+x]);
@@ -48,7 +51,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: gs-2d-5pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
for(int i=0; i<maxproduct; i++) {
@@ -82,4 +89,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
12 changes: 10 additions & 2 deletions validation/kernels/pi.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -40,7 +43,12 @@ int main(int argc, char *argv[]) {
}
printf("kernel: pi\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif


//SETUP

likwid_markerInit();
@@ -68,4 +76,4 @@ int main(int argc, char *argv[]) {
likwid_markerClose();
return 0;
}
#endif
#endif
11 changes: 9 additions & 2 deletions validation/kernels/store.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -39,7 +42,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: store\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
for(int i=0; i<maxelements; i++) {
@@ -72,4 +79,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
11 changes: 9 additions & 2 deletions validation/kernels/striad.c
Original file line number Diff line number Diff line change
@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif

#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: triad\n");
printf("elementsize: %lu\n", sizeof(DTYPE));

#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif

//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -77,4 +84,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif
Loading

0 comments on commit d4d98bd

Please sign in to comment.