added SVE reg width output in main func

This commit is contained in:
JanLJL
2024-09-03 14:27:28 +02:00
parent 0a160a95b3
commit 19d3a27355
13 changed files with 144 additions and 52 deletions

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -15,7 +18,7 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsy, const
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[y*cur_elementsx+x] = 1.0234 * (
b[(y-1)*cur_elementsx+x] +
b[(y-1)*cur_elementsx+x] +
b[y*cur_elementsx+x-1] +
b[y*cur_elementsx+x+1] +
b[(y+1)*cur_elementsx+x]);
@@ -49,7 +52,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 2d-5pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -85,4 +92,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -16,31 +19,31 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsz, const
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x] = 1.0234 * (
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z+1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[ z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[ z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[ z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[ z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+ y*cur_elementsx+x+1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x-1] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x ] +
b[(z-1)*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x+1]);
}
}
@@ -76,7 +79,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 3d-27pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -115,4 +122,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -16,8 +19,8 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsz, const
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x] = 1.0234 * (
b[(z+1)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[(z+1)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x-1] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x+1] +
b[z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x] +
@@ -56,7 +59,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 3d-7pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -95,4 +102,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -18,8 +21,8 @@ void kernel(DTYPE* a, DTYPE* b, const int repeat, const int cur_elementsz, const
a[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x] = 1.0234 * (
b[(z+3)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[(z+1)*cur_elementsy*cur_elementsx+y*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-3)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-3)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+(y-1)*cur_elementsx+x] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x-1] +
b[z*cur_elementsy*cur_elementsx+y*cur_elementsx+x+1] +
b[z*cur_elementsy*cur_elementsx+(y+1)*cur_elementsx+x] +
@@ -60,7 +63,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: 3d-r3-11pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
DTYPE* b = malloc(maxproduct*sizeof(DTYPE));
@@ -99,4 +106,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: add\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -75,4 +82,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: copy\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -73,4 +80,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -15,7 +18,7 @@ void kernel(DTYPE* a, const int repeat, const int cur_elementsy, const int cur_e
for(int y=1; y<cur_elementsy-1; y++) {
for(int x=1; x<cur_elementsx-1; x++) {
a[y*cur_elementsx+x] = 1.0234 * (
a[(y-1)*cur_elementsx+x] +
a[(y-1)*cur_elementsx+x] +
a[y*cur_elementsx+x-1] +
a[y*cur_elementsx+x+1] +
a[(y+1)*cur_elementsx+x]);
@@ -48,7 +51,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: gs-2d-5pt\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxproduct*sizeof(DTYPE));
for(int i=0; i<maxproduct; i++) {
@@ -82,4 +89,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -40,7 +43,12 @@ int main(int argc, char *argv[]) {
}
printf("kernel: pi\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
likwid_markerInit();
@@ -68,4 +76,4 @@ int main(int argc, char *argv[]) {
likwid_markerClose();
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -39,7 +42,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: store\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
for(int i=0; i<maxelements; i++) {
@@ -72,4 +79,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: triad\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -77,4 +84,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -40,7 +43,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: sumreduction\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
for(int i=0; i<maxelements; i++) {
@@ -73,4 +80,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: triad\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -75,4 +82,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif

View File

@@ -2,6 +2,9 @@
#include <stdio.h>
#include <stdlib.h>
#include <likwid.h>
#ifdef __ARM_FEATURE_SVE
#include <sys/prctl.h>
#endif
#endif
#define DTYPE double
@@ -38,7 +41,11 @@ int main(int argc, char *argv[]) {
}
printf("kernel: update\n");
printf("elementsize: %lu\n", sizeof(DTYPE));
#ifdef __ARM_FEATURE_SVE
int vl_in_bytes = prctl(PR_SVE_GET_VL) & PR_SVE_VL_LEN_MASK;
printf("vector length: %d bits\n", vl_in_bytes*8);
#endif
//SETUP
DTYPE* a = malloc(maxelements*sizeof(DTYPE));
DTYPE* b = malloc(maxelements*sizeof(DTYPE));
@@ -75,4 +82,4 @@ int main(int argc, char *argv[]) {
free(a);
return 0;
}
#endif
#endif