perf test coresight: Add unroll thread test tool
Add a test tool to be driven by further test scripts. This is a simple C-based test for arm64 that uses inline assembly to manually unroll a single instruction many times, producing a very long straight-line sequence of instructions. Reviewed-by: James Clark <james.clark@arm.com> Signed-off-by: Carsten Haitzler <carsten.haitzler@arm.com> Cc: Leo Yan <leo.yan@linaro.org> Cc: Mathieu Poirier <mathieu.poirier@linaro.org> Cc: Mike Leach <mike.leach@linaro.org> Cc: Suzuki Poulose <suzuki.poulose@arm.com> Cc: coresight@lists.linaro.org Link: https://lore.kernel.org/r/20220909152803.2317006-11-carsten.haitzler@foss.arm.com Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
This commit is contained in:
parent
74c62b8d61
commit
fc0a0ea039
|
@ -7,7 +7,8 @@ include ../../../../../tools/scripts/utilities.mak
|
|||
SUBDIRS = \
|
||||
asm_pure_loop \
|
||||
memcpy_thread \
|
||||
thread_loop
|
||||
thread_loop \
|
||||
unroll_loop_thread
|
||||
|
||||
all: $(SUBDIRS)
|
||||
$(SUBDIRS):
|
||||
|
|
|
@ -0,0 +1 @@
|
|||
unroll_loop_thread
|
|
@ -0,0 +1,33 @@
|
|||
# SPDX-License-Identifier: GPL-2.0
|
||||
# Carsten Haitzler <carsten.haitzler@arm.com>, 2021
|
||||
include ../Makefile.miniconfig
|
||||
|
||||
# Name of the test binary built in this directory
BIN = unroll_loop_thread
# Extra link flags/libraries for the binary - leave empty if none are needed
LIB = -pthread

.PHONY: all clean install-tests

all: $(BIN)

# Compile the tool; the recipe is only present for CORESIGHT builds on arm64
$(BIN): $(BIN).c
ifdef CORESIGHT
ifeq ($(ARCH),arm64)
	$(Q)$(CC) $< -o $@ $(LIB)
endif
endif

# Create the per-tool directory under the install tree and copy the binary
# into it; again only for CORESIGHT builds on arm64
install-tests: all
ifdef CORESIGHT
ifeq ($(ARCH),arm64)
	$(call QUIET_INSTALL, tests) \
		$(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$(INSTDIR_SUB)/$(BIN)'; \
		$(INSTALL) $(BIN) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$(INSTDIR_SUB)/$(BIN)/$(BIN)'
endif
endif

# Remove the built binary
clean:
	$(Q)$(RM) -f $(BIN)
|
|
@ -0,0 +1,74 @@
|
|||
// SPDX-License-Identifier: GPL-2.0
|
||||
// Carsten Haitzler <carsten.haitzler@arm.com>, 2021
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <unistd.h>
|
||||
#include <string.h>
|
||||
#include <pthread.h>
|
||||
|
||||
/*
 * Per-thread record kept by main():
 *   th  - handle of the thread started for this slot
 *   in  - starting value the thread feeds into its add sequence
 *   ret - slot that pthread_join() fills with the thread's return value
 */
struct args {
	pthread_t     th;
	unsigned int  in;
	void         *ret;
};
|
||||
|
||||
static void *thrfn(void *arg)
|
||||
{
|
||||
struct args *a = arg;
|
||||
unsigned int i, in = a->in;
|
||||
|
||||
for (i = 0; i < 10000; i++) {
|
||||
asm volatile (
|
||||
// force an unroll of thia add instruction so we can test long runs of code
|
||||
#define SNIP1 "add %[in], %[in], #1\n"
|
||||
// 10
|
||||
#define SNIP2 SNIP1 SNIP1 SNIP1 SNIP1 SNIP1 SNIP1 SNIP1 SNIP1 SNIP1 SNIP1
|
||||
// 100
|
||||
#define SNIP3 SNIP2 SNIP2 SNIP2 SNIP2 SNIP2 SNIP2 SNIP2 SNIP2 SNIP2 SNIP2
|
||||
// 1000
|
||||
#define SNIP4 SNIP3 SNIP3 SNIP3 SNIP3 SNIP3 SNIP3 SNIP3 SNIP3 SNIP3 SNIP3
|
||||
// 10000
|
||||
#define SNIP5 SNIP4 SNIP4 SNIP4 SNIP4 SNIP4 SNIP4 SNIP4 SNIP4 SNIP4 SNIP4
|
||||
// 100000
|
||||
SNIP5 SNIP5 SNIP5 SNIP5 SNIP5 SNIP5 SNIP5 SNIP5 SNIP5 SNIP5
|
||||
: /* out */
|
||||
: /* in */ [in] "r" (in)
|
||||
: /* clobber */
|
||||
);
|
||||
}
|
||||
}
|
||||
|
||||
/*
 * Start a new thread with default attributes running fn(arg).
 *
 * Returns the handle of the created thread.  If the thread cannot be
 * created, an error is printed to stderr and the process exits with
 * status 1, so callers never receive an uninitialised handle that they
 * would later pass to pthread_join().
 */
static pthread_t new_thr(void *(*fn) (void *arg), void *arg)
{
	pthread_t t;
	int err;

	/* A NULL attribute pointer requests the default thread attributes */
	err = pthread_create(&t, NULL, fn, arg);
	if (err != 0) {
		fprintf(stderr, "ERR: pthread_create: %s\n", strerror(err));
		exit(1);
	}

	return t;
}
|
||||
|
||||
int main(int argc, char **argv)
|
||||
{
|
||||
unsigned int i, thr;
|
||||
pthread_t threads[256];
|
||||
struct args args[256];
|
||||
|
||||
if (argc < 2) {
|
||||
printf("ERR: %s [numthreads]\n", argv[0]);
|
||||
exit(1);
|
||||
}
|
||||
|
||||
thr = atoi(argv[1]);
|
||||
if ((thr > 256) || (thr < 1)) {
|
||||
printf("ERR: threads 1-256\n");
|
||||
exit(1);
|
||||
}
|
||||
for (i = 0; i < thr; i++) {
|
||||
args[i].in = rand();
|
||||
args[i].th = new_thr(thrfn, &(args[i]));
|
||||
}
|
||||
for (i = 0; i < thr; i++)
|
||||
pthread_join(args[i].th, &(args[i].ret));
|
||||
return 0;
|
||||
}
|
Loading…
Reference in New Issue