Context Navigation

Reverse Diff

perf.c [b4a4ad94:e131833c] in mainline

File:

: 1 edited

uspace/app/perf/perf.c (modified) (6 diffs)

Legend:

: Unmodified
: Added
: Removed

uspace/app/perf/perf.c

-              rb4a4ad94
+              re131833c
 /*
  * Copyright (c) 2018 Jiri Svoboda
- * Copyright (c) 2018 Vojtech Horky
  * All rights reserved.
+ *
 …
  */
-#include <assert.h>
-#include <math.h>
 #include <stdio.h>
 #include <stddef.h>
 #include <stdlib.h>
 #include <str.h>
-#include <time.h>
-#include <errno.h>
-#include <perf.h>
-#include <types/casting.h>
 #include "perf.h"
-#include "benchlist.h"
/*
 * Warm-up threshold: the workload size is doubled until a single run takes
 * longer than this many seconds.
 */
+#define MIN_DURATION_SECS 10
/* Number of measured runs performed once the workload size is fixed. */
+#define NUM_SAMPLES 10
/*
 * Capacity passed along with the error message buffer; the buffer itself is
 * allocated with one extra byte.
 */
+#define MAX_ERROR_STR_LENGTH 1024
+static void short_report(stopwatch_t *stopwatch, int run_index,
+    benchmark_t *bench, uint64_t workload_size)
+{
+        usec_t duration_usec = NSEC2USEC(stopwatch_get_nanos(stopwatch));
+        printf("Completed %" PRIu64 " operations in %llu us",
+            workload_size, duration_usec);
+        if (duration_usec > 0) {
+                double nanos = stopwatch_get_nanos(stopwatch);
+                double thruput = (double) workload_size / (nanos / 1000000000.0l);
+                printf(", %.0f ops/s.\n", thruput);
+        } else {
+                printf(".\n");
+        }
+}
/*
 * Estimate the square root of a value.
 *
 * This is a temporary solution until we have proper sqrt() implementation
 * in libmath.
 *
 * The algorithm uses Babylonian method [1], starting from an initial guess
 * of 1 and refining it until two consecutive estimates differ by no more
 * than the requested precision.
 *
 * @param value     Number whose square root is to be estimated.
 * @param precision Absolute difference between two consecutive estimates at
 *                  which the iteration stops.
 *
 * @return Estimate of the square root of value. Zero and negative values
 *         yield 0.0 (small negative values can appear when a variance is
 *         computed in floating point, and the iteration does not converge
 *         for them). NaN is returned unchanged.
 *
 * [1] https://en.wikipedia.org/wiki/Methods_of_computing_square_roots#Babylonian_method
 */
static double estimate_square_root(double value, double precision)
{
        /*
         * Safety net: bounds the loop when the requested precision cannot
         * be reached (e.g. a non-positive precision).
         */
        enum { MAX_ITERATIONS = 2048 };

        /* NaN is the only value that compares unequal to itself. */
        if (value != value) {
                return value;
        }

        /* The iteration below is only well-behaved for positive inputs. */
        if (value <= 0.0) {
                return 0.0;
        }

        double estimate = 1.;

        for (int i = 0; i < MAX_ITERATIONS; i++) {
                double prev_estimate = estimate;
                estimate = (prev_estimate + value / prev_estimate) / 2.;

                /* Absolute change, computed by hand to avoid needing fabs(). */
                double delta = estimate - prev_estimate;
                if (delta < 0.) {
                        delta = -delta;
                }

                if (!(delta > precision)) {
                        break;
                }
        }

        return estimate;
}
+/*
+ * Compute available statistics from given stopwatches.
+ *
+ * We compute normal mean for average duration of the workload and geometric
+ * mean for average thruput. Note that geometric mean is necessary to compute
+ * average throughput correctly - consider the following example:
+ *  - we run always 60 operations,
+ *  - first run executes in 30 s (i.e. 2 ops/s)
+ *  - and second one in 10 s (6 ops/s).
+ * Then, naively, average throughput would be (2+6)/2 = 4 [ops/s]. However, we
+ * actually executed 60 + 60 ops in 30 + 10 seconds. So the actual average
+ * throughput is 3 ops/s (which is exactly what geometric mean means).
+ *
+ */
+static void compute_stats(stopwatch_t *stopwatch, size_t stopwatch_count,
+    uint64_t workload_size, double precision, double *out_duration_avg,
+    double *out_duration_sigma, double *out_thruput_avg)
+{
+        double inv_thruput_sum = 0.0;
+        double nanos_sum = 0.0;
+        double nanos_sum2 = 0.0;
+        for (size_t i = 0; i < stopwatch_count; i++) {
+                double nanos = stopwatch_get_nanos(&stopwatch[i]);
+                double thruput = (double) workload_size / nanos;
+                inv_thruput_sum += 1.0 / thruput;
+                nanos_sum += nanos;
+                nanos_sum2 += nanos * nanos;
+        }
+        *out_duration_avg = nanos_sum / stopwatch_count;
+        double sigma2 = (nanos_sum2 - nanos_sum * (*out_duration_avg)) /
+            ((double) stopwatch_count - 1);
+        // FIXME: implement sqrt properly
+        *out_duration_sigma = estimate_square_root(sigma2, precision);
+        *out_thruput_avg = 1.0 / (inv_thruput_sum / stopwatch_count);
+}
+static void summary_stats(stopwatch_t *stopwatch, size_t stopwatch_count,
+    benchmark_t *bench, uint64_t workload_size)
+{
+        double duration_avg, duration_sigma, thruput_avg;
+        compute_stats(stopwatch, stopwatch_count, workload_size, 0.001,
+            &duration_avg, &duration_sigma, &thruput_avg);
+        printf("Average: %" PRIu64 " ops in %.0f us (sd %.0f us); "
+            "%.0f ops/s; Samples: %zu\n",
+            workload_size, duration_avg / 1000.0, duration_sigma / 1000.0,
+            thruput_avg * 1000000000.0, stopwatch_count);
+}
/*
 * Table of all available benchmarks.
 *
 * The entries are pulled in from the per-benchmark .def files. The table is
 * terminated by an all-NULL sentinel entry; code that walks the table stops
 * at the first entry whose name is NULL.
 */
+benchmark_t benchmarks[] = {
+#include "ipc/ns_ping.def"
+#include "ipc/ping_pong.def"
+#include "malloc/malloc1.def"
+#include "malloc/malloc2.def"
+        { NULL, NULL, NULL }
+};
 /*
  * Run a single benchmark and print its results.
  *
  * NOTE(review): the lines below come from a changeset view that interleaves
  * two revisions of this function. One revision calls bench->entry() without
  * arguments and treats the returned string as an error message (NULL means
  * success). The other revision works as follows:
  *  - the optional bench->setup hook is called first,
  *  - the workload size is doubled in a warm-up loop until a single run
  *    takes longer than MIN_DURATION_SECS,
  *  - NUM_SAMPLES runs are then measured, each reported by short_report(),
  *    and summarized by summary_stats(),
  *  - the optional bench->teardown hook runs on both the success and the
  *    error path, and any error message is printed from error_msg.
  * As a consequence, `ret` is declared twice and the braces do not balance;
  * the block is not compilable as shown and must be untangled before use.
  *
  * @param bench Benchmark to run.
  *
  * @return true if the benchmark completed, false on error.
  */
 static bool run_benchmark(benchmark_t *bench)
+{
+        printf("Warm up and determine workload size...\n");
+        /* Execute the benchmark */
+        const char *ret = bench->entry();
+        char *error_msg = malloc(MAX_ERROR_STR_LENGTH + 1);
+        if (error_msg == NULL) {
+                printf("Out of memory!\n");
+                return false;
+        }
+        str_cpy(error_msg, MAX_ERROR_STR_LENGTH, "");
+        bool ret = true;
+        if (bench->setup != NULL) {
+                ret = bench->setup(error_msg, MAX_ERROR_STR_LENGTH);
+                if (!ret) {
+                        goto leave_error;
+                }
+        if (ret == NULL) {
+                printf("\nBenchmark completed\n");
+                return true;
+        }
+        /*
+         * Find workload size that is big enough to last few seconds.
+         * We also check that uint64_t is big enough.
+         */
+        uint64_t workload_size = 0;
+        for (size_t bits = 0; bits <= 64; bits++) {
+                if (bits == 64) {
+                        str_cpy(error_msg, MAX_ERROR_STR_LENGTH, "Workload too small even for 1 << 63");
+                        goto leave_error;
+                }
+                workload_size = ((uint64_t) 1) << bits;
+                stopwatch_t stopwatch = STOPWATCH_INITIALIZE_STATIC;
+                bool ok = bench->entry(&stopwatch, workload_size,
+                    error_msg, MAX_ERROR_STR_LENGTH);
+                if (!ok) {
+                        goto leave_error;
+                }
+                short_report(&stopwatch, -1, bench, workload_size);
+                nsec_t duration = stopwatch_get_nanos(&stopwatch);
+                if (duration > SEC2NSEC(MIN_DURATION_SECS)) {
+                        break;
+                }
+        }
+        printf("Workload size set to %" PRIu64 ", measuring %d samples.\n", workload_size, NUM_SAMPLES);
+        stopwatch_t *stopwatch = calloc(NUM_SAMPLES, sizeof(stopwatch_t));
+        if (stopwatch == NULL) {
+                snprintf(error_msg, MAX_ERROR_STR_LENGTH, "failed allocating memory");
+                goto leave_error;
+        }
+        for (int i = 0; i < NUM_SAMPLES; i++) {
+                stopwatch_init(&stopwatch[i]);
+                bool ok = bench->entry(&stopwatch[i], workload_size,
+                    error_msg, MAX_ERROR_STR_LENGTH);
+                if (!ok) {
+                        free(stopwatch);
+                        goto leave_error;
+                }
+                short_report(&stopwatch[i], i, bench, workload_size);
+        }
+        summary_stats(stopwatch, NUM_SAMPLES, bench, workload_size);
+        printf("\nBenchmark completed\n");
+        free(stopwatch);
+        goto leave;
+leave_error:
+        printf("Error: %s\n", error_msg);
+        ret = false;
+leave:
+        if (bench->teardown != NULL) {
+                bool ok = bench->teardown(error_msg, MAX_ERROR_STR_LENGTH);
+                if (!ok) {
+                        printf("Error: %s\n", error_msg);
+                        ret = false;
+                }
+        }
+        free(error_msg);
+        return ret;
         /* NOTE(review): not reachable, the function has already returned above. */
+        printf("\n%s\n", ret);
+        return false;
+}
 static int run_benchmarks(void)
+{
+        unsigned int count_ok = 0;
+        unsigned int count_fail = 0;
+        benchmark_t *bench;
+        unsigned int i = 0;
+        unsigned int n = 0;
         char *failed_names = NULL;
 …
         printf("\n*** Running all benchmarks ***\n\n");
         for (size_t it = 0; it < benchmark_count; it++) {
                 printf("%s (%s)\n", benchmarks[it]->name, benchmarks[it]->desc);
                 if (run_benchmark(benchmarks[it])) {
                         count_ok++;
+        for (bench = benchmarks; bench->name != NULL; bench++) {
+                printf("%s (%s)\n", bench->name, bench->desc);
+                if (run_benchmark(bench)) {
+                        i++;
                         continue;
+                }
                 if (!failed_names) {
                         failed_names = str_dup(benchmarks[it]->name);
+                        failed_names = str_dup(bench->name);
                 } else {
                         char *f = NULL;
                         asprintf(&f, "%s, %s", failed_names, benchmarks[it]->name);
+                        asprintf(&f, "%s, %s", failed_names, bench->name);
                         if (!f) {
                                 printf("Out of memory.\n");
 …
                         failed_names = f;
+                }
                 count_fail++;
+                n++;
+        }
+        printf("\nCompleted, %u benchmarks run, %u succeeded.\n",
+            count_ok + count_fail, count_ok);
+        printf("\nCompleted, %u benchmarks run, %u succeeded.\n", i + n, i);
         if (failed_names)
                 printf("Failed benchmarks: %s\n", failed_names);
         return count_fail;
+        return n;
+}
 …
+{
         size_t len = 0;
         for (size_t i = 0; i < benchmark_count; i++) {
                 size_t len_now = str_length(benchmarks[i]->name);
                 if (len_now > len)
                         len = len_now;
+        benchmark_t *bench;
+        for (bench = benchmarks; bench->name != NULL; bench++) {
+                if (str_length(bench->name) > len)
+                        len = str_length(bench->name);
+        }
+        assert(can_cast_size_t_to_int(len) && "benchmark name length overflow");
+        unsigned int _len = (unsigned int) len;
+        if ((_len != len) || (((int) _len) < 0)) {
+                printf("Command length overflow\n");
+                return;
+        }
         for (size_t i = 0; i < benchmark_count; i++)
                 printf("%-*s %s\n", (int) len, benchmarks[i]->name, benchmarks[i]->desc);
+        for (bench = benchmarks; bench->name != NULL; bench++)
+                printf("%-*s %s\n", _len, bench->name, bench->desc);
         printf("%-*s Run all benchmarks\n", (int) len, "*");
+        printf("%-*s Run all benchmarks\n", _len, "*");
+}
 …
+        }
+        for (size_t i = 0; i < benchmark_count; i++) {
+                if (str_cmp(argv[1], benchmarks[i]->name) == 0) {
+                        return (run_benchmark(benchmarks[i]) ? 0 : -1);
+        benchmark_t *bench;
+        for (bench = benchmarks; bench->name != NULL; bench++) {
+                if (str_cmp(argv[1], bench->name) == 0) {
+                        return (run_benchmark(bench) ? 0 : -1);
+                }
+        }

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changes in uspace/app/perf/perf.c [b4a4ad94:e131833c] in mainline

Legend:

uspace/app/perf/perf.c

Download in other formats: