/* Copyright (c) (2014-2016,2018-2020) Apple Inc. All rights reserved. * * corecrypto is licensed under Apple Inc.’s Internal Use License Agreement (which * is contained in the License.txt file distributed with corecrypto) and only to * people who accept that license. IMPORTANT: Any license rights granted to you by * Apple Inc. (if any) are limited to internal use within your organization only on * devices and computers you own or control, for the sole purpose of verifying the * security characteristics and correct functioning of the Apple Software. You may * not, directly or indirectly, redistribute the Apple Software or any portions thereof. */ #include #include #include "ccstats.h" static const int verbose=0; // Assume list has not been sorted void export_measurement_to_file(char *file_name,measurement_t *samples,size_t len){ #if CCN_OSX FILE *s_file; int err=0; #if defined(_WIN32) err = fopen_s(&s_file, file_name, "w"); #else s_file=fopen(file_name, "w"); #endif if(err==0 && s_file!=NULL){ for (size_t i=0; i 1.0e9) { struct units u = { .name = "G", .scale = 1.0e-9 }; return u; } if (duration > 1.0e6) { struct units u = { .name = "M", .scale = 1.0e-6 }; return u; } if (duration > 1.0e3) { struct units u = { .name = "K", .scale = 1.0e-3 }; return u; } if (duration > 1.0) { struct units u = { .name = " ", .scale = 1.0 }; return u; } if (duration > 1.0e-3) { struct units u = { .name = "m", .scale = 1.0e3 }; return u; } if (duration > 1.0e-6) { struct units u = { .name = "u", .scale = 1.0e6 }; return u; } if (duration > 1.0e-9) { struct units u = { .name = "n", .scale = 1.0e9 }; return u; } struct units u = { .name = "p", .scale = 1.0e12 }; return u; } /* Knuth attributes this method to B.P. Welford, Technometrics, 4,(1962), 419-420. While the method of computing, the number of observations n; the sum of the xi's; and the sum of the squares of the xi's, is correct in theory and will often work well enough, it is extremely vulnerable to the effects of roundoff error in computer floating point operations. It is possible to end up taking the square root of a negative number! The problem, together with a better solution, is described in Donald Knuth's "The Art of Computer Programming, Volume 2: Seminumerical Algorithms", section 4.2.2. The solution is to compute mean and standard deviation using a recurrence relation, like this: M(1) = x(1), M(k) = M(k-1) + (x(k) - M(k-1)) / k S(1) = 0, S(k) = S(k-1) + (x(k) - M(k-1)) * (x(k) - M(k)) for 2 <= k <= n, then sigma = sqrt(S(n) / (n - 1)) */ #if PRINT_IN_FILE #include #define STAT_FILENAME "corecrypto_test_stat_%.8x%.8x.csv" #endif void standard_deviation_init(struct standard_deviation *sd) { #if PRINT_IN_FILE char filename[strlen(STAT_FILENAME)+2*sizeof(uint64_t)]; sprintf(filename, STAT_FILENAME, (uint32_t)((uint64_t)sd>>32),(uint32_t)sd); sd->s_file=fopen(filename, "w"); #endif sd->M = 0; sd->S = 0.0; sd->k = 0; }; void standard_deviation_add_first(struct standard_deviation *sd, double x) { sd->M = x; sd->S = 0.0; sd->k = 1; }; #define CC_STAT_START_N 0 void standard_deviation_add(struct standard_deviation *sd, double x) { sd->k++; double M = sd->M; sd->M = M + ((x - M) / sd->k); sd->S += (x - M) * (x - sd->M); #if PRINT_IN_FILE fprintf(sd->s_file, "%d, %f\n", sd->k,x); #endif }; double standard_deviation_sigma(const struct standard_deviation *sd) { return sqrt(sd->S / (sd->k - 1)); }; /* Variance estimator */ CC_INLINE double s_square(const struct standard_deviation *sd) { return (sd->S / (sd->k - 1)); }; CC_INLINE int compare_measurements(const void *a, const void *b) { uint64_t x = ((const measurement_t *)a)->timing; uint64_t y = ((const measurement_t *)b)->timing; return x < y ? -1 : x == y ? 0 : 1; } static void rank_average_samples(measurement_t *samples,size_t len) { double rank_avg=1; size_t i=0,j; // Now rank the items while (iW) = P(Z>z) // Therefore we define W' and W'' such that // P(abs(sum_rank-mean)/variance) = P(Z>abs(z))=2P(Z>z) // Using external tool we can show that // abs(sum_rank-mean)>2variance => Probability of 0.0455 mean = (double)(len * (len + 1)) / 4; variance = sqrt((double)(len * len * (len + 1)) / 48); // If off the boundary, we reject the possibility of same distribution if (fabs(rank_sum-mean)>2*variance) { if (verbose) diag("Wilcoxon Rank Sum Test failed: Rank Sum %f, Mean %f, Ratio variance %f",rank_sum,mean,fabs(rank_sum-mean)/variance); return 1; } else if (verbose>1) { diag("Wilcoxon Rank Sum Test: Rank Sum %f, Mean %f, Ratio variance %f",rank_sum,mean,fabs(rank_sum-mean)/variance); } return 0; } static void compute_standard_deviation(measurement_t *samples,size_t len,uint32_t group, struct standard_deviation *X) { size_t i=0; standard_deviation_init(X); for (i=0;iM; unsigned int k=sd->k; sigma=standard_deviation_sigma(sd); // Reset input structure standard_deviation_init(sd); // P(Z>4)=1-0.5+0.49997=0.00003 (cf Z-score cumulative tables) for (i=0;i1) diag("Discard %d, group %d, Timing %llu, Mean %f, sigma %f",i, samples[i].group, samples[i].timing, mean, sigma); } } } return (k-sd->k); } #endif // T_TEST_DISCARD_OUTLIERS /* Independent two-sample t-test Null hypothesis is equal mean, assume equal variance. Works for normal disbributions mostly */ #define T_TEST_REJECT 4.5 // #define T_TEST_DISCARD_OUTLIERS int T_test_isRejected(measurement_t *samples,size_t len) { double t; struct standard_deviation X1; struct standard_deviation X2; // Statistics over the samples compute_standard_deviation(samples,len,0,&X1); compute_standard_deviation(samples,len,1,&X2); #ifdef T_TEST_DISCARD_OUTLIERS // Remove outliers { uint32_t k1=stat_discard_outliers(samples,len,0,&X1); uint32_t k2=stat_discard_outliers(samples,len,1,&X2); if ((k1>0 || k2>0) && (verbose>=1)) { if (verbose) diag("Discarded outliers: Group1 %d, Group2 %d, over %lu samples",k1,k2,len); } } #endif // Compute the t statistic t=(X1.M - X2.M) / (sqrt(s_square(&X1)/X1.k)+(s_square(&X2)/X2.k)); t=fabs(t); // Take absolute value // Check against critical value #if PRINT_IN_FILE fprintf(X1.s_file, "avg,, %f\n", X1.M); fprintf(X2.s_file, "avg,, %f\n", X2.M); fclose(X1.s_file); fclose(X2.s_file); #endif if (t>T_TEST_REJECT) { if (verbose) diag("T test failed: T %f, Avg1 %f Sigma1 %f, Avg2 %f Sigma2 %f",t, X1.M,standard_deviation_sigma(&X1), X2.M,standard_deviation_sigma(&X2)); return 1; } return 0; }