/* * Copyright (C) 2011 Andrea Mazzoleni * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ #include "portable.h" #include "snapraid.h" #include "util.h" #include "raid/raid.h" #include "raid/cpu.h" #include "raid/internal.h" #include "raid/memory.h" #include "state.h" /* * Size of the blocks to test. */ #define TEST_SIZE (256 * KIBI) /* * Number of data blocks to test. */ #define TEST_COUNT (8) /** * Differential us of two timeval. */ static int64_t diffgettimeofday(struct timeval *start, struct timeval *stop) { int64_t d; d = 1000000LL * (stop->tv_sec - start->tv_sec); d += stop->tv_usec - start->tv_usec; return d; } /** * Start time measurement. */ #define SPEED_START \ count = 0; \ gettimeofday(&start, 0); \ do { \ for (i = 0; i < delta; ++i) /** * Stop time measurement. */ #define SPEED_STOP \ count += delta; \ gettimeofday(&stop, 0); \ } while (diffgettimeofday(&start, &stop) < period * 1000LL) ; \ ds = size * (int64_t)count * nd; \ dt = diffgettimeofday(&start, &stop); /** * Global variable used to propagate side effects. * * This is required to avoid optimizing compilers * to remove code without side effects. */ static unsigned side_effect; void speed(int period) { struct timeval start; struct timeval stop; int64_t ds; int64_t dt; int i, j; unsigned char digest[HASH_MAX]; unsigned char seed[HASH_MAX]; int id[RAID_PARITY_MAX]; int ip[RAID_PARITY_MAX]; int count; int delta = period >= 1000 ? 10 : 1; int size = TEST_SIZE; int nd = TEST_COUNT; int nv; void *v_alloc; void **v; nv = nd + RAID_PARITY_MAX + 1; v = malloc_nofail_vector_align(nd, nv, size, &v_alloc); /* initialize disks with fixed data */ for (i = 0; i < nd; ++i) memset(v[i], i, size); /* zero buffer */ memset(v[nd + RAID_PARITY_MAX], 0, size); raid_zero(v[nd + RAID_PARITY_MAX]); /* hash seed */ for (i = 0; i < HASH_MAX; ++i) seed[i] = i; /* basic disks and parity mapping */ for (i = 0; i < RAID_PARITY_MAX; ++i) { id[i] = i; ip[i] = i; } printf(PACKAGE " v" VERSION " by Andrea Mazzoleni, " PACKAGE_URL "\n"); #ifdef __GNUC__ printf("Compiler gcc " __VERSION__ "\n"); #endif #ifdef CONFIG_X86 { char vendor[CPU_VENDOR_MAX]; unsigned family; unsigned model; raid_cpu_info(vendor, &family, &model); printf("CPU %s, family %u, model %u, flags%s%s%s%s%s%s\n", vendor, family, model, raid_cpu_has_sse2() ? " sse2" : "", raid_cpu_has_ssse3() ? " ssse3" : "", raid_cpu_has_crc32() ? " crc32" : "", raid_cpu_has_avx2() ? " avx2" : "", raid_cpu_has_slowmult() ? " slowmult" : "", raid_cpu_has_slowextendedreg() ? " slowext" : "" ); } #else printf("CPU is not a x86/x64\n"); #endif #if WORDS_BIGENDIAN printf("Memory is big-endian %d-bit\n", (int)sizeof(void *) * 8); #else printf("Memory is little-endian %d-bit\n", (int)sizeof(void *) * 8); #endif #if HAVE_FUTIMENS printf("Support nanosecond timestamps with futimens()\n"); #elif HAVE_FUTIMES printf("Support nanosecond timestamps with futimes()\n"); #elif HAVE_FUTIMESAT printf("Support nanosecond timestamps with futimesat()\n"); #else printf("Does not support nanosecond timestamps\n"); #endif printf("\n"); printf("Speed test using %u data buffers of %u bytes, for a total of %u KiB.\n", nd, size, nd * size / KIBI); printf("Memory blocks have a displacement of %u bytes to improve cache performance.\n", RAID_MALLOC_DISPLACEMENT); printf("The reported values are the aggregate bandwidth of all data blocks in MB/s,\n"); printf("not counting parity blocks.\n"); printf("\n"); printf("Memory write speed using the C memset() function:\n"); printf("%8s", "memset"); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) memset(v[j], j, size); } SPEED_STOP printf("%8" PRIu64, ds / dt); printf("\n"); printf("\n"); /* crc table */ printf("CRC used to check the content file integrity:\n"); printf("%8s", "table"); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) side_effect += crc32c_gen(0, v[j], size); } SPEED_STOP printf("%8" PRIu64, ds / dt); printf("\n"); printf("%8s", "intel"); fflush(stdout); #if HAVE_SSE42 if (raid_cpu_has_crc32()) { SPEED_START { for (j = 0; j < nd; ++j) side_effect += crc32c_x86(0, v[j], size); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif printf("\n"); printf("\n"); /* hash table */ printf("Hash used to check the data blocks integrity:\n"); printf("%8s", ""); printf("%8s", "best"); printf("%8s", "murmur3"); printf("%8s", "spooky2"); printf("%8s", "metro"); printf("\n"); printf("%8s", "hash"); #ifdef CONFIG_X86 if (sizeof(void *) == 4 && !raid_cpu_has_slowmult()) printf("%8s", "murmur3"); else printf("%8s", "spooky2"); #else if (sizeof(void *) == 4) printf("%8s", "murmur3"); else printf("%8s", "spooky2"); #endif fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) memhash(HASH_MURMUR3, seed, digest, v[j], size); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) memhash(HASH_SPOOKY2, seed, digest, v[j], size); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) memhash(HASH_METRO, seed, digest, v[j], size); } SPEED_STOP printf("%8" PRIu64, ds / dt); printf("\n"); printf("\n"); /* RAID table */ printf("RAID functions used for computing the parity with 'sync':\n"); printf("%8s", ""); printf("%8s", "best"); printf("%8s", "int8"); printf("%8s", "int32"); printf("%8s", "int64"); #ifdef CONFIG_X86 printf("%8s", "sse2"); #ifdef CONFIG_X86_64 printf("%8s", "sse2e"); #endif printf("%8s", "ssse3"); #ifdef CONFIG_X86_64 printf("%8s", "ssse3e"); #endif printf("%8s", "avx2"); #ifdef CONFIG_X86_64 printf("%8s", "avx2e"); #endif #endif printf("\n"); /* GEN1 */ printf("%8s", "gen1"); printf("%8s", raid_gen1_tag()); fflush(stdout); printf("%8s", ""); SPEED_START { raid_gen1_int32(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); SPEED_START { raid_gen1_int64(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSE2 if (raid_cpu_has_sse2()) { SPEED_START { raid_gen1_sse2(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #ifdef CONFIG_X86_64 printf("%8s", ""); #endif printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_gen1_avx2(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif printf("\n"); /* GEN2 */ printf("%8s", "gen2"); printf("%8s", raid_gen2_tag()); fflush(stdout); printf("%8s", ""); SPEED_START { raid_gen2_int32(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); SPEED_START { raid_gen2_int64(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSE2 if (raid_cpu_has_sse2()) { SPEED_START { raid_gen2_sse2(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86_64 SPEED_START { raid_gen2_sse2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #endif } #endif printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_gen2_avx2(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif printf("\n"); /* GENz */ printf("%8s", "genz"); printf("%8s", raid_genz_tag()); fflush(stdout); printf("%8s", ""); SPEED_START { raid_genz_int32(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); SPEED_START { raid_genz_int64(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSE2 if (raid_cpu_has_sse2()) { SPEED_START { raid_genz_sse2(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86_64 SPEED_START { raid_genz_sse2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #endif } #endif printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif printf("%8s", ""); #ifdef CONFIG_X86_64 #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_genz_avx2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif #endif printf("\n"); /* GEN3 */ printf("%8s", "gen3"); printf("%8s", raid_gen3_tag()); fflush(stdout); SPEED_START { raid_gen3_int8(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); printf("%8s", ""); printf("%8s", ""); #ifdef CONFIG_X86 if (raid_cpu_has_sse2()) { printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif } #endif #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { raid_gen3_ssse3(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86_64 SPEED_START { raid_gen3_ssse3ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #endif } #endif printf("%8s", ""); #ifdef CONFIG_X86_64 #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_gen3_avx2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif #endif printf("\n"); /* GEN4 */ printf("%8s", "gen4"); printf("%8s", raid_gen4_tag()); fflush(stdout); SPEED_START { raid_gen4_int8(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); printf("%8s", ""); printf("%8s", ""); #ifdef CONFIG_X86 #ifdef CONFIG_SSE2 if (raid_cpu_has_sse2()) { printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif } #endif #endif #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { raid_gen4_ssse3(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86_64 SPEED_START { raid_gen4_ssse3ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #endif } #endif printf("%8s", ""); #ifdef CONFIG_X86_64 #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_gen4_avx2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif #endif printf("\n"); /* GEN5 */ printf("%8s", "gen5"); printf("%8s", raid_gen5_tag()); fflush(stdout); SPEED_START { raid_gen5_int8(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); printf("%8s", ""); printf("%8s", ""); #ifdef CONFIG_X86 #ifdef CONFIG_SSE2 if (raid_cpu_has_sse2()) { printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif } #endif #endif #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { raid_gen5_ssse3(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86_64 SPEED_START { raid_gen5_ssse3ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #endif } #endif printf("%8s", ""); #ifdef CONFIG_X86_64 #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_gen5_avx2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif #endif printf("\n"); /* GEN6 */ printf("%8s", "gen6"); printf("%8s", raid_gen6_tag()); fflush(stdout); SPEED_START { raid_gen6_int8(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); printf("%8s", ""); printf("%8s", ""); #ifdef CONFIG_X86 #ifdef CONFIG_SSE2 if (raid_cpu_has_sse2()) { printf("%8s", ""); #ifdef CONFIG_X86_64 printf("%8s", ""); #endif } #endif #endif #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { raid_gen6_ssse3(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86_64 SPEED_START { raid_gen6_ssse3ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #endif } #endif printf("%8s", ""); #ifdef CONFIG_X86_64 #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { raid_gen6_avx2ext(nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); } #endif #endif #endif printf("\n"); printf("\n"); /* recover table */ printf("RAID functions used for recovering with 'fix':\n"); printf("%8s", ""); printf("%8s", "best"); printf("%8s", "int8"); #ifdef CONFIG_X86 printf("%8s", "ssse3"); printf("%8s", "avx2"); #endif printf("\n"); printf("%8s", "rec1"); printf("%8s", raid_rec1_tag()); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) /* +1 to avoid GEN1 optimized case */ raid_rec1_int8(1, id, ip + 1, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { for (j = 0; j < nd; ++j) /* +1 to avoid GEN1 optimized case */ raid_rec1_ssse3(1, id, ip + 1, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { for (j = 0; j < nd; ++j) /* +1 to avoid GEN1 optimized case */ raid_rec1_avx2(1, id, ip + 1, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #endif printf("\n"); printf("%8s", "rec2"); printf("%8s", raid_rec2_tag()); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) /* +1 to avoid GEN2 optimized case */ raid_rec2_int8(2, id, ip + 1, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { for (j = 0; j < nd; ++j) /* +1 to avoid GEN2 optimized case */ raid_rec2_ssse3(2, id, ip + 1, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { for (j = 0; j < nd; ++j) /* +1 to avoid GEN1 optimized case */ raid_rec2_avx2(2, id, ip + 1, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #endif printf("\n"); printf("%8s", "rec3"); printf("%8s", raid_recX_tag()); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) raid_recX_int8(3, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_ssse3(3, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_avx2(3, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #endif printf("\n"); printf("%8s", "rec4"); printf("%8s", raid_recX_tag()); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) raid_recX_int8(4, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_ssse3(4, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_avx2(4, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #endif printf("\n"); printf("%8s", "rec5"); printf("%8s", raid_recX_tag()); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) raid_recX_int8(5, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_ssse3(5, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_avx2(5, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #endif printf("\n"); printf("%8s", "rec6"); printf("%8s", raid_recX_tag()); fflush(stdout); SPEED_START { for (j = 0; j < nd; ++j) raid_recX_int8(6, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); fflush(stdout); #ifdef CONFIG_X86 #ifdef CONFIG_SSSE3 if (raid_cpu_has_ssse3()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_ssse3(6, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #ifdef CONFIG_AVX2 if (raid_cpu_has_avx2()) { SPEED_START { for (j = 0; j < nd; ++j) raid_recX_avx2(6, id, ip, nd, size, v); } SPEED_STOP printf("%8" PRIu64, ds / dt); } #endif #endif printf("\n"); printf("\n"); printf("If the 'best' expectations are wrong, please report it in the SnapRAID forum\n\n"); free(v_alloc); free(v); }