/*
 *	UCW Library -- Testing the Sorter
 *
 *	(c) 2007 Martin Mares
 *
 *	This software may be freely distributed and used according to the terms
 *	of the GNU Lesser General Public License.
 */

/*
 * NOTE(review): this copy of the file looks damaged. Every stretch of text
 * that would have started with '<' and ended with a later '>' seems to be
 * missing: the #include targets, most loop conditions of the form "i<N"
 * together with whatever followed them, and the placeholders in the usage
 * message. The code tokens below are kept exactly as found; each spot that
 * looks truncated carries its own NOTE(review). Restore the file from a
 * pristine copy before trying to build it.
 */

/* NOTE(review): all fifteen #include directives below have lost their header names. */
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include

/*** A hack for overriding radix-sorter configuration ***/

/* When FORCE_RADIX_BITS is defined, it replaces CONFIG_UCW_RADIX_SORTER_BITS. */
#ifdef FORCE_RADIX_BITS
#undef CONFIG_UCW_RADIX_SORTER_BITS
#define CONFIG_UCW_RADIX_SORTER_BITS FORCE_RADIX_BITS
#endif

/*** Time measurement ***/

/* Timer shared by start() and stop(). */
static timestamp_t timer;
/* Identifier printed by stop(); the code that assigns it is not visible in this copy. */
static uint test_id;

/* Begin a measurement: call sync(), then initialise the shared timer. */
static void start(void)
{
  sync();
  init_timer(&timer);
}

/*
 * End a measurement: call sync() again and log test_id together with
 * get_timer(&timer) / 1000. (presumably milliseconds converted to seconds,
 * given the "s" suffix in the message -- confirm against the timer API).
 * NOTE(review): test_id is a uint but is printed with %d.
 */
static void stop(void)
{
  sync();
  msg(L_INFO, "Test %d took %.3fs", test_id, get_timer(&timer) / 1000.);
}

/*** Simple 4-byte integer keys ***/

struct key1 {
  u32 x;
};

/*
 * Settings for the s1_ instance; presumably consumed by the header named in
 * the #include below. SORT_INT yields the x field of a key.
 * NOTE(review): the #include target is missing.
 */
#define SORT_KEY_REGULAR struct key1
#define SORT_PREFIX(x) s1_##x
#define SORT_INPUT_FB
#define SORT_OUTPUT_FB
#define SORT_UNIQUE
#define SORT_INT(k) (k).x
#define SORT_DELETE_INPUT 0
#include

/*
 * Integer-key test.
 *   mode -- index into the label table { increasing, decreasing, random }
 *   size -- requested data size; N is nextprime(MIN(size/4, 0xffff0000)),
 *           or 0 when size is 0
 * K is N/4*3 in integer arithmetic; its use is not visible in this copy.
 */
static void test_int(int mode, u64 size)
{
  uint N = size ? nextprime(MIN(size/4, 0xffff0000)) : 0;
  uint K = N/4*3;
  msg(L_INFO, ">>> Integers (%s, N=%u)", ((char *[]) { "increasing", "decreasing", "random" })[mode], N);
  struct fastbuf *f = bopen_tmp(65536);
  /*
   * NOTE(review): text is missing from here on. The loop header, the rest of
   * test_int, the declaration of struct key2 and the start of the function
   * that sums the cnt fields appear to have been lost; what follows is the
   * tail of that later function, which writes k[0] as one struct key2.
   */
  for (uint i=0; icnt += k[i]->cnt;
  bwrite(f, k[0], sizeof(struct key2));
}

/*
 * Settings for the s2_ instance (keys of type struct key2, integer key x).
 * NOTE(review): the #include target is missing.
 */
#define SORT_KEY_REGULAR struct key2
#define SORT_PREFIX(x) s2_##x
#define SORT_INPUT_FB
#define SORT_OUTPUT_FB
#define SORT_UNIFY
#define SORT_INT(k) (k).x
#include

/*
 * Counted-integer test.
 *   mode -- index into the label table { increasing, decreasing, random }
 *   size -- requested data size; items = size / sizeof(struct key2)
 * mult starts at 2 and grows until items/(2*mult) no longer exceeds
 * 0xffff0000; N is nextprime(items/(2*mult)), or 0 when items is 0.
 */
static void test_counted(int mode, u64 size)
{
  u64 items = size / sizeof(struct key2);
  uint mult = 2;
  while (items/(2*mult) > 0xffff0000)
    mult++;
  uint N = items ? nextprime(items/(2*mult)) : 0;
  uint K = N/4*3;
  msg(L_INFO, ">>> Counted integers (%s, N=%u, mult=%u)", ((char *[]) { "increasing", "decreasing", "random" })[mode], N, mult);
  struct fastbuf *f = bopen_tmp(65536);
  /*
   * NOTE(review): text is missing from here on. The rest of test_counted,
   * the declaration of struct key3 and the start of a comparison function
   * appear to have been lost; what follows is the tail of that comparison,
   * which goes through hash[0..3] with COMPARE (a macro defined elsewhere)
   * and returns 0 when it falls through.
   */
  for (uint m=0; mhash[0], y->hash[0]);
  COMPARE(x->hash[1], y->hash[1]);
  COMPARE(x->hash[2], y->hash[2]);
  COMPARE(x->hash[3], y->hash[3]);
  return 0;
}

/* Hash of a key3 as used by the s3_ instance: simply the first hash word. */
static inline uint s3_hash(struct key3 *x)
{
  return x->hash[0];
}

/*
 * Settings for the s3_ instance (keys of type struct key3, 32 hash bits).
 * NOTE(review): the #include target is missing.
 */
#define SORT_KEY_REGULAR struct key3
#define SORT_PREFIX(x) s3_##x
#define SORT_INPUT_FB
#define SORT_OUTPUT_FB
#define SORT_HASH_BITS 32
#include

/*
 * Fill key *k for index i.
 * The index is stored in k->i and the payload words are 7*i+13, 13*i+19 and
 * 19*i+7. The hash depends on mode:
 *   0       -- hash[0] = i,  hash[1..3] = payload[0..2]
 *   1       -- hash[0] = ~i, hash[1..3] = payload[0..2]
 *   other   -- md5_hash_buffer() is called with k->hash, k->i and length 4
 *              (presumably destination, source, source length -- confirm)
 */
static void gen_hash_key(int mode, struct key3 *k, uint i)
{
  k->i = i;
  k->payload[0] = 7*i + 13;
  k->payload[1] = 13*i + 19;
  k->payload[2] = 19*i + 7;
  switch (mode)
    {
    case 0:
      k->hash[0] = i;
      k->hash[1] = k->payload[0];
      k->hash[2] = k->payload[1];
      k->hash[3] = k->payload[2];
      break;
    case 1:
      k->hash[0] = ~i;
      k->hash[1] = k->payload[0];
      k->hash[2] = k->payload[1];
      k->hash[3] = k->payload[2];
      break;
    default: ;
      md5_hash_buffer((byte *) &k->hash, (byte *) &k->i, 4);
      break;
    }
}

/*
 * Hash-key test.
 *   mode -- index into the label table { increasing, decreasing, random }
 *   size -- requested data size; N = MIN(size / sizeof(struct key3), 0xffffffff)
 */
static void test_hashes(int mode, u64 size)
{
  uint N = MIN(size / sizeof(struct key3), 0xffffffff);
  msg(L_INFO, ">>> Hashes (%s, N=%u)", ((char *[]) { "increasing", "decreasing", "random" })[mode], N);
  struct key3 k, lastk;
  struct fastbuf *f = bopen_tmp(65536);
  uint hash_sum = 0;
  /*
   * NOTE(review): text is missing from here on. The rest of test_hashes, the
   * declarations of KEY4_MAX and struct key4 and the start of a string
   * comparison (presumably the s4_compare referenced further down) appear to
   * have been lost. What follows is its tail: memcmp over l bytes of the two
   * keys, then COMPARE on the lengths, returning 0 when it falls through.
   */
  for (uint i=0; ilen, y->len);
  int c = memcmp(x->s, y->s, l);
  if (c)
    return c;
  COMPARE(x->len, y->len);
  return 0;
}

/*
 * Read one key4 from f: a length word via bgetl(), then that many bytes
 * into x->s. Returns 0 when the length word is 0xffffffff (presumably the
 * end-of-input value of bgetl -- confirm), otherwise 1. The length must be
 * below KEY4_MAX.
 */
static inline int s4_read_key(struct fastbuf *f, struct key4 *x)
{
  x->len = bgetl(f);
  if (x->len == 0xffffffff)
    return 0;
  ASSERT(x->len < KEY4_MAX);
  breadb(f, x->s, x->len);
  return 1;
}

/* Write one key4 to f in the layout s4_read_key() reads: length word, then the bytes. */
static inline void s4_write_key(struct fastbuf *f, struct key4 *x)
{
  ASSERT(x->len < KEY4_MAX);
  bputl(f, x->len);
  bwrite(f, x->s, x->len);
}

/*
 * Settings for the s4_ instance (variable-size struct key4 keys).
 * SORT_KEY_SIZE is the struct size without the full s[] array plus the
 * actual length.
 * NOTE(review): the #include target is missing.
 */
#define SORT_KEY struct key4
#define SORT_PREFIX(x) s4_##x
#define SORT_KEY_SIZE(x) (sizeof(struct key4) - KEY4_MAX + (x).len)
#define SORT_INPUT_FB
#define SORT_OUTPUT_FB
#include

/* The s4b_ instance reuses the s4_ compare/read/write functions. */
#define s4b_compare s4_compare
#define s4b_read_key s4_read_key
#define s4b_write_key s4_write_key

/* Size of the data attached to a key4: 0 for an empty key, otherwise the first key byte XOR 0xad. */
static inline uint s4_data_size(struct key4 *x)
{
  return x->len ? (x->s[0] ^ 0xad) : 0;
}

/*
 * Settings for the s4b_ instance: same keys as s4_, plus attached data whose
 * size is given by s4_data_size().
 * NOTE(review): the #include target is missing.
 */
#define SORT_KEY struct key4
#define SORT_PREFIX(x) s4b_##x
#define SORT_KEY_SIZE(x) (sizeof(struct key4) - KEY4_MAX + (x).len)
#define SORT_DATA_SIZE(x) s4_data_size(&(x))
#define SORT_INPUT_FB
#define SORT_OUTPUT_FB
#include

/*
 * Generate a random key4: the length comes from random_max(KEY4_MAX) and
 * the bytes from random().
 * NOTE(review): the loop condition is damaged ("ilen"); it presumably
 * compared i against k->len.
 */
static void gen_key4(struct key4 *k)
{
  k->len = random_max(KEY4_MAX);
  for (uint i=0; ilen; i++)
    k->s[i] = random();
}

/*
 * Fill buf with len bytes derived from the seed h: each byte is h >> 24
 * stored into a byte, after which h advances to h*259309 + 17.
 */
static void gen_data4(byte *buf, uint len, uint h)
{
  while (len--)
    {
      *buf++ = h >> 24;
      h = h*259309 + 17;
    }
}

/*
 * String test.
 *   mode -- non-zero selects the "with data" variant, which also adds 128
 *           to the assumed average item size
 *   size -- requested data size; N = MIN(size / avg_item_size, 0xffffffff)
 * The random generator is seeded with 1 before any keys are generated.
 */
static void test_strings(uint mode, u64 size)
{
  uint avg_item_size = KEY4_MAX/2 + 4 + (mode ? 128 : 0);
  uint N = MIN(size / avg_item_size, 0xffffffff);
  msg(L_INFO, ">>> Strings %s(N=%u)", (mode ? "with data " : ""), N);
  random_set_seed(1);
  struct key4 k, lastk;
  byte buf[256], buf2[256];
  uint sum = 0;
  struct fastbuf *f = bopen_tmp(65536);
  /*
   * NOTE(review): text is missing from here on. The rest of test_strings,
   * the declarations of struct key5, struct s5_pair and the s5_* state
   * variables, and the start of a pair generator (presumably the s5_gen
   * called from test_graph) appear to have been lost. What follows is its
   * tail: the ">= s5_N" test is presumably on s5_j; inside it the function
   * returns 0 when s5_N is 0 or s5_i has reached s5_N-1, and otherwise
   * resets s5_j and advances s5_i. It then stores
   *   x = (s5_j * s5_K) % s5_N,  y = ((s5_i + s5_j) * s5_L) % s5_N
   * (computed in 64 bits), increments s5_j and returns 1.
   */
  for (uint i=0; i= s5_N)
    {
      if (!s5_N || s5_i >= s5_N-1)
        return 0;
      s5_j = 0;
      s5_i++;
    }
  p->x = ((u64)s5_j * s5_K) % s5_N;
  p->y = ((u64)(s5_i + s5_j) * s5_L) % s5_N;
  s5_j++;
  return 1;
}

/*
 * Settings for the s5m_ array sorter over u32 values; s5m_sort() is used
 * below.
 * NOTE(review): the #include target is missing.
 */
#define ASORT_PREFIX(x) s5m_##x
#define ASORT_KEY_TYPE u32
#include

/*
 * Merge n keys into one record in f. The workspace buf is used as a u32
 * array a; m accumulates the cnt fields of all keys. After the loop, the m
 * values in a are sorted with s5m_sort(), keys[0]->cnt is set to m, and
 * keys[0] followed by 4*m bytes of a is written to f.
 * NOTE(review): the loop header and the first statement of its body are
 * damaged, so how data[] is copied into a is not visible here.
 */
static void s5_write_merged(struct fastbuf *f, struct key5 **keys, void **data, uint n, void *buf)
{
  u32 *a = buf;
  uint m = 0;
  for (uint i=0; icnt);
      m += keys[i]->cnt;
    }
  s5m_sort(a, m);
  keys[0]->cnt = m;
  bwrite(f, keys[0], sizeof(struct key5));
  bwrite(f, a, 4*m);
}

/*
 * Merge n keys whose data live in the fastbufs data[] and write the result
 * to dest. A header { x = keys[0]->x, cnt = m } is written first; the
 * visible part of the loop then refills k[b] from data[b] with bgetl(), or
 * sets it to ~0U.
 * NOTE(review): both the accumulation loop and the selection loop are
 * damaged, so how m is computed and how b is chosen is not visible here.
 */
static void s5_copy_merged(struct key5 **keys, struct fastbuf **data, uint n, struct fastbuf *dest)
{
  u32 k[n];
  uint m = 0;
  for (uint i=0; icnt;
    }
  struct key5 key = { .x = keys[0]->x, .cnt = m };
  bwrite(dest, &key, sizeof(key));
  while (key.cnt--)
    {
      uint b = 0;
      for (uint i=1; icnt)
        k[b] = bgetl(data[b]);
      else
        k[b] = ~0U;
    }
}

/*
 * Ordering for s5_pair values: first by x, then by y, using COMPARE_LT
 * (a macro defined elsewhere, presumably returning from the function once
 * the two values differ). Returns 0 when it falls through.
 */
static inline int s5p_lt(struct s5_pair x, struct s5_pair y)
{
  COMPARE_LT(x.x, y.x);
  COMPARE_LT(x.y, y.y);
  return 0;
}

/*
 * Settings for the s5p_ array sorter over struct s5_pair, ordered by
 * s5p_lt().
 * NOTE(review): the #include target is missing.
 */
#define ASORT_PREFIX(x) s5p_##x
#define ASORT_KEY_TYPE struct s5_pair
#define ASORT_LT(x,y) s5p_lt(x,y)
#include

/*
 * Custom presorter. buf is treated as an array of struct s5_pair with room
 * for max = MIN(bufsize/sizeof(struct s5_pair), 0xffffffff) entries.
 * NOTE(review): the function is cut off inside the while condition; the
 * rest of its body, the settings of the s5_ instance and its #include appear
 * to have been lost, so the directives that follow are seen mid-function.
 */
static int s5_presort(struct fastbuf *dest, void *buf, size_t bufsize)
{
  uint max = MIN(bufsize/sizeof(struct s5_pair), 0xffffffff);
  struct s5_pair *a = buf;
  uint n = 0;
  while (n

/*
 * Settings for the s5b_ instance (struct key5 keys, 4 bytes of data per
 * counted item), reusing the s5_ merge callbacks.
 * NOTE(review): the #include target is missing.
 */
#define SORT_KEY_REGULAR struct key5
#define SORT_PREFIX(x) s5b_##x
#define SORT_DATA_SIZE(k) (4*(k).cnt)
#define SORT_UNIFY
#define SORT_UNIFY_WORKSPACE(k) SORT_DATA_SIZE(k)
#define SORT_INPUT_FB
#define SORT_OUTPUT_THIS_FB
#define SORT_INT(k) (k).x
#define s5b_write_merged s5_write_merged
#define s5b_copy_merged s5_copy_merged
#include

/*
 * Graph test.
 *   mode -- non-zero: pairs are generated into a temporary fastbuf and
 *           sorted with s5b_sort(); zero: s5_sort() is called with a NULL
 *           input (the log line calls this "with custom presorting")
 *   size -- requested data size; N starts at 3 and is replaced by
 *           nextprime(N) while N*(N+2)*4 < size, and is 0 when size is 0
 * The output fastbuf gets the marker 0xfeedcafe written before sorting; the
 * sorter must return that same fastbuf, and the marker is checked on read.
 */
static void test_graph(uint mode, u64 size)
{
  uint N = 3;
  while ((u64)N*(N+2)*4 < size)
    N = nextprime(N);
  if (!size)
    N = 0;
  msg(L_INFO, ">>> Graph%s (N=%u)", (mode ? "" : " with custom presorting"), N);
  /* Reset the generator state. */
  s5_N = N;
  s5_K = N/4*3;
  s5_L = N/3*2;
  s5_i = s5_j = 0;

  struct fastbuf *in = NULL;
  if (mode)
    {
      /* Each generated pair becomes a key5 { x, cnt = 1 } followed by y as its single data word. */
      struct s5_pair p;
      in = bopen_tmp(65536);
      while (s5_gen(&p))
        {
          struct key5 k = { .x = p.x, .cnt = 1 };
          bwrite(in, &k, sizeof(k));
          bputl(in, p.y);
        }
      brewind(in);
    }

  start();
  struct fastbuf *f = bopen_tmp(65536);
  bputl(f, 0xfeedcafe);
  struct fastbuf *g = (mode ? s5b_sort(in, f, s5_N-1) : s5_sort(NULL, f, s5_N-1));
  ASSERT(f == g);
  stop();

  SORT_XTRACE(2, "Verifying");
  uint c = bgetl(f);
  ASSERT(c == 0xfeedcafe);
  /*
   * NOTE(review): text is missing from here on. The verification loop, the
   * end of test_graph, and the key type, settings and #include of the
   * 64-bit instance appear to have been lost; the header of test_int64
   * follows directly.
   *
   * test_int64: mode indexes the label table { increasing, decreasing,
   * random }; N is nextprime(MIN(size/8, 0xffff0000)), or 0 when size is 0;
   * K is N/4*3.
   * NOTE(review): N is a u64 printed with %llu but cast to (long long).
   */
  for (uint i=0; i static void test_int64(int mode, u64 size)
{
  u64 N = size ? nextprime(MIN(size/8, 0xffff0000)) : 0;
  u64 K = N/4*3;
  msg(L_INFO, ">>> 64-bit integers (%s, N=%llu)", ((char *[]) { "increasing", "decreasing", "random" })[mode], (long long)N);
  struct fastbuf *f = bopen_tmp(65536);
  /*
   * NOTE(review): text is missing from here on. The rest of test_int64 and
   * the start of main() appear to have been lost; what follows is the option
   * switch of main (the ">= 0" is presumably the end of a getopt-style loop
   * condition):
   *   d -- sorter_debug = atol(optarg)
   *   s -- size parsed by cf_parse_u64(); a non-zero return leads to usage
   *   t -- optarg split on ',' into at most 32 words; t is cleared and one
   *        bit (1 << j) is set per selected test
   *   v -- increments sorter_trace
   * Anything else, or leftover arguments (optind != argc), prints the usage
   * text to stderr and exits with status 1.
   */
  for (u64 i=0; i= 0)
    switch (c)
      {
      case 'd':
        sorter_debug = atol(optarg);
        break;
      case 's':
        if (cf_parse_u64(optarg, &size))
          goto usage;
        break;
      case 't':
        {
          char *w[32];
          int f = str_sepsplit(optarg, ',', w, ARRAY_SIZE(w));
          if (f < 0)
            goto usage;
          t = 0;
          /* NOTE(review): loop header and parsing of each word are damaged; j must stay below TMAX. */
          for (int i=0; i= TMAX)
                goto usage;
              t |= 1 << j;
            }
        }
        break;
      case 'v':
        sorter_trace++;
        break;
      default:
      usage:
        /* NOTE(review): the argument placeholders after -d, -s and -t appear to be missing from this message. */
        fputs("Usage: sort-test [-v] [-d ] [-s ] [-t ]\n", stderr);
        exit(1);
      }
  if (optind != argc)
    goto usage;

  /* NOTE(review): the copy ends here, inside the loop header; the rest of main is not available. */
  for (uint i=0; i