1 /* SPDX-License-Identifier: BSD-3-Clause
2 * Copyright(c) 2018 Intel Corporation
8 #include <rte_cycles.h>
10 #include <rte_hash_crc.h>
11 #include <rte_jhash.h>
12 #include <rte_launch.h>
13 #include <rte_malloc.h>
14 #include <rte_random.h>
15 #include <rte_spinlock.h>
19 #define RTE_RWTEST_FAIL 0
21 #define TOTAL_ENTRY (5*1024*1024)
22 #define TOTAL_INSERT (4.5*1024*1024)
23 #define TOTAL_INSERT_EXT (5*1024*1024)
26 unsigned int core_cnt
[NUM_TEST
] = {2, 4, 8};
28 unsigned int slave_core_ids
[RTE_MAX_LCORE
];
31 uint32_t single_write
;
32 uint32_t read_only
[NUM_TEST
];
33 uint32_t write_only
[NUM_TEST
];
34 uint32_t read_write_r
[NUM_TEST
];
35 uint32_t read_write_w
[NUM_TEST
];
38 static struct perf htm_results
, non_htm_results
;
44 uint32_t rounded_tot_insert
;
48 static rte_atomic64_t gcycles
;
49 static rte_atomic64_t ginsertions
;
51 static rte_atomic64_t gread_cycles
;
52 static rte_atomic64_t gwrite_cycles
;
54 static rte_atomic64_t greads
;
55 static rte_atomic64_t gwrites
;
58 test_hash_readwrite_worker(__attribute__((unused
)) void *arg
)
61 uint32_t lcore_id
= rte_lcore_id();
62 uint64_t begin
, cycles
;
65 ret
= rte_malloc(NULL
, sizeof(int) *
66 tbl_rw_test_param
.num_insert
, 0);
67 for (i
= 0; i
< rte_lcore_count(); i
++) {
68 if (slave_core_ids
[i
] == lcore_id
)
71 offset
= tbl_rw_test_param
.num_insert
* i
;
73 printf("Core #%d inserting and reading %d: %'"PRId64
" - %'"PRId64
"\n",
74 lcore_id
, tbl_rw_test_param
.num_insert
,
75 offset
, offset
+ tbl_rw_test_param
.num_insert
- 1);
77 begin
= rte_rdtsc_precise();
79 for (i
= offset
; i
< offset
+ tbl_rw_test_param
.num_insert
; i
++) {
81 if (rte_hash_lookup(tbl_rw_test_param
.h
,
82 tbl_rw_test_param
.keys
+ i
) > 0)
85 ret
[i
- offset
] = rte_hash_add_key(tbl_rw_test_param
.h
,
86 tbl_rw_test_param
.keys
+ i
);
87 if (ret
[i
- offset
] < 0)
90 /* lookup a random key */
91 uint32_t rand
= rte_rand() % (i
+ 1 - offset
);
93 if (rte_hash_lookup(tbl_rw_test_param
.h
,
94 tbl_rw_test_param
.keys
+ rand
) != ret
[rand
])
98 if (rte_hash_del_key(tbl_rw_test_param
.h
,
99 tbl_rw_test_param
.keys
+ rand
) != ret
[rand
])
102 ret
[rand
] = rte_hash_add_key(tbl_rw_test_param
.h
,
103 tbl_rw_test_param
.keys
+ rand
);
107 if (rte_hash_lookup(tbl_rw_test_param
.h
,
108 tbl_rw_test_param
.keys
+ rand
) != ret
[rand
])
112 cycles
= rte_rdtsc_precise() - begin
;
113 rte_atomic64_add(&gcycles
, cycles
);
114 rte_atomic64_add(&ginsertions
, i
- offset
);
116 for (; i
< offset
+ tbl_rw_test_param
.num_insert
; i
++)
117 tbl_rw_test_param
.keys
[i
] = RTE_RWTEST_FAIL
;
124 init_params(int use_ext
, int use_htm
, int use_jhash
)
128 uint32_t *keys
= NULL
;
129 uint8_t *found
= NULL
;
130 struct rte_hash
*handle
;
132 struct rte_hash_parameters hash_params
= {
133 .entries
= TOTAL_ENTRY
,
134 .key_len
= sizeof(uint32_t),
135 .hash_func_init_val
= 0,
136 .socket_id
= rte_socket_id(),
139 hash_params
.hash_func
= rte_jhash
;
141 hash_params
.hash_func
= rte_hash_crc
;
144 hash_params
.extra_flag
=
145 RTE_HASH_EXTRA_FLAGS_TRANS_MEM_SUPPORT
|
146 RTE_HASH_EXTRA_FLAGS_RW_CONCURRENCY
|
147 RTE_HASH_EXTRA_FLAGS_MULTI_WRITER_ADD
;
149 hash_params
.extra_flag
=
150 RTE_HASH_EXTRA_FLAGS_RW_CONCURRENCY
|
151 RTE_HASH_EXTRA_FLAGS_MULTI_WRITER_ADD
;
154 hash_params
.extra_flag
|=
155 RTE_HASH_EXTRA_FLAGS_EXT_TABLE
;
157 hash_params
.extra_flag
&=
158 ~RTE_HASH_EXTRA_FLAGS_EXT_TABLE
;
160 hash_params
.name
= "tests";
162 handle
= rte_hash_create(&hash_params
);
163 if (handle
== NULL
) {
164 printf("hash creation failed");
168 tbl_rw_test_param
.h
= handle
;
169 keys
= rte_malloc(NULL
, sizeof(uint32_t) * TOTAL_ENTRY
, 0);
172 printf("RTE_MALLOC failed\n");
176 found
= rte_zmalloc(NULL
, sizeof(uint8_t) * TOTAL_ENTRY
, 0);
178 printf("RTE_ZMALLOC failed\n");
182 tbl_rw_test_param
.keys
= keys
;
183 tbl_rw_test_param
.found
= found
;
185 for (i
= 0; i
< TOTAL_ENTRY
; i
++)
192 rte_hash_free(handle
);
198 test_hash_readwrite_functional(int use_ext
, int use_htm
)
201 const void *next_key
;
205 uint32_t duplicated_keys
= 0;
206 uint32_t lost_keys
= 0;
208 int slave_cnt
= rte_lcore_count() - 1;
209 uint32_t tot_insert
= 0;
211 rte_atomic64_init(&gcycles
);
212 rte_atomic64_clear(&gcycles
);
214 rte_atomic64_init(&ginsertions
);
215 rte_atomic64_clear(&ginsertions
);
217 if (init_params(use_ext
, use_htm
, use_jhash
) != 0)
221 tot_insert
= TOTAL_INSERT_EXT
;
223 tot_insert
= TOTAL_INSERT
;
225 tbl_rw_test_param
.num_insert
=
226 tot_insert
/ slave_cnt
;
228 tbl_rw_test_param
.rounded_tot_insert
=
229 tbl_rw_test_param
.num_insert
232 printf("++++++++Start function tests:+++++++++\n");
234 /* Fire all threads. */
235 rte_eal_mp_remote_launch(test_hash_readwrite_worker
,
237 rte_eal_mp_wait_lcore();
239 while (rte_hash_iterate(tbl_rw_test_param
.h
, &next_key
,
240 &next_data
, &iter
) >= 0) {
241 /* Search for the key in the list of keys added .*/
242 i
= *(const uint32_t *)next_key
;
243 tbl_rw_test_param
.found
[i
]++;
246 for (i
= 0; i
< tbl_rw_test_param
.rounded_tot_insert
; i
++) {
247 if (tbl_rw_test_param
.keys
[i
] != RTE_RWTEST_FAIL
) {
248 if (tbl_rw_test_param
.found
[i
] > 1) {
252 if (tbl_rw_test_param
.found
[i
] == 0) {
254 printf("key %d is lost\n", i
);
260 if (duplicated_keys
> 0) {
261 printf("%d key duplicated\n", duplicated_keys
);
266 printf("%d key lost\n", lost_keys
);
270 printf("No key corrupted during read-write test.\n");
272 unsigned long long int cycles_per_insertion
=
273 rte_atomic64_read(&gcycles
) /
274 rte_atomic64_read(&ginsertions
);
276 printf("cycles per insertion and lookup: %llu\n", cycles_per_insertion
);
278 rte_free(tbl_rw_test_param
.found
);
279 rte_free(tbl_rw_test_param
.keys
);
280 rte_hash_free(tbl_rw_test_param
.h
);
281 printf("+++++++++Complete function tests+++++++++\n");
285 rte_free(tbl_rw_test_param
.found
);
286 rte_free(tbl_rw_test_param
.keys
);
287 rte_hash_free(tbl_rw_test_param
.h
);
293 test_rw_reader(void *arg
)
296 uint64_t begin
, cycles
;
297 uint64_t read_cnt
= (uint64_t)((uintptr_t)arg
);
299 begin
= rte_rdtsc_precise();
300 for (i
= 0; i
< read_cnt
; i
++) {
302 rte_hash_lookup_data(tbl_rw_test_param
.h
,
303 tbl_rw_test_param
.keys
+ i
,
305 if (i
!= (uint64_t)(uintptr_t)data
) {
306 printf("lookup find wrong value %"PRIu64
","
308 (uint64_t)(uintptr_t)data
);
313 cycles
= rte_rdtsc_precise() - begin
;
314 rte_atomic64_add(&gread_cycles
, cycles
);
315 rte_atomic64_add(&greads
, i
);
320 test_rw_writer(void *arg
)
323 uint32_t lcore_id
= rte_lcore_id();
324 uint64_t begin
, cycles
;
326 uint64_t start_coreid
= (uint64_t)(uintptr_t)arg
;
329 for (i
= 0; i
< rte_lcore_count(); i
++) {
330 if (slave_core_ids
[i
] == lcore_id
)
334 offset
= TOTAL_INSERT
/ 2 + (i
- (start_coreid
)) *
335 tbl_rw_test_param
.num_insert
;
336 begin
= rte_rdtsc_precise();
337 for (i
= offset
; i
< offset
+ tbl_rw_test_param
.num_insert
; i
++) {
338 ret
= rte_hash_add_key_data(tbl_rw_test_param
.h
,
339 tbl_rw_test_param
.keys
+ i
,
340 (void *)((uintptr_t)i
));
342 printf("writer failed %"PRIu64
"\n", i
);
347 cycles
= rte_rdtsc_precise() - begin
;
348 rte_atomic64_add(&gwrite_cycles
, cycles
);
349 rte_atomic64_add(&gwrites
, tbl_rw_test_param
.num_insert
);
354 test_hash_readwrite_perf(struct perf
*perf_results
, int use_htm
,
360 uint64_t i
, read_cnt
;
362 const void *next_key
;
367 uint32_t duplicated_keys
= 0;
368 uint32_t lost_keys
= 0;
370 uint64_t start
= 0, end
= 0;
372 rte_atomic64_init(&greads
);
373 rte_atomic64_init(&gwrites
);
374 rte_atomic64_clear(&gwrites
);
375 rte_atomic64_clear(&greads
);
377 rte_atomic64_init(&gread_cycles
);
378 rte_atomic64_clear(&gread_cycles
);
379 rte_atomic64_init(&gwrite_cycles
);
380 rte_atomic64_clear(&gwrite_cycles
);
382 if (init_params(0, use_htm
, use_jhash
) != 0)
386 * Do a readers finish faster or writers finish faster test.
387 * When readers finish faster, we timing the readers, and when writers
388 * finish faster, we timing the writers.
389 * Divided by 10 or 2 is just experimental values to vary the workload
393 printf("++++++Start perf test: reader++++++++\n");
394 read_cnt
= TOTAL_INSERT
/ 10;
396 printf("++++++Start perf test: writer++++++++\n");
397 read_cnt
= TOTAL_INSERT
/ 2;
400 /* We first test single thread performance */
401 start
= rte_rdtsc_precise();
402 /* Insert half of the keys */
403 for (i
= 0; i
< TOTAL_INSERT
/ 2; i
++) {
404 ret
= rte_hash_add_key_data(tbl_rw_test_param
.h
,
405 tbl_rw_test_param
.keys
+ i
,
406 (void *)((uintptr_t)i
));
408 printf("Failed to insert half of keys\n");
412 end
= rte_rdtsc_precise() - start
;
413 perf_results
->single_write
= end
/ i
;
415 start
= rte_rdtsc_precise();
417 for (i
= 0; i
< read_cnt
; i
++) {
419 rte_hash_lookup_data(tbl_rw_test_param
.h
,
420 tbl_rw_test_param
.keys
+ i
,
422 if (i
!= (uint64_t)(uintptr_t)data
) {
423 printf("lookup find wrong value"
424 " %"PRIu64
",%"PRIu64
"\n", i
,
425 (uint64_t)(uintptr_t)data
);
429 end
= rte_rdtsc_precise() - start
;
430 perf_results
->single_read
= end
/ i
;
432 for (n
= 0; n
< NUM_TEST
; n
++) {
433 unsigned int tot_slave_lcore
= rte_lcore_count() - 1;
434 if (tot_slave_lcore
< core_cnt
[n
] * 2)
437 rte_atomic64_clear(&greads
);
438 rte_atomic64_clear(&gread_cycles
);
439 rte_atomic64_clear(&gwrites
);
440 rte_atomic64_clear(&gwrite_cycles
);
442 rte_hash_reset(tbl_rw_test_param
.h
);
444 tbl_rw_test_param
.num_insert
= TOTAL_INSERT
/ 2 / core_cnt
[n
];
445 tbl_rw_test_param
.rounded_tot_insert
= TOTAL_INSERT
/ 2 +
446 tbl_rw_test_param
.num_insert
*
449 for (i
= 0; i
< TOTAL_INSERT
/ 2; i
++) {
450 ret
= rte_hash_add_key_data(tbl_rw_test_param
.h
,
451 tbl_rw_test_param
.keys
+ i
,
452 (void *)((uintptr_t)i
));
454 printf("Failed to insert half of keys\n");
459 /* Then test multiple thread case but only all reads or
463 /* Test only reader cases */
464 for (i
= 0; i
< core_cnt
[n
]; i
++)
465 rte_eal_remote_launch(test_rw_reader
,
466 (void *)(uintptr_t)read_cnt
,
469 rte_eal_mp_wait_lcore();
472 /* Test only writer cases */
473 for (; i
< core_cnt
[n
] * 2; i
++)
474 rte_eal_remote_launch(test_rw_writer
,
475 (void *)((uintptr_t)start_coreid
),
478 rte_eal_mp_wait_lcore();
481 unsigned long long int cycles_per_insertion
=
482 rte_atomic64_read(&gread_cycles
) /
483 rte_atomic64_read(&greads
);
484 perf_results
->read_only
[n
] = cycles_per_insertion
;
485 printf("Reader only: cycles per lookup: %llu\n",
486 cycles_per_insertion
);
490 unsigned long long int cycles_per_insertion
=
491 rte_atomic64_read(&gwrite_cycles
) /
492 rte_atomic64_read(&gwrites
);
493 perf_results
->write_only
[n
] = cycles_per_insertion
;
494 printf("Writer only: cycles per writes: %llu\n",
495 cycles_per_insertion
);
498 rte_atomic64_clear(&greads
);
499 rte_atomic64_clear(&gread_cycles
);
500 rte_atomic64_clear(&gwrites
);
501 rte_atomic64_clear(&gwrite_cycles
);
503 rte_hash_reset(tbl_rw_test_param
.h
);
505 for (i
= 0; i
< TOTAL_INSERT
/ 2; i
++) {
506 ret
= rte_hash_add_key_data(tbl_rw_test_param
.h
,
507 tbl_rw_test_param
.keys
+ i
,
508 (void *)((uintptr_t)i
));
510 printf("Failed to insert half of keys\n");
515 start_coreid
= core_cnt
[n
];
518 for (i
= core_cnt
[n
]; i
< core_cnt
[n
] * 2; i
++)
519 rte_eal_remote_launch(test_rw_writer
,
520 (void *)((uintptr_t)start_coreid
),
522 for (i
= 0; i
< core_cnt
[n
]; i
++)
523 rte_eal_remote_launch(test_rw_reader
,
524 (void *)(uintptr_t)read_cnt
,
527 for (i
= 0; i
< core_cnt
[n
]; i
++)
528 rte_eal_remote_launch(test_rw_reader
,
529 (void *)(uintptr_t)read_cnt
,
531 for (; i
< core_cnt
[n
] * 2; i
++)
532 rte_eal_remote_launch(test_rw_writer
,
533 (void *)((uintptr_t)start_coreid
),
537 rte_eal_mp_wait_lcore();
540 memset(tbl_rw_test_param
.found
, 0, TOTAL_ENTRY
);
541 while (rte_hash_iterate(tbl_rw_test_param
.h
,
542 &next_key
, &next_data
, &iter
) >= 0) {
543 /* Search for the key in the list of keys added .*/
544 i
= *(const uint32_t *)next_key
;
545 tbl_rw_test_param
.found
[i
]++;
548 for (i
= 0; i
< tbl_rw_test_param
.rounded_tot_insert
; i
++) {
549 if (tbl_rw_test_param
.keys
[i
] != RTE_RWTEST_FAIL
) {
550 if (tbl_rw_test_param
.found
[i
] > 1) {
554 if (tbl_rw_test_param
.found
[i
] == 0) {
556 printf("key %"PRIu64
" is lost\n", i
);
562 if (duplicated_keys
> 0) {
563 printf("%d key duplicated\n", duplicated_keys
);
568 printf("%d key lost\n", lost_keys
);
572 printf("No key corrupted during read-write test.\n");
575 unsigned long long int cycles_per_insertion
=
576 rte_atomic64_read(&gread_cycles
) /
577 rte_atomic64_read(&greads
);
578 perf_results
->read_write_r
[n
] = cycles_per_insertion
;
579 printf("Read-write cycles per lookup: %llu\n",
580 cycles_per_insertion
);
584 unsigned long long int cycles_per_insertion
=
585 rte_atomic64_read(&gwrite_cycles
) /
586 rte_atomic64_read(&gwrites
);
587 perf_results
->read_write_w
[n
] = cycles_per_insertion
;
588 printf("Read-write cycles per writes: %llu\n",
589 cycles_per_insertion
);
594 rte_free(tbl_rw_test_param
.found
);
595 rte_free(tbl_rw_test_param
.keys
);
596 rte_hash_free(tbl_rw_test_param
.h
);
600 rte_free(tbl_rw_test_param
.found
);
601 rte_free(tbl_rw_test_param
.keys
);
602 rte_hash_free(tbl_rw_test_param
.h
);
609 test_hash_readwrite_main(void)
612 * Variables used to choose different tests.
613 * use_htm indicates if hardware transactional memory should be used.
614 * reader_faster indicates if the reader threads should finish earlier
615 * than writer threads. This is to timing either reader threads or
616 * writer threads for performance numbers.
618 int use_htm
, use_ext
, reader_faster
;
619 unsigned int i
= 0, core_id
= 0;
621 if (rte_lcore_count() <= 2) {
622 printf("More than two lcores are required "
623 "to do read write test\n");
627 RTE_LCORE_FOREACH_SLAVE(core_id
) {
628 slave_core_ids
[i
] = core_id
;
632 setlocale(LC_NUMERIC
, "");
634 if (rte_tm_supported()) {
635 printf("Hardware transactional memory (lock elision) "
638 printf("Test read-write with Hardware transactional memory\n");
643 if (test_hash_readwrite_functional(use_ext
, use_htm
) < 0)
647 if (test_hash_readwrite_functional(use_ext
, use_htm
) < 0)
651 if (test_hash_readwrite_perf(&htm_results
, use_htm
,
656 if (test_hash_readwrite_perf(&htm_results
, use_htm
,
660 printf("Hardware transactional memory (lock elision) "
661 "is NOT supported\n");
664 printf("Test read-write without Hardware transactional memory\n");
667 if (test_hash_readwrite_functional(use_ext
, use_htm
) < 0)
671 if (test_hash_readwrite_functional(use_ext
, use_htm
) < 0)
675 if (test_hash_readwrite_perf(&non_htm_results
, use_htm
,
679 if (test_hash_readwrite_perf(&non_htm_results
, use_htm
,
683 printf("================\n");
684 printf("Results summary:\n");
685 printf("================\n");
687 printf("single read: %u\n", htm_results
.single_read
);
688 printf("single write: %u\n", htm_results
.single_write
);
689 for (i
= 0; i
< NUM_TEST
; i
++) {
690 printf("+++ core_cnt: %u +++\n", core_cnt
[i
]);
692 printf(" read only: %u\n", htm_results
.read_only
[i
]);
693 printf(" write only: %u\n", htm_results
.write_only
[i
]);
694 printf(" read-write read: %u\n", htm_results
.read_write_r
[i
]);
695 printf(" read-write write: %u\n", htm_results
.read_write_w
[i
]);
697 printf("non HTM:\n");
698 printf(" read only: %u\n", non_htm_results
.read_only
[i
]);
699 printf(" write only: %u\n", non_htm_results
.write_only
[i
]);
700 printf(" read-write read: %u\n",
701 non_htm_results
.read_write_r
[i
]);
702 printf(" read-write write: %u\n",
703 non_htm_results
.read_write_w
[i
]);
709 REGISTER_TEST_COMMAND(hash_readwrite_autotest
, test_hash_readwrite_main
);