From 46f74780f5ddfa903b98e8ff48a000150fccf2b7 Mon Sep 17 00:00:00 2001 From: nikhil nanal Date: Mon, 26 Aug 2024 15:01:27 -0700 Subject: [PATCH] fabtests: New fabtest fi_flood to test over subscription of resources 1. MR cache based registrations tests regsiter and send in batch and sequential modes while flooding the cache beyond the maximum size. 2. Test receipt of unexpected messages by overwhelming the receiver Signed-off-by: nikhil nanal --- fabtests/Makefile.am | 6 + fabtests/functional/flood.c | 314 +++++++++++++++++++++++++++++++ fabtests/functional/rdm_atomic.c | 3 +- fabtests/include/shared.h | 1 - fabtests/man/man1/fi_flood.1 | 1 + fabtests/scripts/runfabtests.sh | 6 +- 6 files changed, 326 insertions(+), 5 deletions(-) create mode 100644 fabtests/functional/flood.c create mode 100644 fabtests/man/man1/fi_flood.1 diff --git a/fabtests/Makefile.am b/fabtests/Makefile.am index b97ca169e5f..17572aa02a4 100644 --- a/fabtests/Makefile.am +++ b/fabtests/Makefile.am @@ -41,6 +41,7 @@ bin_PROGRAMS = \ functional/fi_rdm_stress \ functional/fi_multi_recv \ functional/fi_bw \ + functional/fi_flood \ functional/fi_rdm_multi_client \ functional/fi_loopback \ benchmarks/fi_msg_pingpong \ @@ -362,6 +363,10 @@ functional_fi_bw_SOURCES = \ functional/bw.c functional_fi_bw_LDADD = libfabtests.la +functional_fi_flood_SOURCES = \ + functional/flood.c +functional_fi_flood_LDADD = libfabtests.la + functional_fi_rdm_multi_client_SOURCES = \ functional/rdm_multi_client.c functional_fi_rdm_multi_client_LDADD = libfabtests.la @@ -652,6 +657,7 @@ dummy_man_pages = \ man/man1/fi_getinfo_test.1 \ man/man1/fi_mr_test.1 \ man/man1/fi_bw.1 \ + man/man1/fi_flood.1 \ man/man1/fi_rdm_multi_client.1 \ man/man1/fi_ubertest.1 \ man/man1/fi_efa_ep_rnr_retry.1 diff --git a/fabtests/functional/flood.c b/fabtests/functional/flood.c new file mode 100644 index 00000000000..875ebce2387 --- /dev/null +++ b/fabtests/functional/flood.c @@ -0,0 +1,314 @@ +/* + * Copyright (c) 2019 Intel Corporation. All rights reserved. + * + * This software is available to you under the BSD license + * below: + * + * Redistribution and use in source and binary forms, with or + * without modification, are permitted provided that the following + * conditions are met: + * + * - Redistributions of source code must retain the above + * copyright notice, this list of conditions and the following + * disclaimer. + * + * - Redistributions in binary form must reproduce the above + * copyright notice, this list of conditions and the following + * disclaimer in the documentation and/or other materials + * provided with the distribution. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF + * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS + * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN + * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN + * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + * SOFTWARE. + */ + +#include +#include +#include +#include + +#include + +int sleep_time = 0; + +static ssize_t post_one_tx(struct ft_context *msg) +{ + ssize_t ret; + + if (ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE)) { + ret = ft_fill_buf(msg->buf + ft_tx_prefix_size(), + opts.transfer_size); + if (ret) + return ret; + } + + return ft_post_tx_buf(ep, remote_fi_addr, opts.transfer_size, + NO_CQ_DATA, &msg->context, msg->buf, + msg->desc, 0); +} + +static ssize_t wait_check_rx_bufs(void) +{ + ssize_t ret; + int i; + + ret = ft_get_rx_comp(rx_seq); + if (ret) + return ret; + + if (!ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE)) + return 0; + + for (i = 0; i < opts.window_size; i++) { + ret = ft_check_buf((char *) rx_ctx_arr[i].buf + + ft_rx_prefix_size(), opts.transfer_size); + if (ret) + return ret; + } + + return 0; +} + +static int post_rx_sync(void) +{ + int ret; + + ret = ft_post_rx(ep, rx_size, &rx_ctx); + if (ret) + return ret; + + if (opts.dst_addr) { + ret = ft_tx(ep, remote_fi_addr, 1, &tx_ctx); + if (ret) + return ret; + + ret = ft_get_rx_comp(rx_seq); + } else { + ret = ft_get_rx_comp(rx_seq); + if (ret) + return ret; + + ret = ft_tx(ep, remote_fi_addr, 1, &tx_ctx); + } + + return ret; +} +static void mr_close_all(struct ft_context *ctx_arr, int window_size) +{ + int i; + for (i = 0; i < window_size; i++) + FT_CLOSE_FID(ctx_arr[i].mr); +} + +static int run_seq_mr_send(void) { + + int ret; + int i; + + mr_close_all(tx_ctx_arr, opts.window_size); + mr_close_all(rx_ctx_arr, opts.window_size); + + printf("Sequential memory registration:\n"); + if (opts.dst_addr) { + for (i = 0; i < opts.window_size; i++) { + ret = ft_reg_mr(fi, tx_ctx_arr[i].buf, tx_mr_size, + ft_info_to_mr_access(fi), + FT_TX_MR_KEY + i, opts.iface, opts.device, + &(tx_ctx_arr[i].mr), &(tx_ctx_arr[i].desc)); + if (ret) + return ret; + + if (ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE)) { + ret = ft_fill_buf(tx_ctx_arr[i].buf + ft_tx_prefix_size(), + opts.transfer_size); + if (ret) + return ret; + } + + ft_post_tx_buf(ep, remote_fi_addr, opts.transfer_size, + NO_CQ_DATA, &(tx_ctx_arr[i].context), + tx_ctx_arr[i].buf, tx_ctx_arr[i].desc, + ft_tag); + ret = ft_get_tx_comp(tx_seq); + if (ret) + return ret; + FT_CLOSE_FID(tx_ctx_arr[i].mr); + } + } + else { + for (i = 0; i < opts.window_size; i++) { + ret = ft_reg_mr(fi, rx_ctx_arr[i].buf, rx_mr_size, + ft_info_to_mr_access(fi), FT_RX_MR_KEY + i, + opts.iface, opts.device, &(rx_ctx_arr[i].mr), + &(rx_ctx_arr[i].desc)); + if (ret) + return ret; + + ft_post_rx_buf(ep, opts.transfer_size, + &(rx_ctx_arr[i].context), rx_ctx_arr[i].buf, + rx_ctx_arr[i].desc, ft_tag); + ret = wait_check_rx_bufs(); + if (ret) + return ret; + FT_CLOSE_FID(rx_ctx_arr[i].mr); + } + } + + if (opts.options & FT_OPT_OOB_SYNC) + ret = ft_sync(); + else + ret = post_rx_sync(); + + return ret; +} +static int run_batch_mr_send(void) +{ + int ret, i; + + /* Receive side delay is used in order to let the sender + get ahead of the receiver and post multiple sends + before the receiver begins processing them. */ + if (!opts.dst_addr) + sleep(sleep_time); + + printf("Batch memory registration:\n"); + if (opts.dst_addr) { + for (i = 0; i < opts.window_size; i++) { + ret = post_one_tx(&tx_ctx_arr[i]); + if (ret) + return ret; + } + + ret = ft_get_tx_comp(tx_seq); + if (ret) + return ret; + } else { + for (i = 0; i < opts.window_size; i++) { + ret = ft_post_rx_buf(ep, opts.transfer_size, + &rx_ctx_arr[i].context, + rx_ctx_arr[i].buf, + rx_ctx_arr[i].desc, 0); + if (ret) + return ret; + } + + ret = wait_check_rx_bufs(); + if (ret) + return ret; + } + + if (opts.options & FT_OPT_OOB_SYNC) + ret = ft_sync(); + else + ret = post_rx_sync(); + + return ret; +} + +static int run(void) +{ + int ret; + + ret = hints->ep_attr->type == FI_EP_MSG ? + ft_init_fabric_cm() : ft_init_fabric(); + if (ret) + return ret; + + ret = ft_tx(ep, remote_fi_addr, 1, &tx_ctx); + if (ret) + return ret; + ret = ft_get_rx_comp(rx_seq); + if (ret) + return ret; + + ret = run_batch_mr_send(); + if (ret) + goto out; + + ret = run_seq_mr_send(); + if (ret) + goto out; + +out: + return ret; +} + +int main(int argc, char **argv) +{ + int op, ret; + + opts = INIT_OPTS; + + hints = fi_allocinfo(); + if (!hints) + return EXIT_FAILURE; + + hints->ep_attr->type = FI_EP_RDM; + + while ((op = getopt(argc, argv, "UW:vT:h" CS_OPTS ADDR_OPTS INFO_OPTS)) != -1) { + switch (op) { + default: + ft_parse_addr_opts(op, optarg, &opts); + ft_parseinfo(op, optarg, hints, &opts); + ft_parsecsopts(op, optarg, &opts); + break; + case 'W': + opts.window_size = atoi(optarg); + break; + case 'U': + hints->tx_attr->op_flags |= FI_DELIVERY_COMPLETE; + break; + case 'v': + opts.options |= FT_OPT_VERIFY_DATA; + break; + case 'T': + sleep_time = atoi(optarg); + break; + case '?': + case 'h': + ft_usage(argv[0], "test to oversubscribe mr cache and receiver with unexpected msgs."); + FT_PRINT_OPTS_USAGE("-T sleep_time", + "Receive side delay before starting"); + FT_PRINT_OPTS_USAGE("-v", "Enable data verification"); + FT_PRINT_OPTS_USAGE("-W window_size", + "Set transmit window size before waiting for completion"); + return EXIT_FAILURE; + } + } + + if (optind < argc) + opts.dst_addr = argv[optind]; + + hints->caps = FI_MSG; + hints->mode = FI_CONTEXT; + hints->domain_attr->mr_mode = opts.mr_mode; + hints->addr_format = opts.address_format; + + opts.options |= FT_OPT_ALLOC_MULT_MR; + + if (hints->ep_attr->type == FI_EP_DGRAM) { + fprintf(stderr, "This test does not support DGRAM endpoints\n"); + return -FI_EINVAL; + } + + if (opts.options & FT_OPT_VERIFY_DATA) { + hints->tx_attr->msg_order |= FI_ORDER_SAS; + hints->rx_attr->msg_order |= FI_ORDER_SAS; + } + + ret = run(); + if (ret) { + FT_ERR( "Tests failed\n"); + goto err; + } + FT_DEBUG("Tests Passed\n"); +err: + ft_free_res(); + + return ft_exit_code(ret); +} \ No newline at end of file diff --git a/fabtests/functional/rdm_atomic.c b/fabtests/functional/rdm_atomic.c index cef31ecb229..632c36f0f89 100644 --- a/fabtests/functional/rdm_atomic.c +++ b/fabtests/functional/rdm_atomic.c @@ -504,9 +504,10 @@ int main(int argc, char **argv) hints->caps = FI_MSG | FI_ATOMICS; hints->mode = FI_CONTEXT; hints->domain_attr->mr_mode = opts.mr_mode; + printf("HINTS:\n%s\n---------------------------------------\n", + fi_tostr(hints, FI_TYPE_INFO)); ret = run(); - free_res(); ft_free_res(); return ft_exit_code(ret); diff --git a/fabtests/include/shared.h b/fabtests/include/shared.h index 7d56fdd7257..73cbdbfd8f7 100644 --- a/fabtests/include/shared.h +++ b/fabtests/include/shared.h @@ -257,7 +257,6 @@ extern struct fi_cq_attr cq_attr; extern struct fi_cntr_attr cntr_attr; extern struct fi_rma_iov remote; - extern char test_name[50]; extern struct timespec start, end; extern struct ft_opts opts; diff --git a/fabtests/man/man1/fi_flood.1 b/fabtests/man/man1/fi_flood.1 new file mode 100644 index 00000000000..2d5fda814d2 --- /dev/null +++ b/fabtests/man/man1/fi_flood.1 @@ -0,0 +1 @@ +.so man7/fabtests.7 diff --git a/fabtests/scripts/runfabtests.sh b/fabtests/scripts/runfabtests.sh index 8b402aa38e1..2c7f984a902 100755 --- a/fabtests/scripts/runfabtests.sh +++ b/fabtests/scripts/runfabtests.sh @@ -150,9 +150,9 @@ functional_tests=( "fi_inject_test -N -A inject -v" "fi_inject_test -A inj_complete -v" "fi_inject_test -N -A inj_complete -v" - "fi_bw -e rdm -v -T 1" - "fi_bw -e rdm -v -T 1 -U" - "fi_bw -e msg -v -T 1" + "fi_flood -e rdm -v -T 1" + "fi_flood -e rdm -v -T 1 -U" + "fi_flood -e msg -v -T 1" "fi_rdm_multi_client -C 10 -I 5" "fi_rdm_multi_client -C 10 -I 5 -U" )