Skip to content

Commit

Permalink
fabtests: New fabtest fi_flood to test oversubscription of resources
Browse files Browse the repository at this point in the history
	  1.  MR cache based registrations
	  tests register and send in batch and sequential modes while
	  flooding the cache beyond the maximum size.
	  2. Test receipt of unexpected messages by overwhelming the receiver

Signed-off-by: nikhil nanal <[email protected]>
  • Loading branch information
nikhilnanal authored and nikhil.nanal committed Oct 15, 2024
1 parent d9c31ef commit ac31c17
Show file tree
Hide file tree
Showing 7 changed files with 321 additions and 14 deletions.
10 changes: 5 additions & 5 deletions fabtests/Makefile.am
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@ bin_PROGRAMS = \
functional/fi_rdm_atomic \
functional/fi_rdm_stress \
functional/fi_multi_recv \
functional/fi_bw \
functional/fi_flood \
functional/fi_rdm_multi_client \
functional/fi_loopback \
benchmarks/fi_msg_pingpong \
Expand Down Expand Up @@ -360,9 +360,9 @@ functional_fi_multi_recv_SOURCES = \
functional/multi_recv.c
functional_fi_multi_recv_LDADD = libfabtests.la

functional_fi_bw_SOURCES = \
functional/bw.c
functional_fi_bw_LDADD = libfabtests.la
functional_fi_flood_SOURCES = \
functional/flood.c
functional_fi_flood_LDADD = libfabtests.la

functional_fi_rdm_multi_client_SOURCES = \
functional/rdm_multi_client.c
Expand Down Expand Up @@ -651,7 +651,7 @@ dummy_man_pages = \
man/man1/fi_eq_test.1 \
man/man1/fi_getinfo_test.1 \
man/man1/fi_mr_test.1 \
man/man1/fi_bw.1 \
man/man1/fi_flood.1 \
man/man1/fi_rdm_multi_client.1 \
man/man1/fi_ubertest.1 \
man/man1/fi_efa_ep_rnr_retry.1
Expand Down
2 changes: 1 addition & 1 deletion fabtests/fabtests.vcxproj
Original file line number Diff line number Diff line change
Expand Up @@ -239,7 +239,7 @@
<ClCompile Include="functional\rdm_netdir.c" />
<ClCompile Include="functional\scalable_ep.c" />
<ClCompile Include="functional\inject_test.c" />
<ClCompile Include="functional\bw.c" />
<ClCompile Include="functional\flood.c" />
<ClCompile Include="unit\av_test.c" />
<ClCompile Include="unit\cntr_test.c" />
<ClCompile Include="unit\common.c" />
Expand Down
2 changes: 1 addition & 1 deletion fabtests/fabtests.vcxproj.filters
Original file line number Diff line number Diff line change
Expand Up @@ -225,7 +225,7 @@
<ClCompile Include="functional\unexpected_msg.c">
<Filter>Source Files\functional</Filter>
</ClCompile>
<ClCompile Include="functional\bw.c">
<ClCompile Include="functional\flood.c">
<Filter>Source Files\functional</Filter>
</ClCompile>
<ClCompile Include="functional\inject_test.c">
Expand Down
305 changes: 305 additions & 0 deletions fabtests/functional/flood.c
Original file line number Diff line number Diff line change
@@ -0,0 +1,305 @@
/*
* Copyright (c) Intel Corporation. All rights reserved.
*
* This software is available to you under the BSD license
* below:
*
* Redistribution and use in source and binary forms, with or
* without modification, are permitted provided that the following
* conditions are met:
*
* - Redistributions of source code must retain the above
* copyright notice, this list of conditions and the following
* disclaimer.
*
* - Redistributions in binary form must reproduce the above
* copyright notice, this list of conditions and the following
* disclaimer in the documentation and/or other materials
* provided with the distribution.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/

#include <stdio.h>
#include <stdlib.h>
#include <getopt.h>
#include <unistd.h>

#include <shared.h>

/* Seconds the receiving side sleeps at the start of the batch phase; set with -T. */
static int sleep_time = 0;

/*
 * Post one transmit of opts.transfer_size bytes using the buffer, descriptor
 * and context stored in @msg.
 *
 * If ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE) holds, the payload
 * region (the buffer past ft_tx_prefix_size()) is filled with ft_fill_buf()
 * before posting.
 *
 * Returns the non-zero ft_fill_buf() result if filling fails, otherwise
 * whatever ft_post_tx_buf() returns.
 */
static ssize_t post_one_tx(struct ft_context *msg)
{
	ssize_t rc = 0;

	if (ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE))
		rc = ft_fill_buf(msg->buf + ft_tx_prefix_size(),
				 opts.transfer_size);

	if (rc != 0)
		return rc;

	return ft_post_tx_buf(ep, remote_fi_addr, opts.transfer_size,
			      NO_CQ_DATA, &msg->context, msg->buf,
			      msg->desc, 0);
}

/*
 * Wait for receive completions up to rx_seq and, when
 * ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE) holds, validate the
 * payload of every buffer in rx_ctx_arr (opts.window_size entries) with
 * ft_check_buf().
 *
 * Returns 0 when the wait succeeds and either verification is off or all
 * buffers pass; otherwise the first non-zero result encountered.
 */
static ssize_t wait_check_rx_bufs(void)
{
	ssize_t rc;
	int slot;

	rc = ft_get_rx_comp(rx_seq);
	if (rc != 0)
		return rc;

	if (!ft_check_opts(FT_OPT_VERIFY_DATA | FT_OPT_ACTIVE))
		return 0;

	/* rc is 0 here; stop at the first buffer that fails the check. */
	for (slot = 0; rc == 0 && slot < opts.window_size; slot++)
		rc = ft_check_buf((char *) rx_ctx_arr[slot].buf +
				  ft_rx_prefix_size(), opts.transfer_size);

	return rc;
}

/*
 * In-band synchronization between the two sides.
 *
 * A receive is posted first. The side with opts.dst_addr set then sends
 * (ft_tx with a size argument of 1) and waits for its receive completion;
 * the other side waits for its receive completion and then sends.
 *
 * Returns 0 on success or the first non-zero result from the calls made.
 */
static int post_rx_sync(void)
{
	int rc;

	rc = ft_post_rx(ep, rx_size, &rx_ctx);
	if (rc)
		return rc;

	if (!opts.dst_addr) {
		/* No destination address: wait for the peer, then answer. */
		rc = ft_get_rx_comp(rx_seq);
		if (rc)
			return rc;

		rc = ft_tx(ep, remote_fi_addr, 1, &tx_ctx);
		return rc;
	}

	/* Destination address given: send first, then wait for the reply. */
	rc = ft_tx(ep, remote_fi_addr, 1, &tx_ctx);
	if (rc)
		return rc;

	rc = ft_get_rx_comp(rx_seq);
	return rc;
}

/*
 * Apply FT_CLOSE_FID() to the mr member of the first @window_size entries
 * of @ctx_arr, in ascending index order.
 */
static void mr_close_all(struct ft_context *ctx_arr, int window_size)
{
	int idx = 0;

	while (idx < window_size) {
		FT_CLOSE_FID(ctx_arr[idx].mr);
		idx++;
	}
}

static int run_seq_mr_send(void) {

int ret;
int i;

mr_close_all(tx_ctx_arr, opts.window_size);
mr_close_all(rx_ctx_arr, opts.window_size);

printf("Sequential memory registration:");
if (opts.dst_addr) {
for (i = 0; i < opts.window_size; i++) {
ret = ft_reg_mr(fi, tx_ctx_arr[i].buf, tx_mr_size,
ft_info_to_mr_access(fi),
FT_TX_MR_KEY + i, opts.iface, opts.device,
&(tx_ctx_arr[i].mr), &(tx_ctx_arr[i].desc));
if (ret)
goto err;

ret = post_one_tx(&tx_ctx_arr[i]);
if (ret)
goto err;

ret = ft_get_tx_comp(tx_seq);
if (ret)
goto err;

FT_CLOSE_FID(tx_ctx_arr[i].mr);
}
} else {
for (i = 0; i < opts.window_size; i++) {
ret = ft_reg_mr(fi, rx_ctx_arr[i].buf, rx_mr_size,
ft_info_to_mr_access(fi), FT_RX_MR_KEY + i, opts.iface, opts.device,
&(rx_ctx_arr[i].mr),
&(rx_ctx_arr[i].desc));
if (ret)
goto err;

ret = ft_post_rx_buf(ep, opts.transfer_size,
&(rx_ctx_arr[i].context),
rx_ctx_arr[i].buf,
rx_ctx_arr[i].desc, ft_tag);
if (ret)
goto err;

ret = wait_check_rx_bufs();
if (ret)
goto err;

FT_CLOSE_FID(rx_ctx_arr[i].mr);
}
}
if (opts.options & FT_OPT_OOB_SYNC)
ret = ft_sync();
else
ret = post_rx_sync();
err:
printf("%s\n", ret ? "Fail" : "Pass");
return ret;
}

/*
 * Batch phase: post one transfer per window slot back to back, then wait
 * once for all of them to complete.
 *
 * The side with opts.dst_addr set posts opts.window_size sends and waits
 * on the transmit completions; the other side posts opts.window_size
 * receives and waits via wait_check_rx_bufs(). Afterwards both sides
 * synchronize (ft_sync() when FT_OPT_OOB_SYNC is set, post_rx_sync()
 * otherwise).
 *
 * Prints "Batch memory registration:" followed by "Pass" or "Fail".
 * Returns 0 on success or the first non-zero result encountered.
 */
static int run_batch_mr_send(void)
{
	int status;
	int idx;

	/*
	 * Delay the receiving side so that the sender can run ahead and
	 * post several sends before any receive has been posted.
	 */
	if (!opts.dst_addr)
		sleep(sleep_time);

	printf("Batch memory registration:");

	if (!opts.dst_addr) {
		idx = 0;
		while (idx < opts.window_size) {
			status = ft_post_rx_buf(ep, opts.transfer_size,
						&rx_ctx_arr[idx].context,
						rx_ctx_arr[idx].buf,
						rx_ctx_arr[idx].desc, 0);
			if (status)
				goto report;
			idx++;
		}

		status = wait_check_rx_bufs();
		if (status)
			goto report;
	} else {
		idx = 0;
		while (idx < opts.window_size) {
			status = post_one_tx(&tx_ctx_arr[idx]);
			if (status)
				goto report;
			idx++;
		}

		status = ft_get_tx_comp(tx_seq);
		if (status)
			goto report;
	}

	if (opts.options & FT_OPT_OOB_SYNC)
		status = ft_sync();
	else
		status = post_rx_sync();

report:
	printf("%s\n", status ? "Fail" : "Pass");
	return status;
}

/*
 * Initialize the fabric resources (ft_init_fabric_cm() for FI_EP_MSG
 * endpoints, ft_init_fabric() otherwise) and run the batch phase followed
 * by the sequential phase.
 *
 * Returns 0 if every step succeeds, otherwise the first non-zero result;
 * later steps are skipped after a failure.
 */
static int run(void)
{
	int rc;

	if (hints->ep_attr->type == FI_EP_MSG)
		rc = ft_init_fabric_cm();
	else
		rc = ft_init_fabric();
	if (rc)
		return rc;

	rc = run_batch_mr_send();
	if (!rc)
		rc = run_seq_mr_send();

	return rc;
}

/*
 * fi_flood entry point.
 *
 * Parses the command line, fills in the fi_info hints, runs the test and
 * releases resources through ft_free_res().
 *
 * Options handled here:
 *   -W window_size  number of transfers posted per batch (must be > 0)
 *   -T sleep_time   receive-side delay in seconds (must be >= 0)
 *   -U              request FI_DELIVERY_COMPLETE on transmits
 *   -v              enable data verification
 *   -h / -?         print usage
 * Every other option is forwarded to the common fabtests parsers.
 *
 * The process exit status is ft_exit_code() of the test result; usage
 * requests and a failed hints allocation exit with EXIT_FAILURE.
 */
int main(int argc, char **argv)
{
	int op, ret;

	opts = INIT_OPTS;
	/*
	 * NOTE(review): judging by the flag names and by the use of
	 * tx_ctx_arr/rx_ctx_arr in this file, these request per-slot
	 * buffers/MRs and leave receive posting to the test itself;
	 * confirm against the fabtests common code.
	 */
	opts.options |= FT_OPT_ALLOC_MULT_MR;
	opts.options |= FT_OPT_NO_PRE_POSTED_RX;

	hints = fi_allocinfo();
	if (!hints)
		return EXIT_FAILURE;

	hints->ep_attr->type = FI_EP_RDM;

	while ((op = getopt(argc, argv, "UW:vT:h" CS_OPTS ADDR_OPTS INFO_OPTS)) != -1) {
		switch (op) {
		default:
			ft_parse_addr_opts(op, optarg, &opts);
			ft_parseinfo(op, optarg, hints, &opts);
			ft_parsecsopts(op, optarg, &opts);
			break;
		case 'W':
			opts.window_size = atoi(optarg);
			/* The window drives every loop bound in this test. */
			if (opts.window_size <= 0) {
				fprintf(stderr,
					"Invalid window size '%s': must be a positive integer\n",
					optarg);
				ret = -FI_EINVAL;
				goto out;
			}
			break;
		case 'U':
			hints->tx_attr->op_flags |= FI_DELIVERY_COMPLETE;
			break;
		case 'v':
			opts.options |= FT_OPT_VERIFY_DATA;
			break;
		case 'T':
			sleep_time = atoi(optarg);
			/*
			 * sleep() takes an unsigned count; a negative value
			 * would turn into an enormous delay.
			 */
			if (sleep_time < 0) {
				fprintf(stderr,
					"Invalid sleep time '%s': must not be negative\n",
					optarg);
				ret = -FI_EINVAL;
				goto out;
			}
			break;
		case '?':
		case 'h':
			ft_usage(argv[0], "test to oversubscribe mr cache and receiver with unexpected msgs.");
			FT_PRINT_OPTS_USAGE("-T sleep_time",
				"Receive side delay before starting");
			FT_PRINT_OPTS_USAGE("-U",
				"Request delivery complete on transmits");
			FT_PRINT_OPTS_USAGE("-v", "Enable data verification");
			FT_PRINT_OPTS_USAGE("-W window_size",
				"Set transmit window size before waiting for completion");
			return EXIT_FAILURE;
		}
	}

	if (optind < argc)
		opts.dst_addr = argv[optind];

	hints->caps = FI_MSG;
	hints->mode = FI_CONTEXT;
	hints->domain_attr->mr_mode = opts.mr_mode;
	hints->addr_format = opts.address_format;

	if (hints->ep_attr->type == FI_EP_DGRAM) {
		fprintf(stderr, "This test does not support DGRAM endpoints\n");
		/* Leave through the common exit so hints are released. */
		ret = -FI_EINVAL;
		goto out;
	}

	if (opts.options & FT_OPT_VERIFY_DATA) {
		hints->tx_attr->msg_order |= FI_ORDER_SAS;
		hints->rx_attr->msg_order |= FI_ORDER_SAS;
	}

	ret = run();

out:
	ft_free_res();

	return ft_exit_code(ret);
}
1 change: 1 addition & 0 deletions fabtests/man/man1/fi_flood.1
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
.so man7/fabtests.7
6 changes: 3 additions & 3 deletions fabtests/scripts/runfabtests.sh
Original file line number Diff line number Diff line change
Expand Up @@ -150,9 +150,9 @@ functional_tests=(
"fi_inject_test -N -A inject -v"
"fi_inject_test -A inj_complete -v"
"fi_inject_test -N -A inj_complete -v"
"fi_bw -e rdm -v -T 1"
"fi_bw -e rdm -v -T 1 -U"
"fi_bw -e msg -v -T 1"
"fi_flood -e rdm -v -T 1"
"fi_flood -e rdm -v -T 1 -U"
"fi_flood -e msg -v -T 1"
"fi_rdm_multi_client -C 10 -I 5"
"fi_rdm_multi_client -C 10 -I 5 -U"
)
Expand Down
9 changes: 5 additions & 4 deletions fabtests/test_configs/tcp/io_uring.exclude
Original file line number Diff line number Diff line change
Expand Up @@ -70,13 +70,14 @@ fi_msg_sockets
# fi_unexpected_msg -e rdm fails with no message
fi_unexpected_msg -e rdm

# fi_bw -e msg fails with
# fi_flood -e msg fails with
# fi_eq_sread(): common/shared.c:1165, ret=-4 (Interrupted system call)
fi_bw -e msg
fi_flood -e msg

# fi_bw fails by hanging
# fi_flood fails by hanging
# fi_flood fails by runfabtest timeout only on the CI.
# This is a suspected race condition
fi_bw
fi_flood

# fi_msg_pingpong fails with
# fi_eq_sread(): common/shared.c:1127, ret=-4 (Interrupted system call)
Expand Down

0 comments on commit ac31c17

Please sign in to comment.