| #!/usr/bin/env python3 |
| # SPDX-License-Identifier: GPL-2.0 |
| |
| """ |
| GRO (Generic Receive Offload) conformance tests. |
| |
| Validates that GRO coalescing works correctly by running the gro |
| binary in different configurations and checking for correct packet |
| coalescing behavior. |
| |
| Test cases: |
| - data_same: Same size data packets coalesce |
| - data_lrg_sml: Large packet followed by smaller one coalesces |
| - data_lrg_1byte: Large packet followed by 1B one coalesces (Ethernet padding) |
| - data_sml_lrg: Small packet followed by larger one doesn't coalesce |
| - ack: Pure ACK packets do not coalesce |
| - flags_psh: Packets with PSH flag don't coalesce |
| - flags_syn: Packets with SYN flag don't coalesce |
| - flags_rst: Packets with RST flag don't coalesce |
| - flags_urg: Packets with URG flag don't coalesce |
| - flags_cwr: Packets with CWR flag don't coalesce |
| - tcp_csum: Packets with incorrect checksum don't coalesce |
| - tcp_seq: Packets with non-consecutive seqno don't coalesce |
| - tcp_ts: Packets with different timestamp options don't coalesce |
| - tcp_opt: Packets with different TCP options don't coalesce |
| - ip_ecn: Packets with different ECN don't coalesce |
| - ip_tos: Packets with different TOS don't coalesce |
| - ip_ttl: (IPv4) Packets with different TTL don't coalesce |
| - ip_opt: (IPv4) Packets with IP options don't coalesce |
| - ip_frag4: (IPv4) IPv4 fragments don't coalesce |
| - ip_id_df*: (IPv4) IP ID field coalescing tests |
| - ip_frag6: (IPv6) IPv6 fragments don't coalesce |
| - ip_v6ext_same: (IPv6) IPv6 ext header with same payload coalesces |
| - ip_v6ext_diff: (IPv6) IPv6 ext header with different payload doesn't coalesce |
| - large_max: Packets exceeding GRO_MAX_SIZE don't coalesce |
| - large_rem: Large packet remainder handling |
| """ |
| |
| import glob |
| import os |
| import re |
| from lib.py import ksft_run, ksft_exit, ksft_pr |
| from lib.py import NetDrvEpEnv, KsftXfailEx |
| from lib.py import NetdevFamily, EthtoolFamily |
| from lib.py import bkg, cmd, defer, ethtool, ip |
| from lib.py import ksft_variants, KsftNamedVariant |
| |
| |
| # gro.c uses hardcoded DPORT=8000 |
| GRO_DPORT = 8000 |
| |
| |
| def _resolve_dmac(cfg, ipver): |
| """ |
| Find the destination MAC address remote host should use to send packets |
| towards the local host. It may be a router / gateway address. |
| """ |
| |
| attr = "dmac" + ipver |
| # Cache the response across test cases |
| if hasattr(cfg, attr): |
| return getattr(cfg, attr) |
| |
| route = ip(f"-{ipver} route get {cfg.addr_v[ipver]}", |
| json=True, host=cfg.remote)[0] |
| gw = route.get("gateway") |
| # Local L2 segment, address directly |
| if not gw: |
| setattr(cfg, attr, cfg.dev['address']) |
| return getattr(cfg, attr) |
| |
| # ping to make sure neighbor is resolved, |
| # bind to an interface, for v6 the GW is likely link local |
| cmd(f"ping -c1 -W0 -I{cfg.remote_ifname} {gw}", host=cfg.remote) |
| |
| neigh = ip(f"neigh get {gw} dev {cfg.remote_ifname}", |
| json=True, host=cfg.remote)[0] |
| setattr(cfg, attr, neigh['lladdr']) |
| return getattr(cfg, attr) |
| |
| |
| def _write_defer_restore(cfg, path, val, defer_undo=False): |
| with open(path, "r", encoding="utf-8") as fp: |
| orig_val = fp.read().strip() |
| if str(val) == orig_val: |
| return |
| with open(path, "w", encoding="utf-8") as fp: |
| fp.write(val) |
| if defer_undo: |
| defer(_write_defer_restore, cfg, path, orig_val) |
| |
| |
| def _set_mtu_restore(dev, mtu, host): |
| if dev['mtu'] < mtu: |
| ip(f"link set dev {dev['ifname']} mtu {mtu}", host=host) |
| defer(ip, f"link set dev {dev['ifname']} mtu {dev['mtu']}", host=host) |
| |
| |
| def _set_ethtool_feat(dev, current, feats, host=None): |
| s2n = {True: "on", False: "off"} |
| |
| new = ["-K", dev] |
| old = ["-K", dev] |
| no_change = True |
| for name, state in feats.items(): |
| new += [name, s2n[state]] |
| old += [name, s2n[current[name]["active"]]] |
| |
| if current[name]["active"] != state: |
| no_change = False |
| if current[name]["fixed"]: |
| raise KsftXfailEx(f"Device does not support {name}") |
| if no_change: |
| return |
| |
| eth_cmd = ethtool(" ".join(new), host=host) |
| defer(ethtool, " ".join(old), host=host) |
| |
| # If ethtool printed something kernel must have modified some features |
| if eth_cmd.stdout: |
| ksft_pr(eth_cmd) |
| |
| |
| def _get_queue_stats(cfg, queue_id): |
| """Get stats for a specific Rx queue.""" |
| cfg.wait_hw_stats_settle() |
| data = cfg.netnl.qstats_get({"ifindex": cfg.ifindex, "scope": ["queue"]}, |
| dump=True) |
| for q in data: |
| if q.get('queue-type') == 'rx' and q.get('queue-id') == queue_id: |
| return q |
| return {} |
| |
| |
| def _setup_isolated_queue(cfg): |
| """Set up an isolated queue for testing using ntuple filter. |
| |
| Remove queue 1 from the default RSS context and steer test traffic to it. |
| """ |
| test_queue = 1 |
| |
| qcnt = len(glob.glob(f"/sys/class/net/{cfg.ifname}/queues/rx-*")) |
| if qcnt < 2: |
| raise KsftXfailEx(f"Need at least 2 queues, have {qcnt}") |
| |
| # Remove queue 1 from default RSS context by setting its weight to 0 |
| weights = ["1"] * qcnt |
| weights[test_queue] = "0" |
| ethtool(f"-X {cfg.ifname} weight " + " ".join(weights)) |
| defer(ethtool, f"-X {cfg.ifname} default") |
| |
| # Set up ntuple filter to steer our test traffic to the isolated queue |
| flow = f"flow-type tcp{cfg.addr_ipver} " |
| flow += f"dst-ip {cfg.addr} dst-port {GRO_DPORT} action {test_queue}" |
| output = ethtool(f"-N {cfg.ifname} {flow}").stdout |
| ntuple_id = int(output.split()[-1]) |
| defer(ethtool, f"-N {cfg.ifname} delete {ntuple_id}") |
| |
| return test_queue |
| |
| |
| def _setup_queue_count(cfg, num_queues): |
| """Configure the NIC to use a specific number of queues.""" |
| channels = cfg.ethnl.channels_get({'header': {'dev-index': cfg.ifindex}}) |
| ch_max = channels.get('combined-max', 0) |
| qcnt = channels['combined-count'] |
| |
| if ch_max < num_queues: |
| raise KsftXfailEx(f"Need at least {num_queues} queues, max={ch_max}") |
| |
| defer(ethtool, f"-L {cfg.ifname} combined {qcnt}") |
| ethtool(f"-L {cfg.ifname} combined {num_queues}") |
| |
| |
| def _run_gro_bin(cfg, test_name, protocol=None, num_flows=None, |
| order_check=False, verbose=False, fail=False): |
| """Run gro binary with given test and return the process result.""" |
| if not hasattr(cfg, "bin_remote"): |
| cfg.bin_local = cfg.net_lib_dir / "gro" |
| cfg.bin_remote = cfg.remote.deploy(cfg.bin_local) |
| |
| if protocol is None: |
| ipver = cfg.addr_ipver |
| protocol = f"ipv{ipver}" |
| else: |
| ipver = "6" if protocol[-1] == "6" else "4" |
| |
| dmac = _resolve_dmac(cfg, ipver) |
| |
| base_args = [ |
| f"--{protocol}", |
| f"--dmac {dmac}", |
| f"--smac {cfg.remote_dev['address']}", |
| f"--daddr {cfg.addr_v[ipver]}", |
| f"--saddr {cfg.remote_addr_v[ipver]}", |
| f"--test {test_name}", |
| ] |
| if num_flows: |
| base_args.append(f"--num-flows {num_flows}") |
| if order_check: |
| base_args.append("--order-check") |
| if verbose: |
| base_args.append("--verbose") |
| |
| args = " ".join(base_args) |
| |
| rx_cmd = f"{cfg.bin_local} {args} --rx --iface {cfg.ifname}" |
| tx_cmd = f"{cfg.bin_remote} {args} --iface {cfg.remote_ifname}" |
| |
| with bkg(rx_cmd, ksft_ready=True, exit_wait=True, fail=fail) as rx_proc: |
| cmd(tx_cmd, host=cfg.remote) |
| |
| return rx_proc |
| |
| |
| def _setup(cfg, mode, test_name): |
| """ Setup hardware loopback mode for GRO testing. """ |
| |
| if not hasattr(cfg, "bin_remote"): |
| cfg.bin_local = cfg.net_lib_dir / "gro" |
| cfg.bin_remote = cfg.remote.deploy(cfg.bin_local) |
| |
| if not hasattr(cfg, "feat"): |
| cfg.feat = ethtool(f"-k {cfg.ifname}", json=True)[0] |
| cfg.remote_feat = ethtool(f"-k {cfg.remote_ifname}", |
| host=cfg.remote, json=True)[0] |
| |
| # "large_*" tests need at least 4k MTU |
| if test_name.startswith("large_"): |
| _set_mtu_restore(cfg.dev, 4096, None) |
| _set_mtu_restore(cfg.remote_dev, 4096, cfg.remote) |
| |
| if mode == "sw": |
| flush_path = f"/sys/class/net/{cfg.ifname}/gro_flush_timeout" |
| irq_path = f"/sys/class/net/{cfg.ifname}/napi_defer_hard_irqs" |
| |
| _write_defer_restore(cfg, flush_path, "200000", defer_undo=True) |
| _write_defer_restore(cfg, irq_path, "10", defer_undo=True) |
| |
| _set_ethtool_feat(cfg.ifname, cfg.feat, |
| {"generic-receive-offload": True, |
| "rx-gro-hw": False, |
| "large-receive-offload": False}) |
| elif mode == "hw": |
| _set_ethtool_feat(cfg.ifname, cfg.feat, |
| {"generic-receive-offload": False, |
| "rx-gro-hw": True, |
| "large-receive-offload": False}) |
| |
| # Some NICs treat HW GRO as a GRO sub-feature so disabling GRO |
| # will also clear HW GRO. Use a hack of installing XDP generic |
| # to skip SW GRO, even when enabled. |
| feat = ethtool(f"-k {cfg.ifname}", json=True)[0] |
| if not feat["rx-gro-hw"]["active"]: |
| ksft_pr("Driver clears HW GRO and SW GRO is cleared, using generic XDP workaround") |
| prog = cfg.net_lib_dir / "xdp_dummy.bpf.o" |
| ip(f"link set dev {cfg.ifname} xdpgeneric obj {prog} sec xdp") |
| defer(ip, f"link set dev {cfg.ifname} xdpgeneric off") |
| |
| # Attaching XDP may change features, fetch the latest state |
| feat = ethtool(f"-k {cfg.ifname}", json=True)[0] |
| |
| _set_ethtool_feat(cfg.ifname, feat, |
| {"generic-receive-offload": True, |
| "rx-gro-hw": True, |
| "large-receive-offload": False}) |
| elif mode == "lro": |
| # netdevsim advertises LRO for feature inheritance testing with |
| # bonding/team tests but it doesn't actually perform the offload |
| cfg.require_nsim(nsim_test=False) |
| |
| _set_ethtool_feat(cfg.ifname, cfg.feat, |
| {"generic-receive-offload": False, |
| "rx-gro-hw": False, |
| "large-receive-offload": True}) |
| |
| try: |
| # Disable TSO for local tests |
| cfg.require_nsim() # will raise KsftXfailEx if not running on nsim |
| |
| _set_ethtool_feat(cfg.remote_ifname, cfg.remote_feat, |
| {"tcp-segmentation-offload": False}, |
| host=cfg.remote) |
| except KsftXfailEx: |
| pass |
| |
| |
| def _gro_variants(): |
| """Generator that yields all combinations of protocol and test types.""" |
| |
| # Tests that work for all protocols |
| common_tests = [ |
| "data_same", "data_lrg_sml", "data_sml_lrg", "data_lrg_1byte", |
| "data_burst", |
| "ack", |
| "flags_psh", "flags_syn", "flags_rst", "flags_urg", "flags_cwr", |
| "tcp_csum", "tcp_seq", "tcp_ts", "tcp_opt", |
| "ip_ecn", "ip_tos", |
| "large_max", "large_rem", |
| ] |
| |
| # Tests specific to IPv4 |
| ipv4_tests = [ |
| "ip_csum", |
| "ip_ttl", "ip_opt", "ip_frag4", |
| "ip_id_df1_inc", "ip_id_df1_fixed", |
| "ip_id_df0_inc", "ip_id_df0_fixed", |
| "ip_id_df1_inc_fixed", "ip_id_df1_fixed_inc", |
| ] |
| |
| # Tests specific to IPv6 |
| ipv6_tests = [ |
| "ip_frag6", "ip_v6ext_same", "ip_v6ext_diff", |
| ] |
| |
| for mode in ["sw", "hw", "lro"]: |
| for protocol in ["ipv4", "ipv6", "ipip", "ip6ip6"]: |
| for test_name in common_tests: |
| yield mode, protocol, test_name |
| |
| if protocol in ["ipv4", "ipip"]: |
| for test_name in ipv4_tests: |
| yield mode, protocol, test_name |
| elif protocol == "ipv6": |
| for test_name in ipv6_tests: |
| yield mode, protocol, test_name |
| |
| |
| @ksft_variants(_gro_variants()) |
| def test(cfg, mode, protocol, test_name): |
| """Run a single GRO test with retries.""" |
| |
| ipver = "6" if protocol[-1] == "6" else "4" |
| cfg.require_ipver(ipver) |
| |
| _setup(cfg, mode, test_name) |
| |
| # Each test is run 6 times to deflake, because given the receive timing, |
| # not all packets that should coalesce will be considered in the same flow |
| # on every try. |
| max_retries = 6 |
| for attempt in range(max_retries): |
| fail_now = attempt >= max_retries - 1 |
| rx_proc = _run_gro_bin(cfg, test_name, protocol=protocol, |
| verbose=True, fail=fail_now) |
| |
| if rx_proc.ret == 0: |
| return |
| |
| ksft_pr(rx_proc) |
| |
| if test_name.startswith("large_") and os.environ.get("KSFT_MACHINE_SLOW"): |
| ksft_pr(f"Ignoring {protocol}/{test_name} failure due to slow environment") |
| return |
| |
| ksft_pr(f"Attempt {attempt + 1}/{max_retries} failed, retrying...") |
| |
| |
| def _capacity_variants(): |
| """Generate variants for capacity test: mode x queue setup.""" |
| setups = [ |
| ("isolated", _setup_isolated_queue), |
| ("1q", lambda cfg: _setup_queue_count(cfg, 1)), |
| ("8q", lambda cfg: _setup_queue_count(cfg, 8)), |
| ] |
| for mode in ["sw", "hw", "lro"]: |
| for name, func in setups: |
| yield KsftNamedVariant(f"{mode}_{name}", mode, func) |
| |
| |
| @ksft_variants(_capacity_variants()) |
| def test_gro_capacity(cfg, mode, setup_func): |
| """ |
| Probe GRO capacity. |
| |
| Start with 8 flows and increase by 2x on each successful run. |
| Retry up to 3 times on failure. |
| |
| Variants combine mode (sw, hw, lro) with queue setup: |
| - isolated: Use a single queue isolated from RSS |
| - 1q: Configure NIC to use 1 queue |
| - 8q: Configure NIC to use 8 queues |
| """ |
| max_retries = 3 |
| |
| _setup(cfg, mode, "capacity") |
| queue_id = setup_func(cfg) |
| |
| num_flows = 8 |
| while True: |
| success = False |
| for attempt in range(max_retries): |
| if queue_id is not None: |
| stats_before = _get_queue_stats(cfg, queue_id) |
| |
| rx_proc = _run_gro_bin(cfg, "capacity", num_flows=num_flows) |
| output = rx_proc.stdout |
| |
| if queue_id is not None: |
| stats_after = _get_queue_stats(cfg, queue_id) |
| qstat_pkts = (stats_after.get('rx-packets', 0) - |
| stats_before.get('rx-packets', 0)) |
| gro_pkts = (stats_after.get('rx-hw-gro-packets', 0) - |
| stats_before.get('rx-hw-gro-packets', 0)) |
| qstat_str = f" qstat={qstat_pkts} hw-gro={gro_pkts}" |
| else: |
| qstat_str = "" |
| |
| # Parse and print STATS line |
| match = re.search( |
| r'STATS: received=(\d+) wire=(\d+) coalesced=(\d+)', output) |
| if match: |
| received = int(match.group(1)) |
| wire = int(match.group(2)) |
| coalesced = int(match.group(3)) |
| status = "PASS" if received == num_flows else "MISS" |
| ksft_pr(f"flows={num_flows} attempt={attempt + 1} " |
| f"received={received} wire={wire} " |
| f"coalesced={coalesced}{qstat_str} [{status}]") |
| if received == num_flows: |
| success = True |
| break |
| else: |
| ksft_pr(rx_proc) |
| ksft_pr(f"flows={num_flows} attempt={attempt + 1}" |
| f"{qstat_str} [FAIL - can't parse stats]") |
| |
| if not success: |
| ksft_pr(f"Stopped at {num_flows} flows") |
| break |
| |
| num_flows *= 2 |
| |
| |
| def main() -> None: |
| """ Ksft boiler plate main """ |
| |
| with NetDrvEpEnv(__file__) as cfg: |
| cfg.ethnl = EthtoolFamily() |
| cfg.netnl = NetdevFamily() |
| ksft_run(cases=[test, test_gro_capacity], args=(cfg,)) |
| ksft_exit() |
| |
| |
| if __name__ == "__main__": |
| main() |