Skip site navigation (1) | Skip section navigation (2)
Date:      Thu, 15 Aug 2024 21:28:08 -0600
From:      Warner Losh <imp@bsdimp.com>
To:        Zhenlei Huang <zlei@freebsd.org>
Cc:        Warner Losh <imp@freebsd.org>, src-committers <src-committers@freebsd.org>,  "<dev-commits-src-all@freebsd.org>" <dev-commits-src-all@freebsd.org>,  "<dev-commits-src-main@freebsd.org>" <dev-commits-src-main@freebsd.org>
Subject:   Re: git: d5507f9e4366 - main - nvme: Separate total failures from I/O failures
Message-ID:  <CANCZdfpk7dSiuYaU42cFXrhqMsonbPrQrjzTDeWL=vvCnoHMxA@mail.gmail.com>
In-Reply-To: <0936F9D3-86A7-46AF-83E3-3EE63C41DA67@FreeBSD.org>
References:  <202408160230.47G2UO9J045807@gitrepo.freebsd.org> <0936F9D3-86A7-46AF-83E3-3EE63C41DA67@FreeBSD.org>

next in thread | previous in thread | raw e-mail | index | archive | help

[-- Attachment #1 --]
On Thu, Aug 15, 2024, 9:12 PM Zhenlei Huang <zlei@freebsd.org> wrote:

> Hi Warner,
>
> I'm not sure, but this change seems to include lots of unintended changes
> (maybe some local WIP).
>

Git am somehow screwed me.  I'll fix.

Warner

> On Aug 16, 2024, at 10:30 AM, Warner Losh <imp@FreeBSD.org> wrote:
> >
> > The branch main has been updated by imp:
> >
> > URL:
> https://cgit.FreeBSD.org/src/commit/?id=d5507f9e436698ac17dc5ace7ef58493988a9b04
> >
> > commit d5507f9e436698ac17dc5ace7ef58493988a9b04
> > Author:     Warner Losh <imp@FreeBSD.org>
> > AuthorDate: 2024-08-14 22:55:49 +0000
> > Commit:     Warner Losh <imp@FreeBSD.org>
> > CommitDate: 2024-08-16 02:22:18 +0000
> >
> >    nvme: Separate total failures from I/O failures
> >
> > >    When it's an I/O failure, we can still send admin commands. Separate
> out
> >    the admin failures and flag them as such so that we can still send
> admin
> >    commands on half-failed drives.
> >
> >    Fixes: 9229b3105d88 (nvme: Fail passthrough commands right away in
> failed state)
> >    Sponsored by: Netflix
> > ---
> > sys/amd64/conf/IOSCHED                             |    2 +
> > sys/amd64/conf/MPI3MR                              |   10 +
> > sys/arm64/conf/GENERIC16K                          |    4 +
> > .../linuxkpi/common/include/linux/#compiler.h#     |  117 +
> > sys/contrib/dev/iwlwifi/fw/api/soc.h               |   35 +
> > sys/contrib/zlib/contrib/asm686/README.686         |   51 +
> > sys/contrib/zlib/contrib/asm686/match.S            |  357 +
> > sys/dev/ice/ice_sriov.c                            |  595 ++
> > sys/dev/ice/ice_sriov.h                            |   64 +
> > sys/dev/mps/mpi/mpi2_pci.h                         |  141 +
> > sys/dev/nvme/nvme_ctrlr.c                          |   46 +-
> > sys/dev/nvme/nvme_private.h                        |    1 +
> > sys/dev/nvme/nvme_qpair.c                          |   23 +-
> > sys/dev/nvme/nvme_sim.c                            |   13 +-
> > sys/dev/sound/pci/aureal.c                         |  686 ++
> > sys/dev/sound/pci/aureal.h                         |   99 +
> > sys/dev/sound/pci/ds1-fw.h                         | 1602 ++++
> > sys/dev/sound/pci/ds1.c                            | 1103 +++
> > sys/dev/sound/pci/ds1.h                            |  146 +
> > sys/dev/sound/pci/maestro.c                        | 2043 +++++
> > sys/dev/sound/pci/maestro_reg.h                    |  381 +
> > sys/kern/bsduser-syscalls.c                        | 8712
> ++++++++++++++++++++
> > sys/modules/sound/driver/ds1/Makefile              |    8 +
> > sys/modules/sound/driver/maestro/Makefile          |    8 +
> > 24 files changed, 16219 insertions(+), 28 deletions(-)
> >
> > diff --git a/sys/amd64/conf/IOSCHED b/sys/amd64/conf/IOSCHED
> > new file mode 100644
> > index 000000000000..e15106bc4c1f
> > --- /dev/null
> > +++ b/sys/amd64/conf/IOSCHED
> > @@ -0,0 +1,2 @@
> > +include "GENERIC"
> > +options CAM_IOSCHED_DYNAMIC
> > diff --git a/sys/amd64/conf/MPI3MR b/sys/amd64/conf/MPI3MR
> > new file mode 100644
> > index 000000000000..99e5244cb49d
> > --- /dev/null
> > +++ b/sys/amd64/conf/MPI3MR
> > @@ -0,0 +1,10 @@
> > +include GENERIC
> > +
> > +device mpi3mr
> > +# All the debugging options
> > +options DEADLKRES # Enable the deadlock resolver
> > +options INVARIANTS # Enable calls of extra sanity checking
> > +options INVARIANT_SUPPORT # Extra sanity checks of internal structures,
> required by INVARIANTS
> > +options QUEUE_MACRO_DEBUG_TRASH # Trash queue(2) internal pointers on
> invalidation
> > +options WITNESS # Enable checks to detect deadlocks and cycles
> > +options WITNESS_SKIPSPIN # Don't run witness on spinlocks for speed
> > diff --git a/sys/arm64/conf/GENERIC16K b/sys/arm64/conf/GENERIC16K
> > new file mode 100644
> > index 000000000000..9bf9e2dadb08
> > --- /dev/null
> > +++ b/sys/arm64/conf/GENERIC16K
> > @@ -0,0 +1,4 @@
> > +include              "GENERIC"
> > +
> > +ident                GENERIC_16K
> > +
> > diff --git a/sys/compat/linuxkpi/common/include/linux/#compiler.h#
> b/sys/compat/linuxkpi/common/include/linux/#compiler.h#
> > new file mode 100644
> > index 000000000000..1177674aa68f
> > --- /dev/null
> > +++ b/sys/compat/linuxkpi/common/include/linux/#compiler.h#
> > @@ -0,0 +1,117 @@
> > +/*-
> > + * Copyright (c) 2010 Isilon Systems, Inc.
> > + * Copyright (c) 2010 iX Systems, Inc.
> > + * Copyright (c) 2010 Panasas, Inc.
> > + * Copyright (c) 2013-2016 Mellanox Technologies, Ltd.
> > + * Copyright (c) 2015 François Tigeot
> > + * All rights reserved.
> > + *
> > + * Redistribution and use in source and binary forms, with or without
> > + * modification, are permitted provided that the following conditions
> > + * are met:
> > + * 1. Redistributions of source code must retain the above copyright
> > + *    notice unmodified, this list of conditions, and the following
> > + *    disclaimer.
> > + * 2. Redistributions in binary form must reproduce the above copyright
> > + *    notice, this list of conditions and the following disclaimer in
> the
> > + *    documentation and/or other materials provided with the
> distribution.
> > + *
> > + * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
> > + * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
> WARRANTIES
> > + * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
> DISCLAIMED.
> > + * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
> > + * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
> BUT
> > + * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
> USE,
> > + * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
> > + * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
> > + * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE
> USE OF
> > + * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
> > + *
> > + * $FreeBSD$
> > + */
> > +#ifndef      _LINUX_COMPILER_H_
> > +#define      _LINUX_COMPILER_H_
> > +
> > +#include <sys/cdefs.h>
> > +
> > +#define __user
> > +#define __kernel
> > +#define __safe
> > +#define __force
> > +#define __nocast
> > +#define __iomem
> > +#define __chk_user_ptr(x)            ((void)0)
> > +#define __chk_io_ptr(x)                      ((void)0)
> > +#define __builtin_warning(x, y...)   (1)
> > +#define __acquires(x)
> > +#define __releases(x)
> > +#define __acquire(x)                 do { } while (0)
> > +#define __release(x)                 do { } while (0)
> > +#define __cond_lock(x,c)             (c)
> > +#define      __bitwise
> > +#define __devinitdata
> > +#define      __deprecated
> > +#define __init
> > +#define      __initconst
> > +#define      __devinit
> > +#define      __devexit
> > +#define __exit
> > +#define      __rcu
> > +#define      __percpu
> > +#define      __weak __weak_symbol
> > +#define      __malloc
> > +#define      ___stringify(...)               #__VA_ARGS__
> > +#define      __stringify(...)                ___stringify(__VA_ARGS__)
> > +#define      __attribute_const__             __attribute__((__const__))
> > +#undef __always_inline
> > +#define      __always_inline                 inline
> > +#define      noinline                        __noinline
> > +#define      ____cacheline_aligned           __aligned(CACHE_LINE_SIZE)
> > +
> > +#define      likely(x)                       __builtin_expect(!!(x), 1)
> > +#define      unlikely(x)                     __builtin_expect(!!(x), 0)
> > +#define typeof(x)                    __typeof(x)
> > +
> > +#define      uninitialized_var(x)            x = x
> > +#define      __maybe_unused                  __unused
> > +#define      __always_unused                 __unused
> > +#define      __must_check                    __result_use_check
> > +
> > +#define      __printf(a,b)                   __printflike(a,b)
> > +
> > +#define      barrier()                       __asm__ __volatile__("": :
> :"memory")
> > +
> > +#if defined(LINUXKPI_VERSION) && LINUXKPI_VERSION >= 50000
> > +/* Moved from drm_os_freebsd.h */
> > +#define      lower_32_bits(n)                ((u32)(n))
> > +#define      upper_32_bits(n)                ((u32)(((n) >> 16) >> 16))
> > +#endif
> > +
> > +#define      ___PASTE(a,b) a##b
> > +#define      __PASTE(a,b) ___PASTE(a,b)
> > +
> > +#define      ACCESS_ONCE(x)                  (*(volatile __typeof(x)
> *)&(x))
> > +
> > +#define      WRITE_ONCE(x,v) do {            \
> > +     barrier();                      \
> > +     ACCESS_ONCE(x) = (v);           \
> > +     barrier();                      \
> > +} while (0)
> > +
> > +#define      READ_ONCE(x) ({                 \
> > +     __typeof(x) __var = ({          \
> > +             barrier();              \
> > +             ACCESS_ONCE(x);         \
> > +     });                             \
> > +     barrier();                      \
> > +     __var;                          \
> > +})
> > +
> > +#define      lockless_dereference(p) READ_ONCE(p)
> > +
> > +#define      _AT(T,X)        ((T)(X))
> > +
> > +#define      __same_type(a, b)
>  __builtin_types_compatible_p(typeof(a), typeof(b))
> > +#define      __must_be_array(a)      __same_type(a, &(a)[0])
> > +
> > +#endif       /* _LINUX_COMPILER_H_ */
> > diff --git a/sys/contrib/dev/iwlwifi/fw/api/soc.h
> b/sys/contrib/dev/iwlwifi/fw/api/soc.h
> > new file mode 100644
> > index 000000000000..c5df1171462b
> > --- /dev/null
> > +++ b/sys/contrib/dev/iwlwifi/fw/api/soc.h
> > @@ -0,0 +1,35 @@
> > +/* SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause */
> > +/*
> > + * Copyright (C) 2012-2014, 2019-2020 Intel Corporation
> > + * Copyright (C) 2013-2015 Intel Mobile Communications GmbH
> > + * Copyright (C) 2016-2017 Intel Deutschland GmbH
> > + */
> > +#ifndef __iwl_fw_api_soc_h__
> > +#define __iwl_fw_api_soc_h__
> > +
> > +#define SOC_CONFIG_CMD_FLAGS_DISCRETE                BIT(0)
> > +#define SOC_CONFIG_CMD_FLAGS_LOW_LATENCY     BIT(1)
> > +
> > +#define SOC_FLAGS_LTR_APPLY_DELAY_MASK               0xc
> > +#define SOC_FLAGS_LTR_APPLY_DELAY_NONE               0
> > +#define SOC_FLAGS_LTR_APPLY_DELAY_200                1
> > +#define SOC_FLAGS_LTR_APPLY_DELAY_2500               2
> > +#define SOC_FLAGS_LTR_APPLY_DELAY_1820               3
> > +
> > +/**
> > + * struct iwl_soc_configuration_cmd - Set device stabilization latency
> > + *
> > + * @flags: soc settings flags.  In VER_1, we can only set the DISCRETE
> > + *   flag, because the FW treats the whole value as an integer. In
> > + *   VER_2, we can set the bits independently.
> > + * @latency: time for SOC to ensure stable power & XTAL
> > + */
> > +struct iwl_soc_configuration_cmd {
> > +     __le32 flags;
> > +     __le32 latency;
> > +} __packed; /*
> > +          * SOC_CONFIGURATION_CMD_S_VER_1 (see description above)
> > +          * SOC_CONFIGURATION_CMD_S_VER_2
> > +          */
> > +
> > +#endif /* __iwl_fw_api_soc_h__ */
> > diff --git a/sys/contrib/zlib/contrib/asm686/README.686
> b/sys/contrib/zlib/contrib/asm686/README.686
> > new file mode 100644
> > index 000000000000..a0bf3bea4aff
> > --- /dev/null
> > +++ b/sys/contrib/zlib/contrib/asm686/README.686
> > @@ -0,0 +1,51 @@
> > +This is a patched version of zlib, modified to use
> > +Pentium-Pro-optimized assembly code in the deflation algorithm. The
> > +files changed/added by this patch are:
> > +
> > +README.686
> > +match.S
> > +
> > +The speedup that this patch provides varies, depending on whether the
> > +compiler used to build the original version of zlib falls afoul of the
> > +PPro's speed traps. My own tests show a speedup of around 10-20% at
> > +the default compression level, and 20-30% using -9, against a version
> > +compiled using gcc 2.7.2.3. Your mileage may vary.
> > +
> > +Note that this code has been tailored for the PPro/PII in particular,
> > +and will not perform particularly well on a Pentium.
> > +
> > +If you are using an assembler other than GNU as, you will have to
> > +translate match.S to use your assembler's syntax. (Have fun.)
> > +
> > +Brian Raiter
> > +breadbox@muppetlabs.com
> > +April, 1998
> > +
> > +
> > +Added for zlib 1.1.3:
> > +
> > +The patches come from
> > +http://www.muppetlabs.com/~breadbox/software/assembly.html
> > +
> > +To compile zlib with this asm file, copy match.S to the zlib directory
> > +then do:
> > +
> > +CFLAGS="-O3 -DASMV" ./configure
> > +make OBJA=match.o
> > +
> > +
> > +Update:
> > +
> > +I've been ignoring these assembly routines for years, believing that
> > +gcc's generated code had caught up with it sometime around gcc 2.95
> > +and the major rearchitecting of the Pentium 4. However, I recently
> > +learned that, despite what I believed, this code still has some life
> > +in it. On the Pentium 4 and AMD64 chips, it continues to run about 8%
> > +faster than the code produced by gcc 4.1.
> > +
> > +In acknowledgement of its continuing usefulness, I've altered the
> > +license to match that of the rest of zlib. Share and Enjoy!
> > +
> > +Brian Raiter
> > +breadbox@muppetlabs.com
> > +April, 2007
> > diff --git a/sys/contrib/zlib/contrib/asm686/match.S
> b/sys/contrib/zlib/contrib/asm686/match.S
> > new file mode 100644
> > index 000000000000..fa421092785d
> > --- /dev/null
> > +++ b/sys/contrib/zlib/contrib/asm686/match.S
> > @@ -0,0 +1,357 @@
> > +/* match.S -- x86 assembly version of the zlib longest_match() function.
> > + * Optimized for the Intel 686 chips (PPro and later).
> > + *
> > + * Copyright (C) 1998, 2007 Brian Raiter <breadbox@muppetlabs.com>
> > + *
> > + * This software is provided 'as-is', without any express or implied
> > + * warranty.  In no event will the author be held liable for any damages
> > + * arising from the use of this software.
> > + *
> > + * Permission is granted to anyone to use this software for any purpose,
> > + * including commercial applications, and to alter it and redistribute
> it
> > + * freely, subject to the following restrictions:
> > + *
> > + * 1. The origin of this software must not be misrepresented; you must
> not
> > + *    claim that you wrote the original software. If you use this
> software
> > + *    in a product, an acknowledgment in the product documentation
> would be
> > + *    appreciated but is not required.
> > + * 2. Altered source versions must be plainly marked as such, and must
> not be
> > + *    misrepresented as being the original software.
> > + * 3. This notice may not be removed or altered from any source
> distribution.
> > + */
> > +
> > +#ifndef NO_UNDERLINE
> > +#define      match_init      _match_init
> > +#define      longest_match   _longest_match
> > +#endif
> > +
> > +#define      MAX_MATCH       (258)
> > +#define      MIN_MATCH       (3)
> > +#define      MIN_LOOKAHEAD   (MAX_MATCH + MIN_MATCH + 1)
> > +#define      MAX_MATCH_8     ((MAX_MATCH + 7) & ~7)
> > +
> > +/* stack frame offsets */
> > +
> > +#define      chainlenwmask           0       /* high word: current
> chain len */
> > +                                     /* low word: s->wmask           */
> > +#define      window                  4       /* local copy of
> s->window      */
> > +#define      windowbestlen           8       /* s->window + bestlen
>       */
> > +#define      scanstart               16      /* first two bytes of
> string    */
> > +#define      scanend                 12      /* last two bytes of
> string     */
> > +#define      scanalign               20      /* dword-misalignment of
> string */
> > +#define      nicematch               24      /* a good enough match
> size     */
> > +#define      bestlen                 28      /* size of best match so
> far    */
> > +#define      scan                    32      /* ptr to string wanting
> match  */
> > +
> > +#define      LocalVarsSize           (36)
> > +/*   saved ebx               36 */
> > +/*   saved edi               40 */
> > +/*   saved esi               44 */
> > +/*   saved ebp               48 */
> > +/*   return address          52 */
> > +#define      deflatestate            56      /* the function arguments
>      */
> > +#define      curmatch                60
> > +
> > +/* All the +zlib1222add offsets are due to the addition of fields
> > + *  in zlib in the deflate_state structure since the asm code was first
> written
> > + * (if you compile with zlib 1.0.4 or older, use "zlib1222add equ
> (-4)").
> > + * (if you compile with zlib between 1.0.5 and 1.2.2.1, use
> "zlib1222add equ 0").
> > + * if you compile with zlib 1.2.2.2 or later , use "zlib1222add equ 8").
> > + */
> > +
> > +#define zlib1222add          (8)
> > +
> > +#define      dsWSize                 (36+zlib1222add)
> > +#define      dsWMask                 (44+zlib1222add)
> > +#define      dsWindow                (48+zlib1222add)
> > +#define      dsPrev                  (56+zlib1222add)
> > +#define      dsMatchLen              (88+zlib1222add)
> > +#define      dsPrevMatch             (92+zlib1222add)
> > +#define      dsStrStart              (100+zlib1222add)
> > +#define      dsMatchStart            (104+zlib1222add)
> > +#define      dsLookahead             (108+zlib1222add)
> > +#define      dsPrevLen               (112+zlib1222add)
> > +#define      dsMaxChainLen           (116+zlib1222add)
> > +#define      dsGoodMatch             (132+zlib1222add)
> > +#define      dsNiceMatch             (136+zlib1222add)
> > +
> > +
> > +.file "match.S"
> > +
> > +.globl       match_init, longest_match
> > +
> > +.text
> > +
> > +/* uInt longest_match(deflate_state *deflatestate, IPos curmatch) */
> > +.cfi_sections        .debug_frame
> > +
> > +longest_match:
> > +
> > +.cfi_startproc
> > +/* Save registers that the compiler may be using, and adjust %esp to */
> > +/* make room for our stack frame.                                    */
> > +
> > +             pushl   %ebp
> > +             .cfi_def_cfa_offset 8
> > +             .cfi_offset ebp, -8
> > +             pushl   %edi
> > +             .cfi_def_cfa_offset 12
> > +             pushl   %esi
> > +             .cfi_def_cfa_offset 16
> > +             pushl   %ebx
> > +             .cfi_def_cfa_offset 20
> > +             subl    $LocalVarsSize, %esp
> > +             .cfi_def_cfa_offset LocalVarsSize+20
> > +
> > +/* Retrieve the function arguments. %ecx will hold cur_match         */
> > +/* throughout the entire function. %edx will hold the pointer to the */
> > +/* deflate_state structure during the function's setup (before
>      */
> > +/* entering the main loop).                                          */
> > +
> > +             movl    deflatestate(%esp), %edx
> > +             movl    curmatch(%esp), %ecx
> > +
> > +/* uInt wmask = s->w_mask;                                           */
> > +/* unsigned chain_length = s->max_chain_length;
>       */
> > +/* if (s->prev_length >= s->good_match) {                            */
> > +/*     chain_length >>= 2;                                           */
> > +/* }                                                                 */
> > +
> > +             movl    dsPrevLen(%edx), %eax
> > +             movl    dsGoodMatch(%edx), %ebx
> > +             cmpl    %ebx, %eax
> > +             movl    dsWMask(%edx), %eax
> > +             movl    dsMaxChainLen(%edx), %ebx
> > +             jl      LastMatchGood
> > +             shrl    $2, %ebx
> > +LastMatchGood:
> > +
> > +/* chainlen is decremented once beforehand so that the function can  */
> > +/* use the sign flag instead of the zero flag for the exit test.     */
> > +/* It is then shifted into the high word, to make room for the wmask */
> > +/* value, which it will always accompany.                            */
> > +
> > +             decl    %ebx
> > +             shll    $16, %ebx
> > +             orl     %eax, %ebx
> > +             movl    %ebx, chainlenwmask(%esp)
> > +
> > +/* if ((uInt)nice_match > s->lookahead) nice_match = s->lookahead;   */
> > +
> > +             movl    dsNiceMatch(%edx), %eax
> > +             movl    dsLookahead(%edx), %ebx
> > +             cmpl    %eax, %ebx
> > +             jl      LookaheadLess
> > +             movl    %eax, %ebx
> > +LookaheadLess:       movl    %ebx, nicematch(%esp)
> > +
> > +/* register Bytef *scan = s->window + s->strstart;                   */
> > +
> > +             movl    dsWindow(%edx), %esi
> > +             movl    %esi, window(%esp)
> > +             movl    dsStrStart(%edx), %ebp
> > +             lea     (%esi,%ebp), %edi
> > +             movl    %edi, scan(%esp)
> > +
> > +/* Determine how many bytes the scan ptr is off from being           */
> > +/* dword-aligned.                                                    */
> > +
> > +             movl    %edi, %eax
> > +             negl    %eax
> > +             andl    $3, %eax
> > +             movl    %eax, scanalign(%esp)
> > +
> > +/* IPos limit = s->strstart > (IPos)MAX_DIST(s) ?                    */
> > +/*     s->strstart - (IPos)MAX_DIST(s) : NIL;
>       */
> > +
> > +             movl    dsWSize(%edx), %eax
> > +             subl    $MIN_LOOKAHEAD, %eax
> > +             subl    %eax, %ebp
> > +             jg      LimitPositive
> > +             xorl    %ebp, %ebp
> > +LimitPositive:
> > +
> > +/* int best_len = s->prev_length;                                    */
> > +
> > +             movl    dsPrevLen(%edx), %eax
> > +             movl    %eax, bestlen(%esp)
> > +
> > +/* Store the sum of s->window + best_len in %esi and in windowbestlen. */
> > +
> > +             addl    %eax, %esi
> > +             movl    %esi, windowbestlen(%esp)
> > +
> > +/* register ush scan_start = *(ushf*)scan;                           */
> > +/* register ush scan_end   = *(ushf*)(scan+best_len-1);
>       */
> > +/* Posf *prev = s->prev;                                             */
> > +
> > +             movzwl  (%edi), %ebx
> > +             movl    %ebx, scanstart(%esp)
> > +             movzwl  -1(%edi,%eax), %ebx
> > +             movl    %ebx, scanend(%esp)
> > +             movl    dsPrev(%edx), %edi
> > +
> > +/* Jump into the main loop.                                          */
> > +
> > +             movl    chainlenwmask(%esp), %edx
> > +             jmp     LoopEntry
> > +
> > +.balign 16
> > +
> > +/* do {
> > + *     match = s->window + cur_match;
> > + *     if (*(ushf*)(match+best_len-1) != scan_end ||
> > + *         *(ushf*)match != scan_start) continue;
> > + *     [...]
> > + * } while ((cur_match = prev[cur_match & wmask]) > limit
> > + *          && --chain_length != 0);
> > + *
> > + * Here is the inner loop of the function. The function will spend the
> > + * majority of its time in this loop, and majority of that time will
> > + * be spent in the first ten instructions.
> > + *
> > + * Within this loop:
> > + * %ebx = scanend
> > + * %ecx = curmatch
> > + * %edx = chainlenwmask - i.e., ((chainlen << 16) | wmask)
> > + * %esi = windowbestlen - i.e., (window + bestlen)
> > + * %edi = prev
> > + * %ebp = limit
> > + */
> > +LookupLoop:
> > +             andl    %edx, %ecx
> > +             movzwl  (%edi,%ecx,2), %ecx
> > +             cmpl    %ebp, %ecx
> > +             jbe     LeaveNow
> > +             subl    $0x00010000, %edx
> > +             js      LeaveNow
> > +LoopEntry:   movzwl  -1(%esi,%ecx), %eax
> > +             cmpl    %ebx, %eax
> > +             jnz     LookupLoop
> > +             movl    window(%esp), %eax
> > +             movzwl  (%eax,%ecx), %eax
> > +             cmpl    scanstart(%esp), %eax
> > +             jnz     LookupLoop
> > +
> > +/* Store the current value of chainlen.
>       */
> > +
> > +             movl    %edx, chainlenwmask(%esp)
> > +
> > +/* Point %edi to the string under scrutiny, and %esi to the string we
>       */
> > +/* are hoping to match it up with. In actuality, %esi and %edi are   */
> > +/* both pointed (MAX_MATCH_8 - scanalign) bytes ahead, and %edx is   */
> > +/* initialized to -(MAX_MATCH_8 - scanalign).
>       */
> > +
> > +             movl    window(%esp), %esi
> > +             movl    scan(%esp), %edi
> > +             addl    %ecx, %esi
> > +             movl    scanalign(%esp), %eax
> > +             movl    $(-MAX_MATCH_8), %edx
> > +             lea     MAX_MATCH_8(%edi,%eax), %edi
> > +             lea     MAX_MATCH_8(%esi,%eax), %esi
> > +
> > +/* Test the strings for equality, 8 bytes at a time. At the end,
> > + * adjust %edx so that it is offset to the exact byte that mismatched.
> > + *
> > + * We already know at this point that the first three bytes of the
> > + * strings match each other, and they can be safely passed over before
> > + * starting the compare loop. So what this code does is skip over 0-3
> > + * bytes, as much as necessary in order to dword-align the %edi
> > + * pointer. (%esi will still be misaligned three times out of four.)
> > + *
> > + * It should be confessed that this loop usually does not represent
> > + * much of the total running time. Replacing it with a more
> > + * straightforward "rep cmpsb" would not drastically degrade
> > + * performance.
> > + */
> > +LoopCmps:
> > +             movl    (%esi,%edx), %eax
> > +             xorl    (%edi,%edx), %eax
> > +             jnz     LeaveLoopCmps
> > +             movl    4(%esi,%edx), %eax
> > +             xorl    4(%edi,%edx), %eax
> > +             jnz     LeaveLoopCmps4
> > +             addl    $8, %edx
> > +             jnz     LoopCmps
> > +             jmp     LenMaximum
> > +LeaveLoopCmps4:      addl    $4, %edx
> > +LeaveLoopCmps:       testl   $0x0000FFFF, %eax
> > +             jnz     LenLower
> > +             addl    $2, %edx
> > +             shrl    $16, %eax
> > +LenLower:    subb    $1, %al
> > +             adcl    $0, %edx
> > +
> > +/* Calculate the length of the match. If it is longer than MAX_MATCH,
>       */
> > +/* then automatically accept it as the best possible match and leave.
>       */
> > +
> > +             lea     (%edi,%edx), %eax
> > +             movl    scan(%esp), %edi
> > +             subl    %edi, %eax
> > +             cmpl    $MAX_MATCH, %eax
> > +             jge     LenMaximum
> > +
> > +/* If the length of the match is not longer than the best match we   */
> > +/* have so far, then forget it and return to the lookup loop.
>       */
> > +
> > +             movl    deflatestate(%esp), %edx
> > +             movl    bestlen(%esp), %ebx
> > +             cmpl    %ebx, %eax
> > +             jg      LongerMatch
> > +             movl    windowbestlen(%esp), %esi
> > +             movl    dsPrev(%edx), %edi
> > +             movl    scanend(%esp), %ebx
> > +             movl    chainlenwmask(%esp), %edx
> > +             jmp     LookupLoop
> > +
> > +/*         s->match_start = cur_match;
>      */
> > +/*         best_len = len;                                           */
> > +/*         if (len >= nice_match) break;                             */
> > +/*         scan_end = *(ushf*)(scan+best_len-1);                     */
> > +
> > +LongerMatch: movl    nicematch(%esp), %ebx
> > +             movl    %eax, bestlen(%esp)
> > +             movl    %ecx, dsMatchStart(%edx)
> > +             cmpl    %ebx, %eax
> > +             jge     LeaveNow
> > +             movl    window(%esp), %esi
> > +             addl    %eax, %esi
> > +             movl    %esi, windowbestlen(%esp)
> > +             movzwl  -1(%edi,%eax), %ebx
> > +             movl    dsPrev(%edx), %edi
> > +             movl    %ebx, scanend(%esp)
> > +             movl    chainlenwmask(%esp), %edx
> > +             jmp     LookupLoop
> > +
> > +/* Accept the current string, with the maximum possible length.
>       */
> > +
> > +LenMaximum:  movl    deflatestate(%esp), %edx
> > +             movl    $MAX_MATCH, bestlen(%esp)
> > +             movl    %ecx, dsMatchStart(%edx)
> > +
> > +/* if ((uInt)best_len <= s->lookahead) return (uInt)best_len;
>       */
> > +/* return s->lookahead;
>       */
> > +
> > +LeaveNow:
> > +             movl    deflatestate(%esp), %edx
> > +             movl    bestlen(%esp), %ebx
> > +             movl    dsLookahead(%edx), %eax
> > +             cmpl    %eax, %ebx
> > +             jg      LookaheadRet
> > +             movl    %ebx, %eax
> > +LookaheadRet:
> > +
> > +/* Restore the stack and return from whence we came.                 */
> > +
> > +             addl    $LocalVarsSize, %esp
> > +             .cfi_def_cfa_offset 20
> > +             popl    %ebx
> > +             .cfi_def_cfa_offset 16
> > +             popl    %esi
> > +             .cfi_def_cfa_offset 12
> > +             popl    %edi
> > +             .cfi_def_cfa_offset 8
> > +             popl    %ebp
> > +             .cfi_def_cfa_offset 4
> > +.cfi_endproc
> > +match_init:  ret
> > diff --git a/sys/dev/ice/ice_sriov.c b/sys/dev/ice/ice_sriov.c
> > new file mode 100644
> > index 000000000000..c0521e667fa2
> > --- /dev/null
> > +++ b/sys/dev/ice/ice_sriov.c
> > @@ -0,0 +1,595 @@
> > +/* SPDX-License-Identifier: BSD-3-Clause */
> > +/*  Copyright (c) 2021, Intel Corporation
> > + *  All rights reserved.
> > + *
> > + *  Redistribution and use in source and binary forms, with or without
> > + *  modification, are permitted provided that the following conditions
> are met:
> > + *
> > + *   1. Redistributions of source code must retain the above copyright
> notice,
> > + *      this list of conditions and the following disclaimer.
> > + *
> > + *   2. Redistributions in binary form must reproduce the above
> copyright
> > + *      notice, this list of conditions and the following disclaimer in
> the
> > + *      documentation and/or other materials provided with the
> distribution.
> > + *
> > + *   3. Neither the name of the Intel Corporation nor the names of its
> > + *      contributors may be used to endorse or promote products derived
> from
> > + *      this software without specific prior written permission.
> > + *
> > + *  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
> "AS IS"
> > + *  AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
> TO, THE
> > + *  IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
> PURPOSE
> > + *  ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
> CONTRIBUTORS BE
> > + *  LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
> > + *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
> > + *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
> BUSINESS
> > + *  INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
> WHETHER IN
> > + *  CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
> OTHERWISE)
> > + *  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
> OF THE
> > + *  POSSIBILITY OF SUCH DAMAGE.
> > + */
> > +
> > +#include "ice_common.h"
> > +#include "ice_sriov.h"
> > +
> > +/**
> > + * ice_aq_send_msg_to_vf
> > + * @hw: pointer to the hardware structure
> > + * @vfid: VF ID to send msg
> > + * @v_opcode: opcodes for VF-PF communication
> > + * @v_retval: return error code
> > + * @msg: pointer to the msg buffer
> > + * @msglen: msg length
> > + * @cd: pointer to command details
> > + *
> > + * Send message to VF driver (0x0802) using mailbox
> > + * queue and asynchronously sending message via
> > + * ice_sq_send_cmd() function
> > + */
> > +enum ice_status
> > +ice_aq_send_msg_to_vf(struct ice_hw *hw, u16 vfid, u32 v_opcode, u32
> v_retval,
> > +                   u8 *msg, u16 msglen, struct ice_sq_cd *cd)
> > +{
> > +     struct ice_aqc_pf_vf_msg *cmd;
> > +     struct ice_aq_desc desc;
> > +
> > +     ice_fill_dflt_direct_cmd_desc(&desc, ice_mbx_opc_send_msg_to_vf);
> > +
> > +     cmd = &desc.params.virt;
> > +     cmd->id = CPU_TO_LE32(vfid);
> > +
> > +     desc.cookie_high = CPU_TO_LE32(v_opcode);
> > +     desc.cookie_low = CPU_TO_LE32(v_retval);
> > +
> > +     if (msglen)
> > +             desc.flags |= CPU_TO_LE16(ICE_AQ_FLAG_RD);
> > +
> > +     return ice_sq_send_cmd(hw, &hw->mailboxq, &desc, msg, msglen, cd);
> > +}
> > +
> > +/**
> > + * ice_aq_send_msg_to_pf
> > + * @hw: pointer to the hardware structure
> > + * @v_opcode: opcodes for VF-PF communication
> > + * @v_retval: return error code
> > + * @msg: pointer to the msg buffer
> > + * @msglen: msg length
> > + * @cd: pointer to command details
> > + *
> > + * Send message to PF driver using mailbox queue. By default, this
> > + * message is sent asynchronously, i.e. ice_sq_send_cmd()
> > + * does not wait for completion before returning.
> > + */
> > +enum ice_status
> > +ice_aq_send_msg_to_pf(struct ice_hw *hw, enum virtchnl_ops v_opcode,
> > +                   enum ice_status v_retval, u8 *msg, u16 msglen,
> > +                   struct ice_sq_cd *cd)
> > +{
> > +     struct ice_aq_desc desc;
> > +
> > +     ice_fill_dflt_direct_cmd_desc(&desc, ice_mbx_opc_send_msg_to_pf);
> > +     desc.cookie_high = CPU_TO_LE32(v_opcode);
> > +     desc.cookie_low = CPU_TO_LE32(v_retval);
> > +
> > +     if (msglen)
> > +             desc.flags |= CPU_TO_LE16(ICE_AQ_FLAG_RD);
> > +
> > +     return ice_sq_send_cmd(hw, &hw->mailboxq, &desc, msg, msglen, cd);
> > +}
> > +
> > +/**
> > + * ice_conv_link_speed_to_virtchnl
> > + * @adv_link_support: determines the format of the returned link speed
> > + * @link_speed: variable containing the link_speed to be converted
> > + *
> > + * Convert link speed supported by HW to link speed supported by
> virtchnl.
> > + * If adv_link_support is true, then return link speed in Mbps. Else
> return
> > + * link speed as a VIRTCHNL_LINK_SPEED_* casted to a u32. Note that the
> caller
> > + * needs to cast back to an enum virtchnl_link_speed in the case where
> > + * adv_link_support is false, but when adv_link_support is true the
> caller can
> > + * expect the speed in Mbps.
> > + */
> > +u32 ice_conv_link_speed_to_virtchnl(bool adv_link_support, u16
> link_speed)
> > +{
> > +     u32 speed;
> > +
> > +     if (adv_link_support)
> > +             switch (link_speed) {
> > +             case ICE_AQ_LINK_SPEED_10MB:
> > +                     speed = ICE_LINK_SPEED_10MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_100MB:
> > +                     speed = ICE_LINK_SPEED_100MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_1000MB:
> > +                     speed = ICE_LINK_SPEED_1000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_2500MB:
> > +                     speed = ICE_LINK_SPEED_2500MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_5GB:
> > +                     speed = ICE_LINK_SPEED_5000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_10GB:
> > +                     speed = ICE_LINK_SPEED_10000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_20GB:
> > +                     speed = ICE_LINK_SPEED_20000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_25GB:
> > +                     speed = ICE_LINK_SPEED_25000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_40GB:
> > +                     speed = ICE_LINK_SPEED_40000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_50GB:
> > +                     speed = ICE_LINK_SPEED_50000MBPS;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_100GB:
> > +                     speed = ICE_LINK_SPEED_100000MBPS;
> > +                     break;
> > +             default:
> > +                     speed = ICE_LINK_SPEED_UNKNOWN;
> > +                     break;
> > +             }
> > +     else
> > +             /* Virtchnl speeds are not defined for every speed
> supported in
> > +              * the hardware. To maintain compatibility with older AVF
> > +              * drivers, while reporting the speed the new speed values
> are
> > +              * resolved to the closest known virtchnl speeds
> > +              */
> > +             switch (link_speed) {
> > +             case ICE_AQ_LINK_SPEED_10MB:
> > +             case ICE_AQ_LINK_SPEED_100MB:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_100MB;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_1000MB:
> > +             case ICE_AQ_LINK_SPEED_2500MB:
> > +             case ICE_AQ_LINK_SPEED_5GB:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_1GB;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_10GB:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_10GB;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_20GB:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_20GB;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_25GB:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_25GB;
> > +                     break;
> > +             case ICE_AQ_LINK_SPEED_40GB:
> > +             case ICE_AQ_LINK_SPEED_50GB:
> > +             case ICE_AQ_LINK_SPEED_100GB:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_40GB;
> > +                     break;
> > +             default:
> > +                     speed = (u32)VIRTCHNL_LINK_SPEED_UNKNOWN;
> > +                     break;
> > +             }
> > +
> > +     return speed;
> > +}
> > +
> > +/* The mailbox overflow detection algorithm helps to check if there
> > + * is a possibility of a malicious VF transmitting too many MBX
> messages to the
> > + * PF.
> > + * 1. The mailbox snapshot structure, ice_mbx_snapshot, is initialized
> during
> > + * driver initialization in ice_init_hw() using ice_mbx_init_snapshot().
> > + * The struct ice_mbx_snapshot helps to track and traverse a static
> window of
> > + * messages within the mailbox queue while looking for a malicious VF.
> > + *
> > + * 2. When the caller starts processing its mailbox queue in response
> to an
> > + * interrupt, the structure ice_mbx_snapshot is expected to be cleared
> before
> > + * the algorithm can be run for the first time for that interrupt. This
> can be
> > + * done via ice_mbx_reset_snapshot().
> > + *
> > + * 3. For every message read by the caller from the MBX Queue, the
> caller must
> > + * call the detection algorithm's entry function
> ice_mbx_vf_state_handler().
> > + * Before every call to ice_mbx_vf_state_handler() the struct
> ice_mbx_data is
> > + * filled as it is required to be passed to the algorithm.
> > + *
> > + * 4. Every time a message is read from the MBX queue, a VFId is
> received which
> > + * is passed to the state handler. The boolean output is_malvf of the
> state
> > + * handler ice_mbx_vf_state_handler() serves as an indicator to the
> caller
> > + * whether this VF is malicious or not.
> > + *
> > + * 5. When a VF is identified to be malicious, the caller can send a
> message
> > + * to the system administrator. The caller can invoke
> ice_mbx_report_malvf()
> > + * to help determine if a malicious VF is to be reported or not. This
> function
> > + * requires the caller to maintain a global bitmap to track all
> malicious VFs
> > + * and pass that to ice_mbx_report_malvf() along with the VFID which
> was identified
> > + * to be malicious by ice_mbx_vf_state_handler().
> > + *
> > + * 6. The global bitmap maintained by PF can be cleared completely if
> PF is in
> > + * reset or the bit corresponding to a VF can be cleared if that VF is
> in reset.
> > + * When a VF is shut down and brought back up, we assume that the new VF
> > + * brought up is not malicious and hence report it if found malicious.
> > + *
> > + * 7. The function ice_mbx_reset_snapshot() is called to reset the
> information
> > + * in ice_mbx_snapshot for every new mailbox interrupt handled.
> > + *
> > + * 8. The memory allocated for variables in ice_mbx_snapshot is
> de-allocated
> > + * when driver is unloaded.
> > + */
> > +#define ICE_RQ_DATA_MASK(rq_data) ((rq_data) & PF_MBX_ARQH_ARQH_M)
> > +/* Using the highest value for an unsigned 16-bit value 0xFFFF to
> indicate that
> > + * the max messages check must be ignored in the algorithm
> > + */
> > +#define ICE_IGNORE_MAX_MSG_CNT       0xFFFF
> > +
> > +/**
> > + * ice_mbx_traverse - Pass through mailbox snapshot
> > + * @hw: pointer to the HW struct
> > + * @new_state: new algorithm state
> > + *
> > + * Traversing the mailbox static snapshot without checking
> > + * for malicious VFs.
> > + */
> > +static void
> > +ice_mbx_traverse(struct ice_hw *hw,
> > +              enum ice_mbx_snapshot_state *new_state)
> > +{
> > +     struct ice_mbx_snap_buffer_data *snap_buf;
> > +     u32 num_iterations;
> > +
> > +     snap_buf = &hw->mbx_snapshot.mbx_buf;
> > +
> > +     /* As mailbox buffer is circular, applying a mask
> > +      * on the incremented iteration count.
> > +      */
> > +     num_iterations = ICE_RQ_DATA_MASK(++snap_buf->num_iterations);
> > +
> > +     /* Checking either of the below conditions to exit snapshot
> traversal:
> > +      * Condition-1: If the number of iterations in the mailbox is
> equal to
> > +      * the mailbox head which would indicate that we have reached the
> end
> > +      * of the static snapshot.
> > +      * Condition-2: If the maximum messages serviced in the mailbox
> for a
> > +      * given interrupt is the highest possible value then there is no
> need
> > +      * to check if the number of messages processed is equal to it. If
> not
> > +      * check if the number of messages processed is greater than or
> equal
> > +      * to the maximum number of mailbox entries serviced in current
> work item.
> > +      */
> > +     if (num_iterations == snap_buf->head ||
> > +         (snap_buf->max_num_msgs_mbx < ICE_IGNORE_MAX_MSG_CNT &&
> > +          ++snap_buf->num_msg_proc >= snap_buf->max_num_msgs_mbx))
> > +             *new_state = ICE_MAL_VF_DETECT_STATE_NEW_SNAPSHOT;
> > +}
> > +
> > +/**
> > + * ice_mbx_detect_malvf - Detect malicious VF in snapshot
> > + * @hw: pointer to the HW struct
> > + * @vf_id: relative virtual function ID
> > + * @new_state: new algorithm state
> > + * @is_malvf: boolean output to indicate if VF is malicious
> > + *
> > + * This function tracks the number of asynchronous messages
> > + * sent per VF and marks the VF as malicious if it exceeds
> > + * the permissible number of messages to send.
> > + */
> > +static enum ice_status
> > +ice_mbx_detect_malvf(struct ice_hw *hw, u16 vf_id,
> > +                  enum ice_mbx_snapshot_state *new_state,
> > +                  bool *is_malvf)
> > +{
> > +     struct ice_mbx_snapshot *snap = &hw->mbx_snapshot;
> > +
> > +     if (vf_id >= snap->mbx_vf.vfcntr_len)
> > +             return ICE_ERR_OUT_OF_RANGE;
> > +
> > +     /* increment the message count in the VF array */
> > +     snap->mbx_vf.vf_cntr[vf_id]++;
> > +
> > +     if (snap->mbx_vf.vf_cntr[vf_id] >= ICE_ASYNC_VF_MSG_THRESHOLD)
> > +             *is_malvf = true;
> > +
> > +     /* continue to iterate through the mailbox snapshot */
> > +     ice_mbx_traverse(hw, new_state);
> > +
> > +     return ICE_SUCCESS;
> > +}
> > +
> > +/**
> > + * ice_mbx_reset_snapshot - Reset mailbox snapshot structure
> > + * @snap: pointer to mailbox snapshot structure in the ice_hw struct
> > + *
> > + * Reset the mailbox snapshot structure and clear VF counter array.
> > + */
> > +static void ice_mbx_reset_snapshot(struct ice_mbx_snapshot *snap)
> > *** 15611 LINES SKIPPED ***
>
>
>
>

[-- Attachment #2 --]
<div dir="auto"><div><br><br><div class="gmail_quote"><div dir="ltr" class="gmail_attr">On Thu, Aug 15, 2024, 9:12 PM Zhenlei Huang &lt;<a href="mailto:zlei@freebsd.org">zlei@freebsd.org</a>&gt; wrote:<br></div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">Hi Warner,<br>
<br>
I&#39;m not sure but this change seems include lots of unintended changes ( maybe some local WIP ) .<br></blockquote></div></div><div dir="auto"><br></div><div dir="auto">Git am somehow screwed me.  I&#39;ll fix.</div><div dir="auto"><br></div><div dir="auto">Warner</div><div dir="auto"><br></div><div dir="auto"><div class="gmail_quote"><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
&gt; On Aug 16, 2024, at 10:30 AM, Warner Losh &lt;imp@FreeBSD.org&gt; wrote:<br>
&gt; <br>
&gt; The branch main has been updated by imp:<br>
&gt; <br>
&gt; URL: <a href="https://cgit.FreeBSD.org/src/commit/?id=d5507f9e436698ac17dc5ace7ef58493988a9b04" rel="noreferrer noreferrer" target="_blank">https://cgit.FreeBSD.org/src/commit/?id=d5507f9e436698ac17dc5ace7ef58493988a9b04</a><br>
&gt; <br>
&gt; commit d5507f9e436698ac17dc5ace7ef58493988a9b04<br>
&gt; Author:     Warner Losh &lt;imp@FreeBSD.org&gt;<br>
&gt; AuthorDate: 2024-08-14 22:55:49 +0000<br>
&gt; Commit:     Warner Losh &lt;imp@FreeBSD.org&gt;<br>
&gt; CommitDate: 2024-08-16 02:22:18 +0000<br>
&gt; <br>
&gt;    nvme: Separate total failures from I/O failures<br>
&gt; <br>
&gt;    When it&#39;s a I/O failure, we can still send admin commands. Separate out<br>
&gt;    the admin failures and flag them as such so that we can still send admin<br>
&gt;    commands on half-failed drives.<br>
&gt; <br>
&gt;    Fixes: 9229b3105d88 (nvme: Fail passthrough commands right away in failed state)<br>
&gt;    Sponsored by: Netflix<br>
&gt; ---<br>
&gt; sys/amd64/conf/IOSCHED                             |    2 +<br>
&gt; sys/amd64/conf/MPI3MR                              |   10 +<br>
&gt; sys/arm64/conf/GENERIC16K                          |    4 +<br>
&gt; .../linuxkpi/common/include/linux/#compiler.h#     |  117 +<br>
&gt; sys/contrib/dev/iwlwifi/fw/api/soc.h               |   35 +<br>
&gt; sys/contrib/zlib/contrib/asm686/README.686         |   51 +<br>
&gt; sys/contrib/zlib/contrib/asm686/match.S            |  357 +<br>
&gt; sys/dev/ice/ice_sriov.c                            |  595 ++<br>
&gt; sys/dev/ice/ice_sriov.h                            |   64 +<br>
&gt; sys/dev/mps/mpi/mpi2_pci.h                         |  141 +<br>
&gt; sys/dev/nvme/nvme_ctrlr.c                          |   46 +-<br>
&gt; sys/dev/nvme/nvme_private.h                        |    1 +<br>
&gt; sys/dev/nvme/nvme_qpair.c                          |   23 +-<br>
&gt; sys/dev/nvme/nvme_sim.c                            |   13 +-<br>
&gt; sys/dev/sound/pci/aureal.c                         |  686 ++<br>
&gt; sys/dev/sound/pci/aureal.h                         |   99 +<br>
&gt; sys/dev/sound/pci/ds1-fw.h                         | 1602 ++++<br>
&gt; sys/dev/sound/pci/ds1.c                            | 1103 +++<br>
&gt; sys/dev/sound/pci/ds1.h                            |  146 +<br>
&gt; sys/dev/sound/pci/maestro.c                        | 2043 +++++<br>
&gt; sys/dev/sound/pci/maestro_reg.h                    |  381 +<br>
&gt; sys/kern/bsduser-syscalls.c                        | 8712 ++++++++++++++++++++<br>
&gt; sys/modules/sound/driver/ds1/Makefile              |    8 +<br>
&gt; sys/modules/sound/driver/maestro/Makefile          |    8 +<br>
&gt; 24 files changed, 16219 insertions(+), 28 deletions(-)<br>
&gt; <br>
&gt; diff --git a/sys/amd64/conf/IOSCHED b/sys/amd64/conf/IOSCHED<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..e15106bc4c1f<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/amd64/conf/IOSCHED<br>
&gt; @@ -0,0 +1,2 @@<br>
&gt; +include &quot;GENERIC&quot;<br>
&gt; +options CAM_IOSCHED_DYNAMIC<br>
&gt; diff --git a/sys/amd64/conf/MPI3MR b/sys/amd64/conf/MPI3MR<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..99e5244cb49d<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/amd64/conf/MPI3MR<br>
&gt; @@ -0,0 +1,10 @@<br>
&gt; +include GENERIC<br>
&gt; +<br>
&gt; +device mpi3mr<br>
&gt; +# All the debugging options<br>
&gt; +options DEADLKRES # Enable the deadlock resolver<br>
&gt; +options INVARIANTS # Enable calls of extra sanity checking<br>
&gt; +options INVARIANT_SUPPORT # Extra sanity checks of internal structures, required by INVARIANTS<br>
&gt; +options QUEUE_MACRO_DEBUG_TRASH # Trash queue(2) internal pointers on invalidation<br>
&gt; +options WITNESS # Enable checks to detect deadlocks and cycles<br>
&gt; +options WITNESS_SKIPSPIN # Don&#39;t run witness on spinlocks for speed<br>
&gt; diff --git a/sys/arm64/conf/GENERIC16K b/sys/arm64/conf/GENERIC16K<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..9bf9e2dadb08<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/arm64/conf/GENERIC16K<br>
&gt; @@ -0,0 +1,4 @@<br>
&gt; +include              &quot;GENERIC&quot;<br>
&gt; +<br>
&gt; +ident                GENERIC_16K<br>
&gt; +<br>
&gt; diff --git a/sys/compat/linuxkpi/common/include/linux/#compiler.h# b/sys/compat/linuxkpi/common/include/linux/#compiler.h#<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..1177674aa68f<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/compat/linuxkpi/common/include/linux/#compiler.h#<br>
&gt; @@ -0,0 +1,117 @@<br>
&gt; +/*-<br>
&gt; + * Copyright (c) 2010 Isilon Systems, Inc.<br>
&gt; + * Copyright (c) 2010 iX Systems, Inc.<br>
&gt; + * Copyright (c) 2010 Panasas, Inc.<br>
&gt; + * Copyright (c) 2013-2016 Mellanox Technologies, Ltd.<br>
&gt; + * Copyright (c) 2015 François Tigeot<br>
&gt; + * All rights reserved.<br>
&gt; + *<br>
&gt; + * Redistribution and use in source and binary forms, with or without<br>
&gt; + * modification, are permitted provided that the following conditions<br>
&gt; + * are met:<br>
&gt; + * 1. Redistributions of source code must retain the above copyright<br>
&gt; + *    notice unmodified, this list of conditions, and the following<br>
&gt; + *    disclaimer.<br>
&gt; + * 2. Redistributions in binary form must reproduce the above copyright<br>
&gt; + *    notice, this list of conditions and the following disclaimer in the<br>
&gt; + *    documentation and/or other materials provided with the distribution.<br>
&gt; + *<br>
&gt; + * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS&#39;&#39; AND ANY EXPRESS OR<br>
&gt; + * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES<br>
&gt; + * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.<br>
&gt; + * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,<br>
&gt; + * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT<br>
&gt; + * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,<br>
&gt; + * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY<br>
&gt; + * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT<br>
&gt; + * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF<br>
&gt; + * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.<br>
&gt; + *<br>
&gt; + * $FreeBSD$<br>
&gt; + */<br>
&gt; +#ifndef      _LINUX_COMPILER_H_<br>
&gt; +#define      _LINUX_COMPILER_H_<br>
&gt; +<br>
&gt; +#include &lt;sys/cdefs.h&gt;<br>
&gt; +<br>
&gt; +#define __user<br>
&gt; +#define __kernel<br>
&gt; +#define __safe<br>
&gt; +#define __force<br>
&gt; +#define __nocast<br>
&gt; +#define __iomem<br>
&gt; +#define __chk_user_ptr(x)            ((void)0)<br>
&gt; +#define __chk_io_ptr(x)                      ((void)0)<br>
&gt; +#define __builtin_warning(x, y...)   (1)<br>
&gt; +#define __acquires(x)<br>
&gt; +#define __releases(x)<br>
&gt; +#define __acquire(x)                 do { } while (0)<br>
&gt; +#define __release(x)                 do { } while (0)<br>
&gt; +#define __cond_lock(x,c)             (c)<br>
&gt; +#define      __bitwise<br>
&gt; +#define __devinitdata<br>
&gt; +#define      __deprecated<br>
&gt; +#define __init<br>
&gt; +#define      __initconst<br>
&gt; +#define      __devinit<br>
&gt; +#define      __devexit<br>
&gt; +#define __exit<br>
&gt; +#define      __rcu<br>
&gt; +#define      __percpu<br>
&gt; +#define      __weak __weak_symbol<br>
&gt; +#define      __malloc<br>
&gt; +#define      ___stringify(...)               #__VA_ARGS__<br>
&gt; +#define      __stringify(...)                ___stringify(__VA_ARGS__)<br>
&gt; +#define      __attribute_const__             __attribute__((__const__))<br>
&gt; +#undef __always_inline<br>
&gt; +#define      __always_inline                 inline<br>
&gt; +#define      noinline                        __noinline<br>
&gt; +#define      ____cacheline_aligned           __aligned(CACHE_LINE_SIZE)<br>
&gt; +<br>
&gt; +#define      likely(x)                       __builtin_expect(!!(x), 1)<br>
&gt; +#define      unlikely(x)                     __builtin_expect(!!(x), 0)<br>
&gt; +#define typeof(x)                    __typeof(x)<br>
&gt; +<br>
&gt; +#define      uninitialized_var(x)            x = x<br>
&gt; +#define      __maybe_unused                  __unused<br>
&gt; +#define      __always_unused                 __unused<br>
&gt; +#define      __must_check                    __result_use_check<br>
&gt; +<br>
&gt; +#define      __printf(a,b)                   __printflike(a,b)<br>
&gt; +<br>
&gt; +#define      barrier()                       __asm__ __volatile__(&quot;&quot;: : :&quot;memory&quot;)<br>
&gt; +<br>
&gt; +#if defined(LINUXKPI_VERSION) &amp;&amp; LINUXKPI_VERSION &gt;= 50000<br>
&gt; +/* Moved from drm_os_freebsd.h */<br>
&gt; +#define      lower_32_bits(n)                ((u32)(n))<br>
&gt; +#define      upper_32_bits(n)                ((u32)(((n) &gt;&gt; 16) &gt;&gt; 16))<br>
&gt; +#endif<br>
&gt; +<br>
&gt; +#define      ___PASTE(a,b) a##b<br>
&gt; +#define      __PASTE(a,b) ___PASTE(a,b)<br>
&gt; +<br>
&gt; +#define      ACCESS_ONCE(x)                  (*(volatile __typeof(x) *)&amp;(x))<br>
&gt; +<br>
&gt; +#define      WRITE_ONCE(x,v) do {            \<br>
&gt; +     barrier();                      \<br>
&gt; +     ACCESS_ONCE(x) = (v);           \<br>
&gt; +     barrier();                      \<br>
&gt; +} while (0)<br>
&gt; +<br>
&gt; +#define      READ_ONCE(x) ({                 \<br>
&gt; +     __typeof(x) __var = ({          \<br>
&gt; +             barrier();              \<br>
&gt; +             ACCESS_ONCE(x);         \<br>
&gt; +     });                             \<br>
&gt; +     barrier();                      \<br>
&gt; +     __var;                          \<br>
&gt; +})<br>
&gt; +<br>
&gt; +#define      lockless_dereference(p) READ_ONCE(p)<br>
&gt; +<br>
&gt; +#define      _AT(T,X)        ((T)(X))<br>
&gt; +<br>
&gt; +#define      __same_type(a, b)       __builtin_types_compatible_p(typeof(a), typeof(b))<br>
&gt; +#define      __must_be_array(a)      __same_type(a, &amp;(a)[0])<br>
&gt; +<br>
&gt; +#endif       /* _LINUX_COMPILER_H_ */<br>
&gt; diff --git a/sys/contrib/dev/iwlwifi/fw/api/soc.h b/sys/contrib/dev/iwlwifi/fw/api/soc.h<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..c5df1171462b<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/contrib/dev/iwlwifi/fw/api/soc.h<br>
&gt; @@ -0,0 +1,35 @@<br>
&gt; +/* SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause */<br>
&gt; +/*<br>
&gt; + * Copyright (C) 2012-2014, 2019-2020 Intel Corporation<br>
&gt; + * Copyright (C) 2013-2015 Intel Mobile Communications GmbH<br>
&gt; + * Copyright (C) 2016-2017 Intel Deutschland GmbH<br>
&gt; + */<br>
&gt; +#ifndef __iwl_fw_api_soc_h__<br>
&gt; +#define __iwl_fw_api_soc_h__<br>
&gt; +<br>
&gt; +#define SOC_CONFIG_CMD_FLAGS_DISCRETE                BIT(0)<br>
&gt; +#define SOC_CONFIG_CMD_FLAGS_LOW_LATENCY     BIT(1)<br>
&gt; +<br>
&gt; +#define SOC_FLAGS_LTR_APPLY_DELAY_MASK               0xc<br>
&gt; +#define SOC_FLAGS_LTR_APPLY_DELAY_NONE               0<br>
&gt; +#define SOC_FLAGS_LTR_APPLY_DELAY_200                1<br>
&gt; +#define SOC_FLAGS_LTR_APPLY_DELAY_2500               2<br>
&gt; +#define SOC_FLAGS_LTR_APPLY_DELAY_1820               3<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * struct iwl_soc_configuration_cmd - Set device stabilization latency<br>
&gt; + *<br>
&gt; + * @flags: soc settings flags.  In VER_1, we can only set the DISCRETE<br>
&gt; + *   flag, because the FW treats the whole value as an integer. In<br>
&gt; + *   VER_2, we can set the bits independently.<br>
&gt; + * @latency: time for SOC to ensure stable power &amp; XTAL<br>
&gt; + */<br>
&gt; +struct iwl_soc_configuration_cmd {<br>
&gt; +     __le32 flags;<br>
&gt; +     __le32 latency;<br>
&gt; +} __packed; /*<br>
&gt; +          * SOC_CONFIGURATION_CMD_S_VER_1 (see description above)<br>
&gt; +          * SOC_CONFIGURATION_CMD_S_VER_2<br>
&gt; +          */<br>
&gt; +<br>
&gt; +#endif /* __iwl_fw_api_soc_h__ */<br>
&gt; diff --git a/sys/contrib/zlib/contrib/asm686/README.686 b/sys/contrib/zlib/contrib/asm686/README.686<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..a0bf3bea4aff<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/contrib/zlib/contrib/asm686/README.686<br>
&gt; @@ -0,0 +1,51 @@<br>
&gt; +This is a patched version of zlib, modified to use<br>
&gt; +Pentium-Pro-optimized assembly code in the deflation algorithm. The<br>
&gt; +files changed/added by this patch are:<br>
&gt; +<br>
&gt; +README.686<br>
&gt; +match.S<br>
&gt; +<br>
&gt; +The speedup that this patch provides varies, depending on whether the<br>
&gt; +compiler used to build the original version of zlib falls afoul of the<br>
&gt; +PPro&#39;s speed traps. My own tests show a speedup of around 10-20% at<br>
&gt; +the default compression level, and 20-30% using -9, against a version<br>
&gt; +compiled using gcc 2.7.2.3. Your mileage may vary.<br>
&gt; +<br>
&gt; +Note that this code has been tailored for the PPro/PII in particular,<br>
&gt; +and will not perform particuarly well on a Pentium.<br>
&gt; +<br>
&gt; +If you are using an assembler other than GNU as, you will have to<br>
&gt; +translate match.S to use your assembler&#39;s syntax. (Have fun.)<br>
&gt; +<br>
&gt; +Brian Raiter<br>
&gt; +<a href="mailto:breadbox@muppetlabs.com" target="_blank" rel="noreferrer">breadbox@muppetlabs.com</a><br>
&gt; +April, 1998<br>
&gt; +<br>
&gt; +<br>
&gt; +Added for zlib 1.1.3:<br>
&gt; +<br>
&gt; +The patches come from<br>
&gt; +<a href="http://www.muppetlabs.com/~breadbox/software/assembly.html" rel="noreferrer noreferrer" target="_blank">http://www.muppetlabs.com/~breadbox/software/assembly.html</a><br>
&gt; +<br>
&gt; +To compile zlib with this asm file, copy match.S to the zlib directory<br>
&gt; +then do:<br>
&gt; +<br>
&gt; +CFLAGS=&quot;-O3 -DASMV&quot; ./configure<br>
&gt; +make OBJA=match.o<br>
&gt; +<br>
&gt; +<br>
&gt; +Update:<br>
&gt; +<br>
&gt; +I&#39;ve been ignoring these assembly routines for years, believing that<br>
&gt; +gcc&#39;s generated code had caught up with it sometime around gcc 2.95<br>
&gt; +and the major rearchitecting of the Pentium 4. However, I recently<br>
&gt; +learned that, despite what I believed, this code still has some life<br>
&gt; +in it. On the Pentium 4 and AMD64 chips, it continues to run about 8%<br>
&gt; +faster than the code produced by gcc 4.1.<br>
&gt; +<br>
&gt; +In acknowledgement of its continuing usefulness, I&#39;ve altered the<br>
&gt; +license to match that of the rest of zlib. Share and Enjoy!<br>
&gt; +<br>
&gt; +Brian Raiter<br>
&gt; +<a href="mailto:breadbox@muppetlabs.com" target="_blank" rel="noreferrer">breadbox@muppetlabs.com</a><br>
&gt; +April, 2007<br>
&gt; diff --git a/sys/contrib/zlib/contrib/asm686/match.S b/sys/contrib/zlib/contrib/asm686/match.S<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..fa421092785d<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/contrib/zlib/contrib/asm686/match.S<br>
&gt; @@ -0,0 +1,357 @@<br>
&gt; +/* match.S -- x86 assembly version of the zlib longest_match() function.<br>
&gt; + * Optimized for the Intel 686 chips (PPro and later).<br>
&gt; + *<br>
&gt; + * Copyright (C) 1998, 2007 Brian Raiter &lt;<a href="mailto:breadbox@muppetlabs.com" target="_blank" rel="noreferrer">breadbox@muppetlabs.com</a>&gt;<br>
&gt; + *<br>
&gt; + * This software is provided &#39;as-is&#39;, without any express or implied<br>
&gt; + * warranty.  In no event will the author be held liable for any damages<br>
&gt; + * arising from the use of this software.<br>
&gt; + *<br>
&gt; + * Permission is granted to anyone to use this software for any purpose,<br>
&gt; + * including commercial applications, and to alter it and redistribute it<br>
&gt; + * freely, subject to the following restrictions:<br>
&gt; + *<br>
&gt; + * 1. The origin of this software must not be misrepresented; you must not<br>
&gt; + *    claim that you wrote the original software. If you use this software<br>
&gt; + *    in a product, an acknowledgment in the product documentation would be<br>
&gt; + *    appreciated but is not required.<br>
&gt; + * 2. Altered source versions must be plainly marked as such, and must not be<br>
&gt; + *    misrepresented as being the original software.<br>
&gt; + * 3. This notice may not be removed or altered from any source distribution.<br>
&gt; + */<br>
&gt; +<br>
&gt; +#ifndef NO_UNDERLINE<br>
&gt; +#define      match_init      _match_init<br>
&gt; +#define      longest_match   _longest_match<br>
&gt; +#endif<br>
&gt; +<br>
&gt; +#define      MAX_MATCH       (258)<br>
&gt; +#define      MIN_MATCH       (3)<br>
&gt; +#define      MIN_LOOKAHEAD   (MAX_MATCH + MIN_MATCH + 1)<br>
&gt; +#define      MAX_MATCH_8     ((MAX_MATCH + 7) &amp; ~7)<br>
&gt; +<br>
&gt; +/* stack frame offsets */<br>
&gt; +<br>
&gt; +#define      chainlenwmask           0       /* high word: current chain len */<br>
&gt; +                                     /* low word: s-&gt;wmask           */<br>
&gt; +#define      window                  4       /* local copy of s-&gt;window      */<br>
&gt; +#define      windowbestlen           8       /* s-&gt;window + bestlen          */<br>
&gt; +#define      scanstart               16      /* first two bytes of string    */<br>
&gt; +#define      scanend                 12      /* last two bytes of string     */<br>
&gt; +#define      scanalign               20      /* dword-misalignment of string */<br>
&gt; +#define      nicematch               24      /* a good enough match size     */<br>
&gt; +#define      bestlen                 28      /* size of best match so far    */<br>
&gt; +#define      scan                    32      /* ptr to string wanting match  */<br>
&gt; +<br>
&gt; +#define      LocalVarsSize           (36)<br>
&gt; +/*   saved ebx               36 */<br>
&gt; +/*   saved edi               40 */<br>
&gt; +/*   saved esi               44 */<br>
&gt; +/*   saved ebp               48 */<br>
&gt; +/*   return address          52 */<br>
&gt; +#define      deflatestate            56      /* the function arguments       */<br>
&gt; +#define      curmatch                60<br>
&gt; +<br>
&gt; +/* All the +zlib1222add offsets are due to the addition of fields<br>
&gt; + *  in zlib in the deflate_state structure since the asm code was first written<br>
&gt; + * (if you compile with zlib 1.0.4 or older, use &quot;zlib1222add equ (-4)&quot;).<br>
&gt; + * (if you compile with zlib between 1.0.5 and 1.2.2.1, use &quot;zlib1222add equ 0&quot;).<br>
&gt; + * if you compile with zlib 1.2.2.2 or later , use &quot;zlib1222add equ 8&quot;).<br>
&gt; + */<br>
&gt; +<br>
&gt; +#define zlib1222add          (8)<br>
&gt; +<br>
&gt; +#define      dsWSize                 (36+zlib1222add)<br>
&gt; +#define      dsWMask                 (44+zlib1222add)<br>
&gt; +#define      dsWindow                (48+zlib1222add)<br>
&gt; +#define      dsPrev                  (56+zlib1222add)<br>
&gt; +#define      dsMatchLen              (88+zlib1222add)<br>
&gt; +#define      dsPrevMatch             (92+zlib1222add)<br>
&gt; +#define      dsStrStart              (100+zlib1222add)<br>
&gt; +#define      dsMatchStart            (104+zlib1222add)<br>
&gt; +#define      dsLookahead             (108+zlib1222add)<br>
&gt; +#define      dsPrevLen               (112+zlib1222add)<br>
&gt; +#define      dsMaxChainLen           (116+zlib1222add)<br>
&gt; +#define      dsGoodMatch             (132+zlib1222add)<br>
&gt; +#define      dsNiceMatch             (136+zlib1222add)<br>
&gt; +<br>
&gt; +<br>
&gt; +.file &quot;match.S&quot;<br>
&gt; +<br>
&gt; +.globl       match_init, longest_match<br>
&gt; +<br>
&gt; +.text<br>
&gt; +<br>
&gt; +/* uInt longest_match(deflate_state *deflatestate, IPos curmatch) */<br>
&gt; +.cfi_sections        .debug_frame<br>
&gt; +<br>
&gt; +longest_match:<br>
&gt; +<br>
&gt; +.cfi_startproc<br>
&gt; +/* Save registers that the compiler may be using, and adjust %esp to */<br>
&gt; +/* make room for our stack frame.                                    */<br>
&gt; +<br>
&gt; +             pushl   %ebp<br>
&gt; +             .cfi_def_cfa_offset 8<br>
&gt; +             .cfi_offset ebp, -8<br>
&gt; +             pushl   %edi<br>
&gt; +             .cfi_def_cfa_offset 12<br>
&gt; +             pushl   %esi<br>
&gt; +             .cfi_def_cfa_offset 16<br>
&gt; +             pushl   %ebx<br>
&gt; +             .cfi_def_cfa_offset 20<br>
&gt; +             subl    $LocalVarsSize, %esp<br>
&gt; +             .cfi_def_cfa_offset LocalVarsSize+20<br>
&gt; +<br>
&gt; +/* Retrieve the function arguments. %ecx will hold cur_match         */<br>
&gt; +/* throughout the entire function. %edx will hold the pointer to the */<br>
&gt; +/* deflate_state structure during the function&#39;s setup (before               */<br>
&gt; +/* entering the main loop).                                          */<br>
&gt; +<br>
&gt; +             movl    deflatestate(%esp), %edx<br>
&gt; +             movl    curmatch(%esp), %ecx<br>
&gt; +<br>
&gt; +/* uInt wmask = s-&gt;w_mask;                                           */<br>
&gt; +/* unsigned chain_length = s-&gt;max_chain_length;                              */<br>
&gt; +/* if (s-&gt;prev_length &gt;= s-&gt;good_match) {                            */<br>
&gt; +/*     chain_length &gt;&gt;= 2;                                           */<br>
&gt; +/* }                                                                 */<br>
&gt; + <br>
&gt; +             movl    dsPrevLen(%edx), %eax<br>
&gt; +             movl    dsGoodMatch(%edx), %ebx<br>
&gt; +             cmpl    %ebx, %eax<br>
&gt; +             movl    dsWMask(%edx), %eax<br>
&gt; +             movl    dsMaxChainLen(%edx), %ebx<br>
&gt; +             jl      LastMatchGood<br>
&gt; +             shrl    $2, %ebx<br>
&gt; +LastMatchGood:<br>
&gt; +<br>
&gt; +/* chainlen is decremented once beforehand so that the function can  */<br>
&gt; +/* use the sign flag instead of the zero flag for the exit test.     */<br>
&gt; +/* It is then shifted into the high word, to make room for the wmask */<br>
&gt; +/* value, which it will always accompany.                            */<br>
&gt; +<br>
&gt; +             decl    %ebx<br>
&gt; +             shll    $16, %ebx<br>
&gt; +             orl     %eax, %ebx<br>
&gt; +             movl    %ebx, chainlenwmask(%esp)<br>
&gt; +<br>
&gt; +/* if ((uInt)nice_match &gt; s-&gt;lookahead) nice_match = s-&gt;lookahead;   */<br>
&gt; +<br>
&gt; +             movl    dsNiceMatch(%edx), %eax<br>
&gt; +             movl    dsLookahead(%edx), %ebx<br>
&gt; +             cmpl    %eax, %ebx<br>
&gt; +             jl      LookaheadLess<br>
&gt; +             movl    %eax, %ebx<br>
&gt; +LookaheadLess:       movl    %ebx, nicematch(%esp)<br>
&gt; +<br>
&gt; +/* register Bytef *scan = s-&gt;window + s-&gt;strstart;                   */<br>
&gt; +<br>
&gt; +             movl    dsWindow(%edx), %esi<br>
&gt; +             movl    %esi, window(%esp)<br>
&gt; +             movl    dsStrStart(%edx), %ebp<br>
&gt; +             lea     (%esi,%ebp), %edi<br>
&gt; +             movl    %edi, scan(%esp)<br>
&gt; +<br>
&gt; +/* Determine how many bytes the scan ptr is off from being           */<br>
&gt; +/* dword-aligned.                                                    */<br>
&gt; +<br>
&gt; +             movl    %edi, %eax<br>
&gt; +             negl    %eax<br>
&gt; +             andl    $3, %eax<br>
&gt; +             movl    %eax, scanalign(%esp)<br>
&gt; +<br>
&gt; +/* IPos limit = s-&gt;strstart &gt; (IPos)MAX_DIST(s) ?                    */<br>
&gt; +/*     s-&gt;strstart - (IPos)MAX_DIST(s) : NIL;                                */<br>
&gt; +<br>
&gt; +             movl    dsWSize(%edx), %eax<br>
&gt; +             subl    $MIN_LOOKAHEAD, %eax<br>
&gt; +             subl    %eax, %ebp<br>
&gt; +             jg      LimitPositive<br>
&gt; +             xorl    %ebp, %ebp<br>
&gt; +LimitPositive:<br>
&gt; +<br>
&gt; +/* int best_len = s-&gt;prev_length;                                    */<br>
&gt; +<br>
&gt; +             movl    dsPrevLen(%edx), %eax<br>
&gt; +             movl    %eax, bestlen(%esp)<br>
&gt; +<br>
&gt; +/* Store the sum of s-&gt;window + best_len in %esi, and locally in windowbestlen. */<br>
&gt; +<br>
&gt; +             addl    %eax, %esi<br>
&gt; +             movl    %esi, windowbestlen(%esp)<br>
&gt; +<br>
&gt; +/* register ush scan_start = *(ushf*)scan;                           */<br>
&gt; +/* register ush scan_end   = *(ushf*)(scan+best_len-1);                      */<br>
&gt; +/* Posf *prev = s-&gt;prev;                                             */<br>
&gt; +<br>
&gt; +             movzwl  (%edi), %ebx<br>
&gt; +             movl    %ebx, scanstart(%esp)<br>
&gt; +             movzwl  -1(%edi,%eax), %ebx<br>
&gt; +             movl    %ebx, scanend(%esp)<br>
&gt; +             movl    dsPrev(%edx), %edi<br>
&gt; +<br>
&gt; +/* Jump into the main loop.                                          */<br>
&gt; +<br>
&gt; +             movl    chainlenwmask(%esp), %edx<br>
&gt; +             jmp     LoopEntry<br>
&gt; +<br>
&gt; +.balign 16<br>
&gt; +<br>
&gt; +/* do {<br>
&gt; + *     match = s-&gt;window + cur_match;<br>
&gt; + *     if (*(ushf*)(match+best_len-1) != scan_end ||<br>
&gt; + *         *(ushf*)match != scan_start) continue;<br>
&gt; + *     [...]<br>
&gt; + * } while ((cur_match = prev[cur_match &amp; wmask]) &gt; limit<br>
&gt; + *          &amp;&amp; --chain_length != 0);<br>
&gt; + *<br>
&gt; + * Here is the inner loop of the function. The function will spend the<br>
&gt; + * majority of its time in this loop, and the majority of that time will<br>
&gt; + * be spent in the first ten instructions.<br>
&gt; + *<br>
&gt; + * Within this loop:<br>
&gt; + * %ebx = scanend<br>
&gt; + * %ecx = curmatch<br>
&gt; + * %edx = chainlenwmask - i.e., ((chainlen &lt;&lt; 16) | wmask)<br>
&gt; + * %esi = windowbestlen - i.e., (window + bestlen)<br>
&gt; + * %edi = prev<br>
&gt; + * %ebp = limit<br>
&gt; + */<br>
&gt; +LookupLoop:<br>
&gt; +             andl    %edx, %ecx<br>
&gt; +             movzwl  (%edi,%ecx,2), %ecx<br>
&gt; +             cmpl    %ebp, %ecx<br>
&gt; +             jbe     LeaveNow<br>
&gt; +             subl    $0x00010000, %edx<br>
&gt; +             js      LeaveNow<br>
&gt; +LoopEntry:   movzwl  -1(%esi,%ecx), %eax<br>
&gt; +             cmpl    %ebx, %eax<br>
&gt; +             jnz     LookupLoop<br>
&gt; +             movl    window(%esp), %eax<br>
&gt; +             movzwl  (%eax,%ecx), %eax<br>
&gt; +             cmpl    scanstart(%esp), %eax<br>
&gt; +             jnz     LookupLoop<br>
&gt; +<br>
&gt; +/* Store the current value of chainlen.                                      */<br>
&gt; +<br>
&gt; +             movl    %edx, chainlenwmask(%esp)<br>
&gt; +<br>
&gt; +/* Point %edi to the string under scrutiny, and %esi to the string we        */<br>
&gt; +/* are hoping to match it up with. In actuality, %esi and %edi are   */<br>
&gt; +/* both pointed (MAX_MATCH_8 - scanalign) bytes ahead, and %edx is   */<br>
&gt; +/* initialized to -(MAX_MATCH_8 - scanalign).                                */<br>
&gt; +<br>
&gt; +             movl    window(%esp), %esi<br>
&gt; +             movl    scan(%esp), %edi<br>
&gt; +             addl    %ecx, %esi<br>
&gt; +             movl    scanalign(%esp), %eax<br>
&gt; +             movl    $(-MAX_MATCH_8), %edx<br>
&gt; +             lea     MAX_MATCH_8(%edi,%eax), %edi<br>
&gt; +             lea     MAX_MATCH_8(%esi,%eax), %esi<br>
&gt; +<br>
&gt; +/* Test the strings for equality, 8 bytes at a time. At the end,<br>
&gt; + * adjust %edx so that it is offset to the exact byte that mismatched.<br>
&gt; + *<br>
&gt; + * We already know at this point that the first three bytes of the<br>
&gt; + * strings match each other, and they can be safely passed over before<br>
&gt; + * starting the compare loop. So what this code does is skip over 0-3<br>
&gt; + * bytes, as much as necessary in order to dword-align the %edi<br>
&gt; + * pointer. (%esi will still be misaligned three times out of four.)<br>
&gt; + *<br>
&gt; + * It should be confessed that this loop usually does not represent<br>
&gt; + * much of the total running time. Replacing it with a more<br>
&gt; + * straightforward &quot;rep cmpsb&quot; would not drastically degrade<br>
&gt; + * performance.<br>
&gt; + */<br>
&gt; +LoopCmps:<br>
&gt; +             movl    (%esi,%edx), %eax<br>
&gt; +             xorl    (%edi,%edx), %eax<br>
&gt; +             jnz     LeaveLoopCmps<br>
&gt; +             movl    4(%esi,%edx), %eax<br>
&gt; +             xorl    4(%edi,%edx), %eax<br>
&gt; +             jnz     LeaveLoopCmps4<br>
&gt; +             addl    $8, %edx<br>
&gt; +             jnz     LoopCmps<br>
&gt; +             jmp     LenMaximum<br>
&gt; +LeaveLoopCmps4:      addl    $4, %edx<br>
&gt; +LeaveLoopCmps:       testl   $0x0000FFFF, %eax<br>
&gt; +             jnz     LenLower<br>
&gt; +             addl    $2, %edx<br>
&gt; +             shrl    $16, %eax<br>
&gt; +LenLower:    subb    $1, %al<br>
&gt; +             adcl    $0, %edx<br>
&gt; +<br>
&gt; +/* Calculate the length of the match. If it is MAX_MATCH or longer,  */<br>
&gt; +/* then automatically accept it as the best possible match and leave.        */<br>
&gt; +<br>
&gt; +             lea     (%edi,%edx), %eax<br>
&gt; +             movl    scan(%esp), %edi<br>
&gt; +             subl    %edi, %eax<br>
&gt; +             cmpl    $MAX_MATCH, %eax<br>
&gt; +             jge     LenMaximum<br>
&gt; +<br>
&gt; +/* If the length of the match is not longer than the best match we   */<br>
&gt; +/* have so far, then forget it and return to the lookup loop.                */<br>
&gt; +<br>
&gt; +             movl    deflatestate(%esp), %edx<br>
&gt; +             movl    bestlen(%esp), %ebx<br>
&gt; +             cmpl    %ebx, %eax<br>
&gt; +             jg      LongerMatch<br>
&gt; +             movl    windowbestlen(%esp), %esi<br>
&gt; +             movl    dsPrev(%edx), %edi<br>
&gt; +             movl    scanend(%esp), %ebx<br>
&gt; +             movl    chainlenwmask(%esp), %edx<br>
&gt; +             jmp     LookupLoop<br>
&gt; +<br>
&gt; +/*         s-&gt;match_start = cur_match;                                       */<br>
&gt; +/*         best_len = len;                                           */<br>
&gt; +/*         if (len &gt;= nice_match) break;                             */<br>
&gt; +/*         scan_end = *(ushf*)(scan+best_len-1);                     */<br>
&gt; +<br>
&gt; +LongerMatch: movl    nicematch(%esp), %ebx<br>
&gt; +             movl    %eax, bestlen(%esp)<br>
&gt; +             movl    %ecx, dsMatchStart(%edx)<br>
&gt; +             cmpl    %ebx, %eax<br>
&gt; +             jge     LeaveNow<br>
&gt; +             movl    window(%esp), %esi<br>
&gt; +             addl    %eax, %esi<br>
&gt; +             movl    %esi, windowbestlen(%esp)<br>
&gt; +             movzwl  -1(%edi,%eax), %ebx<br>
&gt; +             movl    dsPrev(%edx), %edi<br>
&gt; +             movl    %ebx, scanend(%esp)<br>
&gt; +             movl    chainlenwmask(%esp), %edx<br>
&gt; +             jmp     LookupLoop<br>
&gt; +<br>
&gt; +/* Accept the current string, with the maximum possible length.              */<br>
&gt; +<br>
&gt; +LenMaximum:  movl    deflatestate(%esp), %edx<br>
&gt; +             movl    $MAX_MATCH, bestlen(%esp)<br>
&gt; +             movl    %ecx, dsMatchStart(%edx)<br>
&gt; +<br>
&gt; +/* if ((uInt)best_len &lt;= s-&gt;lookahead) return (uInt)best_len;                */<br>
&gt; +/* return s-&gt;lookahead;                                                      */<br>
&gt; +<br>
&gt; +LeaveNow:<br>
&gt; +             movl    deflatestate(%esp), %edx<br>
&gt; +             movl    bestlen(%esp), %ebx<br>
&gt; +             movl    dsLookahead(%edx), %eax<br>
&gt; +             cmpl    %eax, %ebx<br>
&gt; +             jg      LookaheadRet<br>
&gt; +             movl    %ebx, %eax<br>
&gt; +LookaheadRet:<br>
&gt; +<br>
&gt; +/* Restore the stack and return from whence we came.                 */<br>
&gt; +<br>
&gt; +             addl    $LocalVarsSize, %esp<br>
&gt; +             .cfi_def_cfa_offset 20<br>
&gt; +             popl    %ebx<br>
&gt; +             .cfi_def_cfa_offset 16<br>
&gt; +             popl    %esi<br>
&gt; +             .cfi_def_cfa_offset 12<br>
&gt; +             popl    %edi<br>
&gt; +             .cfi_def_cfa_offset 8<br>
&gt; +             popl    %ebp<br>
&gt; +             .cfi_def_cfa_offset 4<br>
&gt; +.cfi_endproc<br>
&gt; +match_init:  ret<br>
&gt; diff --git a/sys/dev/ice/ice_sriov.c b/sys/dev/ice/ice_sriov.c<br>
&gt; new file mode 100644<br>
&gt; index 000000000000..c0521e667fa2<br>
&gt; --- /dev/null<br>
&gt; +++ b/sys/dev/ice/ice_sriov.c<br>
&gt; @@ -0,0 +1,595 @@<br>
&gt; +/* SPDX-License-Identifier: BSD-3-Clause */<br>
&gt; +/*  Copyright (c) 2021, Intel Corporation<br>
&gt; + *  All rights reserved.<br>
&gt; + *<br>
&gt; + *  Redistribution and use in source and binary forms, with or without<br>
&gt; + *  modification, are permitted provided that the following conditions are met:<br>
&gt; + *<br>
&gt; + *   1. Redistributions of source code must retain the above copyright notice,<br>
&gt; + *      this list of conditions and the following disclaimer.<br>
&gt; + *<br>
&gt; + *   2. Redistributions in binary form must reproduce the above copyright<br>
&gt; + *      notice, this list of conditions and the following disclaimer in the<br>
&gt; + *      documentation and/or other materials provided with the distribution.<br>
&gt; + *<br>
&gt; + *   3. Neither the name of the Intel Corporation nor the names of its<br>
&gt; + *      contributors may be used to endorse or promote products derived from<br>
&gt; + *      this software without specific prior written permission.<br>
&gt; + *<br>
&gt; + *  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot;<br>
&gt; + *  AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE<br>
&gt; + *  IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE<br>
&gt; + *  ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE<br>
&gt; + *  LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR<br>
&gt; + *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF<br>
&gt; + *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS<br>
&gt; + *  INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN<br>
&gt; + *  CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)<br>
&gt; + *  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE<br>
&gt; + *  POSSIBILITY OF SUCH DAMAGE.<br>
&gt; + */<br>
&gt; +<br>
&gt; +#include &quot;ice_common.h&quot;<br>
&gt; +#include &quot;ice_sriov.h&quot;<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * ice_aq_send_msg_to_vf<br>
&gt; + * @hw: pointer to the hardware structure<br>
&gt; + * @vfid: VF ID to send msg<br>
&gt; + * @v_opcode: opcodes for VF-PF communication<br>
&gt; + * @v_retval: return error code<br>
&gt; + * @msg: pointer to the msg buffer<br>
&gt; + * @msglen: msg length<br>
&gt; + * @cd: pointer to command details<br>
&gt; + *<br>
&gt; + * Send a message to the VF driver (0x0802) using the mailbox<br>
&gt; + * queue; the message is sent asynchronously via the<br>
&gt; + * ice_sq_send_cmd() function.<br>
&gt; + */<br>
&gt; +enum ice_status<br>
&gt; +ice_aq_send_msg_to_vf(struct ice_hw *hw, u16 vfid, u32 v_opcode, u32 v_retval,<br>
&gt; +                   u8 *msg, u16 msglen, struct ice_sq_cd *cd)<br>
&gt; +{<br>
&gt; +     struct ice_aqc_pf_vf_msg *cmd;<br>
&gt; +     struct ice_aq_desc desc;<br>
&gt; +<br>
&gt; +     ice_fill_dflt_direct_cmd_desc(&amp;desc, ice_mbx_opc_send_msg_to_vf);<br>
&gt; +<br>
&gt; +     cmd = &amp;desc.params.virt;<br>
&gt; +     cmd-&gt;id = CPU_TO_LE32(vfid);<br>
&gt; +<br>
&gt; +     desc.cookie_high = CPU_TO_LE32(v_opcode);<br>
&gt; +     desc.cookie_low = CPU_TO_LE32(v_retval);<br>
&gt; +<br>
&gt; +     if (msglen)<br>
&gt; +             desc.flags |= CPU_TO_LE16(ICE_AQ_FLAG_RD);<br>
&gt; +<br>
&gt; +     return ice_sq_send_cmd(hw, &amp;hw-&gt;mailboxq, &amp;desc, msg, msglen, cd);<br>
&gt; +}<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * ice_aq_send_msg_to_pf<br>
&gt; + * @hw: pointer to the hardware structure<br>
&gt; + * @v_opcode: opcodes for VF-PF communication<br>
&gt; + * @v_retval: return error code<br>
&gt; + * @msg: pointer to the msg buffer<br>
&gt; + * @msglen: msg length<br>
&gt; + * @cd: pointer to command details<br>
&gt; + *<br>
&gt; + * Send message to PF driver using mailbox queue. By default, this<br>
&gt; + * message is sent asynchronously, i.e. ice_sq_send_cmd()<br>
&gt; + * does not wait for completion before returning.<br>
&gt; + */<br>
&gt; +enum ice_status<br>
&gt; +ice_aq_send_msg_to_pf(struct ice_hw *hw, enum virtchnl_ops v_opcode,<br>
&gt; +                   enum ice_status v_retval, u8 *msg, u16 msglen,<br>
&gt; +                   struct ice_sq_cd *cd)<br>
&gt; +{<br>
&gt; +     struct ice_aq_desc desc;<br>
&gt; +<br>
&gt; +     ice_fill_dflt_direct_cmd_desc(&amp;desc, ice_mbx_opc_send_msg_to_pf);<br>
&gt; +     desc.cookie_high = CPU_TO_LE32(v_opcode);<br>
&gt; +     desc.cookie_low = CPU_TO_LE32(v_retval);<br>
&gt; +<br>
&gt; +     if (msglen)<br>
&gt; +             desc.flags |= CPU_TO_LE16(ICE_AQ_FLAG_RD);<br>
&gt; +<br>
&gt; +     return ice_sq_send_cmd(hw, &amp;hw-&gt;mailboxq, &amp;desc, msg, msglen, cd);<br>
&gt; +}<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * ice_conv_link_speed_to_virtchnl<br>
&gt; + * @adv_link_support: determines the format of the returned link speed<br>
&gt; + * @link_speed: variable containing the link_speed to be converted<br>
&gt; + *<br>
&gt; + * Convert link speed supported by HW to link speed supported by virtchnl.<br>
&gt; + * If adv_link_support is true, then return link speed in Mbps. Else return<br>
&gt; + * link speed as a VIRTCHNL_LINK_SPEED_* cast to a u32. Note that the caller<br>
&gt; + * needs to cast back to an enum virtchnl_link_speed in the case where<br>
&gt; + * adv_link_support is false, but when adv_link_support is true the caller can<br>
&gt; + * expect the speed in Mbps.<br>
&gt; + */<br>
&gt; +u32 ice_conv_link_speed_to_virtchnl(bool adv_link_support, u16 link_speed)<br>
&gt; +{<br>
&gt; +     u32 speed;<br>
&gt; +<br>
&gt; +     if (adv_link_support)<br>
&gt; +             switch (link_speed) {<br>
&gt; +             case ICE_AQ_LINK_SPEED_10MB:<br>
&gt; +                     speed = ICE_LINK_SPEED_10MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_100MB:<br>
&gt; +                     speed = ICE_LINK_SPEED_100MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_1000MB:<br>
&gt; +                     speed = ICE_LINK_SPEED_1000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_2500MB:<br>
&gt; +                     speed = ICE_LINK_SPEED_2500MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_5GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_5000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_10GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_10000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_20GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_20000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_25GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_25000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_40GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_40000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_50GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_50000MBPS;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_100GB:<br>
&gt; +                     speed = ICE_LINK_SPEED_100000MBPS;<br>
&gt; +                     break;<br>
&gt; +             default:<br>
&gt; +                     speed = ICE_LINK_SPEED_UNKNOWN;<br>
&gt; +                     break;<br>
&gt; +             }<br>
&gt; +     else<br>
&gt; +             /* Virtchnl speeds are not defined for every speed supported in<br>
&gt; +              * the hardware. To maintain compatibility with older AVF<br>
&gt; +              * drivers, while reporting the speed the new speed values are<br>
&gt; +              * resolved to the closest known virtchnl speeds<br>
&gt; +              */<br>
&gt; +             switch (link_speed) {<br>
&gt; +             case ICE_AQ_LINK_SPEED_10MB:<br>
&gt; +             case ICE_AQ_LINK_SPEED_100MB:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_100MB;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_1000MB:<br>
&gt; +             case ICE_AQ_LINK_SPEED_2500MB:<br>
&gt; +             case ICE_AQ_LINK_SPEED_5GB:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_1GB;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_10GB:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_10GB;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_20GB:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_20GB;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_25GB:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_25GB;<br>
&gt; +                     break;<br>
&gt; +             case ICE_AQ_LINK_SPEED_40GB:<br>
&gt; +             case ICE_AQ_LINK_SPEED_50GB:<br>
&gt; +             case ICE_AQ_LINK_SPEED_100GB:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_40GB;<br>
&gt; +                     break;<br>
&gt; +             default:<br>
&gt; +                     speed = (u32)VIRTCHNL_LINK_SPEED_UNKNOWN;<br>
&gt; +                     break;<br>
&gt; +             }<br>
&gt; +<br>
&gt; +     return speed;<br>
&gt; +}<br>
&gt; +<br>
&gt; +/* The mailbox overflow detection algorithm helps to check if there<br>
&gt; + * is a possibility of a malicious VF transmitting too many MBX messages to the<br>
&gt; + * PF.<br>
&gt; + * 1. The mailbox snapshot structure, ice_mbx_snapshot, is initialized during<br>
&gt; + * driver initialization in ice_init_hw() using ice_mbx_init_snapshot().<br>
&gt; + * The struct ice_mbx_snapshot helps to track and traverse a static window of<br>
&gt; + * messages within the mailbox queue while looking for a malicious VF.<br>
&gt; + *<br>
&gt; + * 2. When the caller starts processing its mailbox queue in response to an<br>
&gt; + * interrupt, the structure ice_mbx_snapshot is expected to be cleared before<br>
&gt; + * the algorithm can be run for the first time for that interrupt. This can be<br>
&gt; + * done via ice_mbx_reset_snapshot().<br>
&gt; + *<br>
&gt; + * 3. For every message read by the caller from the MBX Queue, the caller must<br>
&gt; + * call the detection algorithm&#39;s entry function ice_mbx_vf_state_handler().<br>
&gt; + * Before every call to ice_mbx_vf_state_handler() the struct ice_mbx_data is<br>
&gt; + * filled as it is required to be passed to the algorithm.<br>
&gt; + *<br>
&gt; + * 4. Every time a message is read from the MBX queue, a VFId is received which<br>
&gt; + * is passed to the state handler. The boolean output is_malvf of the state<br>
&gt; + * handler ice_mbx_vf_state_handler() serves as an indicator to the caller<br>
&gt; + * whether this VF is malicious or not.<br>
&gt; + *<br>
&gt; + * 5. When a VF is identified to be malicious, the caller can send a message<br>
&gt; + * to the system administrator. The caller can invoke ice_mbx_report_malvf()<br>
&gt; + * to help determine if a malicious VF is to be reported or not. This function<br>
&gt; + * requires the caller to maintain a global bitmap to track all malicious VFs<br>
&gt; + * and pass that to ice_mbx_report_malvf() along with the VFID which was identified<br>
&gt; + * to be malicious by ice_mbx_vf_state_handler().<br>
&gt; + *<br>
&gt; + * 6. The global bitmap maintained by PF can be cleared completely if PF is in<br>
&gt; + * reset or the bit corresponding to a VF can be cleared if that VF is in reset.<br>
&gt; + * When a VF is shut down and brought back up, we assume that the new VF<br>
&gt; + * brought up is not malicious and hence report it if found malicious.<br>
&gt; + *<br>
&gt; + * 7. The function ice_mbx_reset_snapshot() is called to reset the information<br>
&gt; + * in ice_mbx_snapshot for every new mailbox interrupt handled.<br>
&gt; + *<br>
&gt; + * 8. The memory allocated for variables in ice_mbx_snapshot is de-allocated<br>
&gt; + * when driver is unloaded.<br>
&gt; + */<br>
&gt; +#define ICE_RQ_DATA_MASK(rq_data) ((rq_data) &amp; PF_MBX_ARQH_ARQH_M)<br>
&gt; +/* Using the highest value for an unsigned 16-bit value 0xFFFF to indicate that<br>
&gt; + * the max messages check must be ignored in the algorithm<br>
&gt; + */<br>
&gt; +#define ICE_IGNORE_MAX_MSG_CNT       0xFFFF<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * ice_mbx_traverse - Pass through mailbox snapshot<br>
&gt; + * @hw: pointer to the HW struct<br>
&gt; + * @new_state: new algorithm state<br>
&gt; + *<br>
&gt; + * Traversing the mailbox static snapshot without checking<br>
&gt; + * for malicious VFs.<br>
&gt; + */<br>
&gt; +static void<br>
&gt; +ice_mbx_traverse(struct ice_hw *hw,<br>
&gt; +              enum ice_mbx_snapshot_state *new_state)<br>
&gt; +{<br>
&gt; +     struct ice_mbx_snap_buffer_data *snap_buf;<br>
&gt; +     u32 num_iterations;<br>
&gt; +<br>
&gt; +     snap_buf = &amp;hw-&gt;mbx_snapshot.mbx_buf;<br>
&gt; +<br>
&gt; +     /* As mailbox buffer is circular, applying a mask<br>
&gt; +      * on the incremented iteration count.<br>
&gt; +      */<br>
&gt; +     num_iterations = ICE_RQ_DATA_MASK(++snap_buf-&gt;num_iterations);<br>
&gt; +<br>
&gt; +     /* Checking either of the below conditions to exit snapshot traversal:<br>
&gt; +      * Condition-1: If the number of iterations in the mailbox is equal to<br>
&gt; +      * the mailbox head which would indicate that we have reached the end<br>
&gt; +      * of the static snapshot.<br>
&gt; +      * Condition-2: If the maximum messages serviced in the mailbox for a<br>
&gt; +      * given interrupt is the highest possible value then there is no need<br>
&gt; +      * to check if the number of messages processed is equal to it. If not<br>
&gt; +      * check if the number of messages processed is greater than or equal<br>
&gt; +      * to the maximum number of mailbox entries serviced in current work item.<br>
&gt; +      */<br>
&gt; +     if (num_iterations == snap_buf-&gt;head ||<br>
&gt; +         (snap_buf-&gt;max_num_msgs_mbx &lt; ICE_IGNORE_MAX_MSG_CNT &amp;&amp;<br>
&gt; +          ++snap_buf-&gt;num_msg_proc &gt;= snap_buf-&gt;max_num_msgs_mbx))<br>
&gt; +             *new_state = ICE_MAL_VF_DETECT_STATE_NEW_SNAPSHOT;<br>
&gt; +}<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * ice_mbx_detect_malvf - Detect malicious VF in snapshot<br>
&gt; + * @hw: pointer to the HW struct<br>
&gt; + * @vf_id: relative virtual function ID<br>
&gt; + * @new_state: new algorithm state<br>
&gt; + * @is_malvf: boolean output to indicate if VF is malicious<br>
&gt; + *<br>
&gt; + * This function tracks the number of asynchronous messages<br>
&gt; + * sent per VF and marks the VF as malicious if it exceeds<br>
&gt; + * the permissible number of messages to send.<br>
&gt; + */<br>
&gt; +static enum ice_status<br>
&gt; +ice_mbx_detect_malvf(struct ice_hw *hw, u16 vf_id,<br>
&gt; +                  enum ice_mbx_snapshot_state *new_state,<br>
&gt; +                  bool *is_malvf)<br>
&gt; +{<br>
&gt; +     struct ice_mbx_snapshot *snap = &amp;hw-&gt;mbx_snapshot;<br>
&gt; +<br>
&gt; +     if (vf_id &gt;= snap-&gt;mbx_vf.vfcntr_len)<br>
&gt; +             return ICE_ERR_OUT_OF_RANGE;<br>
&gt; +<br>
&gt; +     /* increment the message count in the VF array */<br>
&gt; +     snap-&gt;mbx_vf.vf_cntr[vf_id]++;<br>
&gt; +<br>
&gt; +     if (snap-&gt;mbx_vf.vf_cntr[vf_id] &gt;= ICE_ASYNC_VF_MSG_THRESHOLD)<br>
&gt; +             *is_malvf = true;<br>
&gt; +<br>
&gt; +     /* continue to iterate through the mailbox snapshot */<br>
&gt; +     ice_mbx_traverse(hw, new_state);<br>
&gt; +<br>
&gt; +     return ICE_SUCCESS;<br>
&gt; +}<br>
&gt; +<br>
&gt; +/**<br>
&gt; + * ice_mbx_reset_snapshot - Reset mailbox snapshot structure<br>
&gt; + * @snap: pointer to mailbox snapshot structure in the ice_hw struct<br>
&gt; + *<br>
&gt; + * Reset the mailbox snapshot structure and clear VF counter array.<br>
&gt; + */<br>
&gt; +static void ice_mbx_reset_snapshot(struct ice_mbx_snapshot *snap)<br>
&gt; *** 15611 LINES SKIPPED ***<br>
<br>
<br>
<br>
</blockquote></div></div></div>

Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?CANCZdfpk7dSiuYaU42cFXrhqMsonbPrQrjzTDeWL=vvCnoHMxA>