summaryrefslogtreecommitdiff
path: root/lib/dpif-netdev-lookup.c
blob: 4c1379aa54cc68452d71364888411011df345abf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
/*
 * Copyright (c) 2020 Intel Corporation.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include <config.h>
#include <errno.h>
#include <inttypes.h>
#include "dpif-netdev-lookup.h"

#include "cpu.h"
#include "openvswitch/vlog.h"

VLOG_DEFINE_THIS_MODULE(dpif_netdev_lookup);
/* Compile-time gate for the AVX512 lookup implementation in this file.  It is
 * nonzero only when every build-time macro listed below is nonzero; inside
 * '#if', a macro that is not defined at all evaluates to 0, so a missing
 * macro disables the AVX512 code rather than breaking the build. */
#define DPCLS_IMPL_AVX512_CHECK (__x86_64__ && HAVE_AVX512F \
    && HAVE_LD_AVX512_GOOD && HAVE_AVX512BW && __SSE4_2__)

#if DPCLS_IMPL_AVX512_CHECK
/* Runtime probe wrapper for the AVX512 gather lookup implementation.
 *
 * The inner probe is consulted only when the running CPU reports both the
 * AVX512F and the BMI2 instruction sets; it is handed 'u0_bits', 'u1_bits'
 * and a flag saying whether VPOPCNTDQ is also reported.  When either required
 * instruction set is missing, NULL is returned and the inner probe is not
 * called. */
static dpcls_subtable_lookup_func
dpcls_subtable_avx512_gather_probe(uint32_t u0_bits, uint32_t u1_bits)
{
    if (cpu_has_isa(OVS_CPU_ISA_X86_AVX512F)
        && cpu_has_isa(OVS_CPU_ISA_X86_BMI2)) {
        return dpcls_subtable_avx512_gather_probe__(
            u0_bits, u1_bits, cpu_has_isa(OVS_CPU_ISA_X86_VPOPCNTDQ));
    }

    return NULL;
}
#endif

/* Initial priority of the autovalidator implementation.
 *
 * The autovalidator is not the default lookup implementation unless
 * DPCLS_AUTOVALIDATOR_DEFAULT is defined at compile time.  That build-time
 * switch exists so that all unit tests can transparently run with the
 * autovalidator.  In a normal build it starts at priority 0, and the user may
 * still enable it at runtime with the usual "prio-set" command. */
#ifdef DPCLS_AUTOVALIDATOR_DEFAULT
#define DPCLS_AUTOVALIDATOR_PRIO 255
#else
#define DPCLS_AUTOVALIDATOR_PRIO 0
#endif

/* Table of the lookup implementations available in this build. */
static struct dpcls_subtable_lookup_info_t subtable_lookups[] = {
    /* Autovalidator; see DPCLS_AUTOVALIDATOR_PRIO for its starting
     * priority. */
    { .name = "autovalidator",
      .probe = dpcls_subtable_autovalidator_probe,
      .prio = DPCLS_AUTOVALIDATOR_PRIO,
      .usage_cnt = ATOMIC_COUNT_INIT(0), },

    /* Default implementation, written in scalar C. */
    { .name = "generic",
      .probe = dpcls_subtable_generic_probe,
      .prio = 1,
      .usage_cnt = ATOMIC_COUNT_INIT(0), },

#if DPCLS_IMPL_AVX512_CHECK
    /* Present only in x86_64 builds where OVS core is built with SSE 4.2. */
    { .name = "avx512_gather",
      .probe = dpcls_subtable_avx512_gather_probe,
      .prio = 0,
      .usage_cnt = ATOMIC_COUNT_INIT(0), },
#else
    /* AVX512 is left out of this build because its compile-time requirements
     * were not met.  Possible causes:
     *  1) Core OVS was not compiled with the SSE4.2 instruction set.  SSE4.2
     *     is needed for the CRC32 instructions used for high-performance
     *     hashing.  Consider running ./configure for OVS with -msse4.2 (or
     *     newer) to enable CRC32 hashing and higher performance.
     *  2) The assembler shipped in binutils 2.30 and 2.31 miscompiles AVX512
     *     assembly.  A compile-time probe detects this and leaves
     *     HAVE_LD_AVX512_GOOD unset when the problem is found.  Upgrade
     *     binutils, or backport this binutils fix commit:
     *     2069ccaf8dc28ea699bd901fdd35d90613e4402a
     */
#endif
};

/* Gives the caller access to the table of lookup implementations.
 *
 * When 'out_ptr' is nonnull, '*out_ptr' is pointed at the first table entry
 * and the number of entries is returned.  When 'out_ptr' is NULL nothing is
 * written and -1 is returned. */
int
dpcls_subtable_lookup_info_get(struct dpcls_subtable_lookup_info_t **out_ptr)
{
    int n_impls = -1;

    if (out_ptr) {
        *out_ptr = subtable_lookups;
        n_impls = ARRAY_SIZE(subtable_lookups);
    }

    return n_impls;
}

/* Sets the priority of the lookup implementation called 'name'.
 *
 * The implementation table is scanned in order for the first entry whose name
 * compares equal to 'name'; that entry's priority is overwritten with
 * 'priority' and the change is logged.
 *
 * Returns 0 if an entry was updated, or -EINVAL if 'name' is NULL or does not
 * match any entry. */
int
dpcls_subtable_set_prio(const char *name, uint8_t priority)
{
    /* Neither strcmp() nor the "%s" conversions below may be given NULL. */
    if (!name) {
        return -EINVAL;
    }

    for (size_t i = 0; i < ARRAY_SIZE(subtable_lookups); i++) {
        if (strcmp(name, subtable_lookups[i].name) == 0) {
            subtable_lookups[i].prio = priority;
            VLOG_INFO("Subtable function '%s' set priority to %d\n",
                      name, priority);
            return 0;
        }
    }

    VLOG_WARN("Subtable function '%s' not found, failed to set priority\n",
              name);
    return -EINVAL;
}

/* Picks the lookup function to use for a subtable.
 *
 * Table entries are visited in order.  An entry is probed with
 * 'u0_bit_count' and 'u1_bit_count' only if its priority is strictly greater
 * than that of the best entry accepted so far, and it is accepted only if its
 * probe returns a nonnull function.  Consequently, among entries of equal
 * priority the earliest one in the table wins.
 *
 * If 'info' is nonnull, '*info' is set to the accepted table entry.
 *
 * Returns the function produced by the accepted entry's probe.  Asserts if no
 * entry was accepted. */
dpcls_subtable_lookup_func
dpcls_subtable_get_best_impl(uint32_t u0_bit_count, uint32_t u1_bit_count,
                             struct dpcls_subtable_lookup_info_t **info)
{
    struct dpcls_subtable_lookup_info_t *best_info = NULL;
    dpcls_subtable_lookup_func best_func = NULL;
    int prio = -1;   /* Below every valid priority, so the first hit wins. */

    /* Iterate over each subtable impl, and keep the highest priority one. */
    for (size_t i = 0; i < ARRAY_SIZE(subtable_lookups); i++) {
        struct dpcls_subtable_lookup_info_t *impl_info = &subtable_lookups[i];
        dpcls_subtable_lookup_func probed_func;

        /* Cannot beat the current best; skip without probing. */
        if (impl_info->prio <= prio) {
            continue;
        }

        probed_func = impl_info->probe(u0_bit_count, u1_bit_count);
        if (!probed_func) {
            continue;
        }

        best_func = probed_func;
        best_info = impl_info;
        prio = impl_info->prio;
    }

    /* Programming error - we must always return a valid func ptr. */
    ovs_assert(best_func != NULL && best_info != NULL);

    /* The bit counts are uint32_t, so print them with PRIu32, not "%d". */
    VLOG_DBG("Subtable lookup function '%s' with units (%"PRIu32",%"PRIu32
             "), priority %d\n",
             best_info->name, u0_bit_count, u1_bit_count, prio);

    if (info) {
        *info = best_info;
    }
    return best_func;
}

/* Increments the usage counter of 'info'.  Does nothing when 'info' is
 * NULL. */
void
dpcls_info_inc_usage(struct dpcls_subtable_lookup_info_t *info)
{
    if (!info) {
        return;
    }

    atomic_count_inc(&info->usage_cnt);
}

/* Decrements the usage counter of 'info'.  Does nothing when 'info' is
 * NULL. */
void
dpcls_info_dec_usage(struct dpcls_subtable_lookup_info_t *info)
{
    if (!info) {
        return;
    }

    atomic_count_dec(&info->usage_cnt);
}

/* Appends a human-readable summary of the lookup implementations to 'reply'.
 *
 * A heading line is written first, followed by one line per table entry
 * giving the entry's name, its current usage count and its priority. */
void
dpcls_impl_print_stats(struct ds *reply)
{
    struct dpcls_subtable_lookup_info_t *lookup_funcs = NULL;
    int count = dpcls_subtable_lookup_info_get(&lookup_funcs);

    /* Add all DPCLS functions to reply string. */
    ds_put_cstr(reply, "Available dpcls implementations:\n");

    /* Each line ends with the priority digits, so no "none" placeholder is
     * ever needed before the closing parenthesis. */
    for (int i = 0; i < count; i++) {
        ds_put_format(reply, "  %s (Use count: %d, Priority: %d)\n",
                      lookup_funcs[i].name,
                      atomic_count_get(&lookup_funcs[i].usage_cnt),
                      lookup_funcs[i].prio);
    }
}