1d9ae7f2bSJakub Kicinski /* 2854dc87dSJiong Wang * Copyright (C) 2016-2017 Netronome Systems, Inc. 3d9ae7f2bSJakub Kicinski * 4d9ae7f2bSJakub Kicinski * This software is dual licensed under the GNU General License Version 2, 5d9ae7f2bSJakub Kicinski * June 1991 as shown in the file COPYING in the top-level directory of this 6d9ae7f2bSJakub Kicinski * source tree or the BSD 2-Clause License provided below. You have the 7d9ae7f2bSJakub Kicinski * option to license this software under the complete terms of either license. 8d9ae7f2bSJakub Kicinski * 9d9ae7f2bSJakub Kicinski * The BSD 2-Clause License: 10d9ae7f2bSJakub Kicinski * 11d9ae7f2bSJakub Kicinski * Redistribution and use in source and binary forms, with or 12d9ae7f2bSJakub Kicinski * without modification, are permitted provided that the following 13d9ae7f2bSJakub Kicinski * conditions are met: 14d9ae7f2bSJakub Kicinski * 15d9ae7f2bSJakub Kicinski * 1. Redistributions of source code must retain the above 16d9ae7f2bSJakub Kicinski * copyright notice, this list of conditions and the following 17d9ae7f2bSJakub Kicinski * disclaimer. 18d9ae7f2bSJakub Kicinski * 19d9ae7f2bSJakub Kicinski * 2. Redistributions in binary form must reproduce the above 20d9ae7f2bSJakub Kicinski * copyright notice, this list of conditions and the following 21d9ae7f2bSJakub Kicinski * disclaimer in the documentation and/or other materials 22d9ae7f2bSJakub Kicinski * provided with the distribution. 23d9ae7f2bSJakub Kicinski * 24d9ae7f2bSJakub Kicinski * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 25d9ae7f2bSJakub Kicinski * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 26d9ae7f2bSJakub Kicinski * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 27d9ae7f2bSJakub Kicinski * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 28d9ae7f2bSJakub Kicinski * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 29d9ae7f2bSJakub Kicinski * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 30d9ae7f2bSJakub Kicinski * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 31d9ae7f2bSJakub Kicinski * SOFTWARE. 32d9ae7f2bSJakub Kicinski */ 33d9ae7f2bSJakub Kicinski 34d9ae7f2bSJakub Kicinski #define pr_fmt(fmt) "NFP net bpf: " fmt 35d9ae7f2bSJakub Kicinski 36d9ae7f2bSJakub Kicinski #include <linux/kernel.h> 37d9ae7f2bSJakub Kicinski #include <linux/bpf.h> 38d9ae7f2bSJakub Kicinski #include <linux/filter.h> 39d9ae7f2bSJakub Kicinski #include <linux/pkt_cls.h> 40d9ae7f2bSJakub Kicinski #include <linux/unistd.h> 41d9ae7f2bSJakub Kicinski 42d9ae7f2bSJakub Kicinski #include "main.h" 43d9ae7f2bSJakub Kicinski #include "../nfp_asm.h" 44d9ae7f2bSJakub Kicinski 45d9ae7f2bSJakub Kicinski /* --- NFP prog --- */ 46d9ae7f2bSJakub Kicinski /* Foreach "multiple" entries macros provide pos and next<n> pointers. 47d9ae7f2bSJakub Kicinski * It's safe to modify the next pointers (but not pos). 
48d9ae7f2bSJakub Kicinski */ 49d9ae7f2bSJakub Kicinski #define nfp_for_each_insn_walk2(nfp_prog, pos, next) \ 50d9ae7f2bSJakub Kicinski for (pos = list_first_entry(&(nfp_prog)->insns, typeof(*pos), l), \ 51d9ae7f2bSJakub Kicinski next = list_next_entry(pos, l); \ 52d9ae7f2bSJakub Kicinski &(nfp_prog)->insns != &pos->l && \ 53d9ae7f2bSJakub Kicinski &(nfp_prog)->insns != &next->l; \ 54d9ae7f2bSJakub Kicinski pos = nfp_meta_next(pos), \ 55d9ae7f2bSJakub Kicinski next = nfp_meta_next(pos)) 56d9ae7f2bSJakub Kicinski 57d9ae7f2bSJakub Kicinski #define nfp_for_each_insn_walk3(nfp_prog, pos, next, next2) \ 58d9ae7f2bSJakub Kicinski for (pos = list_first_entry(&(nfp_prog)->insns, typeof(*pos), l), \ 59d9ae7f2bSJakub Kicinski next = list_next_entry(pos, l), \ 60d9ae7f2bSJakub Kicinski next2 = list_next_entry(next, l); \ 61d9ae7f2bSJakub Kicinski &(nfp_prog)->insns != &pos->l && \ 62d9ae7f2bSJakub Kicinski &(nfp_prog)->insns != &next->l && \ 63d9ae7f2bSJakub Kicinski &(nfp_prog)->insns != &next2->l; \ 64d9ae7f2bSJakub Kicinski pos = nfp_meta_next(pos), \ 65d9ae7f2bSJakub Kicinski next = nfp_meta_next(pos), \ 66d9ae7f2bSJakub Kicinski next2 = nfp_meta_next(next)) 67d9ae7f2bSJakub Kicinski 68d9ae7f2bSJakub Kicinski static bool 69d9ae7f2bSJakub Kicinski nfp_meta_has_prev(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 70d9ae7f2bSJakub Kicinski { 71d9ae7f2bSJakub Kicinski return meta->l.prev != &nfp_prog->insns; 72d9ae7f2bSJakub Kicinski } 73d9ae7f2bSJakub Kicinski 74d9ae7f2bSJakub Kicinski static void nfp_prog_push(struct nfp_prog *nfp_prog, u64 insn) 75d9ae7f2bSJakub Kicinski { 76d9ae7f2bSJakub Kicinski if (nfp_prog->__prog_alloc_len == nfp_prog->prog_len) { 77d9ae7f2bSJakub Kicinski nfp_prog->error = -ENOSPC; 78d9ae7f2bSJakub Kicinski return; 79d9ae7f2bSJakub Kicinski } 80d9ae7f2bSJakub Kicinski 81d9ae7f2bSJakub Kicinski nfp_prog->prog[nfp_prog->prog_len] = insn; 82d9ae7f2bSJakub Kicinski nfp_prog->prog_len++; 83d9ae7f2bSJakub Kicinski } 84d9ae7f2bSJakub Kicinski 
85d9ae7f2bSJakub Kicinski static unsigned int nfp_prog_current_offset(struct nfp_prog *nfp_prog) 86d9ae7f2bSJakub Kicinski { 87d9ae7f2bSJakub Kicinski return nfp_prog->start_off + nfp_prog->prog_len; 88d9ae7f2bSJakub Kicinski } 89d9ae7f2bSJakub Kicinski 90d9ae7f2bSJakub Kicinski static unsigned int 91d9ae7f2bSJakub Kicinski nfp_prog_offset_to_index(struct nfp_prog *nfp_prog, unsigned int offset) 92d9ae7f2bSJakub Kicinski { 93d9ae7f2bSJakub Kicinski return offset - nfp_prog->start_off; 94d9ae7f2bSJakub Kicinski } 95d9ae7f2bSJakub Kicinski 96d9ae7f2bSJakub Kicinski /* --- Emitters --- */ 97d9ae7f2bSJakub Kicinski static void 98d9ae7f2bSJakub Kicinski __emit_cmd(struct nfp_prog *nfp_prog, enum cmd_tgt_map op, 995468a8b9SJakub Kicinski u8 mode, u8 xfer, u8 areg, u8 breg, u8 size, bool sync, bool indir) 100d9ae7f2bSJakub Kicinski { 101d9ae7f2bSJakub Kicinski enum cmd_ctx_swap ctx; 102d9ae7f2bSJakub Kicinski u64 insn; 103d9ae7f2bSJakub Kicinski 104d9ae7f2bSJakub Kicinski if (sync) 105d9ae7f2bSJakub Kicinski ctx = CMD_CTX_SWAP; 106d9ae7f2bSJakub Kicinski else 107d9ae7f2bSJakub Kicinski ctx = CMD_CTX_NO_SWAP; 108d9ae7f2bSJakub Kicinski 109d9ae7f2bSJakub Kicinski insn = FIELD_PREP(OP_CMD_A_SRC, areg) | 110d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_CTX, ctx) | 111d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_B_SRC, breg) | 112d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_TOKEN, cmd_tgt_act[op].token) | 113d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_XFER, xfer) | 114d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_CNT, size) | 115d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_SIG, sync) | 116d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_TGT_CMD, cmd_tgt_act[op].tgt_cmd) | 1175468a8b9SJakub Kicinski FIELD_PREP(OP_CMD_INDIR, indir) | 118d9ae7f2bSJakub Kicinski FIELD_PREP(OP_CMD_MODE, mode); 119d9ae7f2bSJakub Kicinski 120d9ae7f2bSJakub Kicinski nfp_prog_push(nfp_prog, insn); 121d9ae7f2bSJakub Kicinski } 122d9ae7f2bSJakub Kicinski 123d9ae7f2bSJakub Kicinski static void 1245468a8b9SJakub Kicinski 
emit_cmd_any(struct nfp_prog *nfp_prog, enum cmd_tgt_map op, u8 mode, u8 xfer, 1255468a8b9SJakub Kicinski swreg lreg, swreg rreg, u8 size, bool sync, bool indir) 126d9ae7f2bSJakub Kicinski { 127d9ae7f2bSJakub Kicinski struct nfp_insn_re_regs reg; 128d9ae7f2bSJakub Kicinski int err; 129d9ae7f2bSJakub Kicinski 130d9ae7f2bSJakub Kicinski err = swreg_to_restricted(reg_none(), lreg, rreg, ®, false); 131d9ae7f2bSJakub Kicinski if (err) { 132d9ae7f2bSJakub Kicinski nfp_prog->error = err; 133d9ae7f2bSJakub Kicinski return; 134d9ae7f2bSJakub Kicinski } 135d9ae7f2bSJakub Kicinski if (reg.swap) { 136d9ae7f2bSJakub Kicinski pr_err("cmd can't swap arguments\n"); 137d9ae7f2bSJakub Kicinski nfp_prog->error = -EFAULT; 138d9ae7f2bSJakub Kicinski return; 139d9ae7f2bSJakub Kicinski } 140995e101fSJakub Kicinski if (reg.dst_lmextn || reg.src_lmextn) { 141995e101fSJakub Kicinski pr_err("cmd can't use LMextn\n"); 142995e101fSJakub Kicinski nfp_prog->error = -EFAULT; 143995e101fSJakub Kicinski return; 144995e101fSJakub Kicinski } 145d9ae7f2bSJakub Kicinski 1465468a8b9SJakub Kicinski __emit_cmd(nfp_prog, op, mode, xfer, reg.areg, reg.breg, size, sync, 1475468a8b9SJakub Kicinski indir); 1485468a8b9SJakub Kicinski } 1495468a8b9SJakub Kicinski 1505468a8b9SJakub Kicinski static void 1515468a8b9SJakub Kicinski emit_cmd(struct nfp_prog *nfp_prog, enum cmd_tgt_map op, u8 mode, u8 xfer, 1525468a8b9SJakub Kicinski swreg lreg, swreg rreg, u8 size, bool sync) 1535468a8b9SJakub Kicinski { 1545468a8b9SJakub Kicinski emit_cmd_any(nfp_prog, op, mode, xfer, lreg, rreg, size, sync, false); 155d9ae7f2bSJakub Kicinski } 156d9ae7f2bSJakub Kicinski 157d9ae7f2bSJakub Kicinski static void 1589879a381SJiong Wang emit_cmd_indir(struct nfp_prog *nfp_prog, enum cmd_tgt_map op, u8 mode, u8 xfer, 1599879a381SJiong Wang swreg lreg, swreg rreg, u8 size, bool sync) 1609879a381SJiong Wang { 1619879a381SJiong Wang emit_cmd_any(nfp_prog, op, mode, xfer, lreg, rreg, size, sync, true); 1629879a381SJiong Wang } 
1639879a381SJiong Wang 1649879a381SJiong Wang static void 165d9ae7f2bSJakub Kicinski __emit_br(struct nfp_prog *nfp_prog, enum br_mask mask, enum br_ev_pip ev_pip, 166d9ae7f2bSJakub Kicinski enum br_ctx_signal_state css, u16 addr, u8 defer) 167d9ae7f2bSJakub Kicinski { 168d9ae7f2bSJakub Kicinski u16 addr_lo, addr_hi; 169d9ae7f2bSJakub Kicinski u64 insn; 170d9ae7f2bSJakub Kicinski 171d9ae7f2bSJakub Kicinski addr_lo = addr & (OP_BR_ADDR_LO >> __bf_shf(OP_BR_ADDR_LO)); 172d9ae7f2bSJakub Kicinski addr_hi = addr != addr_lo; 173d9ae7f2bSJakub Kicinski 174d9ae7f2bSJakub Kicinski insn = OP_BR_BASE | 175d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_MASK, mask) | 176d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_EV_PIP, ev_pip) | 177d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_CSS, css) | 178d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_DEFBR, defer) | 179d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_ADDR_LO, addr_lo) | 180d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_ADDR_HI, addr_hi); 181d9ae7f2bSJakub Kicinski 182d9ae7f2bSJakub Kicinski nfp_prog_push(nfp_prog, insn); 183d9ae7f2bSJakub Kicinski } 184d9ae7f2bSJakub Kicinski 185d9ae7f2bSJakub Kicinski static void emit_br_def(struct nfp_prog *nfp_prog, u16 addr, u8 defer) 186d9ae7f2bSJakub Kicinski { 187d9ae7f2bSJakub Kicinski if (defer > 2) { 188d9ae7f2bSJakub Kicinski pr_err("BUG: branch defer out of bounds %d\n", defer); 189d9ae7f2bSJakub Kicinski nfp_prog->error = -EFAULT; 190d9ae7f2bSJakub Kicinski return; 191d9ae7f2bSJakub Kicinski } 192d9ae7f2bSJakub Kicinski __emit_br(nfp_prog, BR_UNC, BR_EV_PIP_UNCOND, BR_CSS_NONE, addr, defer); 193d9ae7f2bSJakub Kicinski } 194d9ae7f2bSJakub Kicinski 195d9ae7f2bSJakub Kicinski static void 196d9ae7f2bSJakub Kicinski emit_br(struct nfp_prog *nfp_prog, enum br_mask mask, u16 addr, u8 defer) 197d9ae7f2bSJakub Kicinski { 198d9ae7f2bSJakub Kicinski __emit_br(nfp_prog, mask, 199d9ae7f2bSJakub Kicinski mask != BR_UNC ? 
BR_EV_PIP_COND : BR_EV_PIP_UNCOND, 200d9ae7f2bSJakub Kicinski BR_CSS_NONE, addr, defer); 201d9ae7f2bSJakub Kicinski } 202d9ae7f2bSJakub Kicinski 203d9ae7f2bSJakub Kicinski static void 204d9ae7f2bSJakub Kicinski __emit_immed(struct nfp_prog *nfp_prog, u16 areg, u16 breg, u16 imm_hi, 205d9ae7f2bSJakub Kicinski enum immed_width width, bool invert, 206995e101fSJakub Kicinski enum immed_shift shift, bool wr_both, 207995e101fSJakub Kicinski bool dst_lmextn, bool src_lmextn) 208d9ae7f2bSJakub Kicinski { 209d9ae7f2bSJakub Kicinski u64 insn; 210d9ae7f2bSJakub Kicinski 211d9ae7f2bSJakub Kicinski insn = OP_IMMED_BASE | 212d9ae7f2bSJakub Kicinski FIELD_PREP(OP_IMMED_A_SRC, areg) | 213d9ae7f2bSJakub Kicinski FIELD_PREP(OP_IMMED_B_SRC, breg) | 214d9ae7f2bSJakub Kicinski FIELD_PREP(OP_IMMED_IMM, imm_hi) | 215d9ae7f2bSJakub Kicinski FIELD_PREP(OP_IMMED_WIDTH, width) | 216d9ae7f2bSJakub Kicinski FIELD_PREP(OP_IMMED_INV, invert) | 217d9ae7f2bSJakub Kicinski FIELD_PREP(OP_IMMED_SHIFT, shift) | 218995e101fSJakub Kicinski FIELD_PREP(OP_IMMED_WR_AB, wr_both) | 219995e101fSJakub Kicinski FIELD_PREP(OP_IMMED_SRC_LMEXTN, src_lmextn) | 220995e101fSJakub Kicinski FIELD_PREP(OP_IMMED_DST_LMEXTN, dst_lmextn); 221d9ae7f2bSJakub Kicinski 222d9ae7f2bSJakub Kicinski nfp_prog_push(nfp_prog, insn); 223d9ae7f2bSJakub Kicinski } 224d9ae7f2bSJakub Kicinski 225d9ae7f2bSJakub Kicinski static void 226b3f868dfSJakub Kicinski emit_immed(struct nfp_prog *nfp_prog, swreg dst, u16 imm, 227d9ae7f2bSJakub Kicinski enum immed_width width, bool invert, enum immed_shift shift) 228d9ae7f2bSJakub Kicinski { 229d9ae7f2bSJakub Kicinski struct nfp_insn_ur_regs reg; 230d9ae7f2bSJakub Kicinski int err; 231d9ae7f2bSJakub Kicinski 232b3f868dfSJakub Kicinski if (swreg_type(dst) == NN_REG_IMM) { 233d9ae7f2bSJakub Kicinski nfp_prog->error = -EFAULT; 234d9ae7f2bSJakub Kicinski return; 235d9ae7f2bSJakub Kicinski } 236d9ae7f2bSJakub Kicinski 237d9ae7f2bSJakub Kicinski err = swreg_to_unrestricted(dst, dst, reg_imm(imm & 0xff), ®); 
238d9ae7f2bSJakub Kicinski if (err) { 239d9ae7f2bSJakub Kicinski nfp_prog->error = err; 240d9ae7f2bSJakub Kicinski return; 241d9ae7f2bSJakub Kicinski } 242d9ae7f2bSJakub Kicinski 2433239e7bbSJiong Wang /* Use reg.dst when destination is No-Dest. */ 2443239e7bbSJiong Wang __emit_immed(nfp_prog, 2453239e7bbSJiong Wang swreg_type(dst) == NN_REG_NONE ? reg.dst : reg.areg, 2463239e7bbSJiong Wang reg.breg, imm >> 8, width, invert, shift, 2473239e7bbSJiong Wang reg.wr_both, reg.dst_lmextn, reg.src_lmextn); 248d9ae7f2bSJakub Kicinski } 249d9ae7f2bSJakub Kicinski 250d9ae7f2bSJakub Kicinski static void 251d9ae7f2bSJakub Kicinski __emit_shf(struct nfp_prog *nfp_prog, u16 dst, enum alu_dst_ab dst_ab, 252d9ae7f2bSJakub Kicinski enum shf_sc sc, u8 shift, 253995e101fSJakub Kicinski u16 areg, enum shf_op op, u16 breg, bool i8, bool sw, bool wr_both, 254995e101fSJakub Kicinski bool dst_lmextn, bool src_lmextn) 255d9ae7f2bSJakub Kicinski { 256d9ae7f2bSJakub Kicinski u64 insn; 257d9ae7f2bSJakub Kicinski 258d9ae7f2bSJakub Kicinski if (!FIELD_FIT(OP_SHF_SHIFT, shift)) { 259d9ae7f2bSJakub Kicinski nfp_prog->error = -EFAULT; 260d9ae7f2bSJakub Kicinski return; 261d9ae7f2bSJakub Kicinski } 262d9ae7f2bSJakub Kicinski 263d9ae7f2bSJakub Kicinski if (sc == SHF_SC_L_SHF) 264d9ae7f2bSJakub Kicinski shift = 32 - shift; 265d9ae7f2bSJakub Kicinski 266d9ae7f2bSJakub Kicinski insn = OP_SHF_BASE | 267d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_A_SRC, areg) | 268d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_SC, sc) | 269d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_B_SRC, breg) | 270d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_I8, i8) | 271d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_SW, sw) | 272d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_DST, dst) | 273d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_SHIFT, shift) | 274d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_OP, op) | 275d9ae7f2bSJakub Kicinski FIELD_PREP(OP_SHF_DST_AB, dst_ab) | 276995e101fSJakub Kicinski FIELD_PREP(OP_SHF_WR_AB, wr_both) | 277995e101fSJakub Kicinski 
FIELD_PREP(OP_SHF_SRC_LMEXTN, src_lmextn) | 278995e101fSJakub Kicinski FIELD_PREP(OP_SHF_DST_LMEXTN, dst_lmextn); 279d9ae7f2bSJakub Kicinski 280d9ae7f2bSJakub Kicinski nfp_prog_push(nfp_prog, insn); 281d9ae7f2bSJakub Kicinski } 282d9ae7f2bSJakub Kicinski 283d9ae7f2bSJakub Kicinski static void 284b3f868dfSJakub Kicinski emit_shf(struct nfp_prog *nfp_prog, swreg dst, 285b3f868dfSJakub Kicinski swreg lreg, enum shf_op op, swreg rreg, enum shf_sc sc, u8 shift) 286d9ae7f2bSJakub Kicinski { 287d9ae7f2bSJakub Kicinski struct nfp_insn_re_regs reg; 288d9ae7f2bSJakub Kicinski int err; 289d9ae7f2bSJakub Kicinski 290d9ae7f2bSJakub Kicinski err = swreg_to_restricted(dst, lreg, rreg, ®, true); 291d9ae7f2bSJakub Kicinski if (err) { 292d9ae7f2bSJakub Kicinski nfp_prog->error = err; 293d9ae7f2bSJakub Kicinski return; 294d9ae7f2bSJakub Kicinski } 295d9ae7f2bSJakub Kicinski 296d9ae7f2bSJakub Kicinski __emit_shf(nfp_prog, reg.dst, reg.dst_ab, sc, shift, 297995e101fSJakub Kicinski reg.areg, op, reg.breg, reg.i8, reg.swap, reg.wr_both, 298995e101fSJakub Kicinski reg.dst_lmextn, reg.src_lmextn); 299d9ae7f2bSJakub Kicinski } 300d9ae7f2bSJakub Kicinski 301d9ae7f2bSJakub Kicinski static void 302d9ae7f2bSJakub Kicinski __emit_alu(struct nfp_prog *nfp_prog, u16 dst, enum alu_dst_ab dst_ab, 303995e101fSJakub Kicinski u16 areg, enum alu_op op, u16 breg, bool swap, bool wr_both, 304995e101fSJakub Kicinski bool dst_lmextn, bool src_lmextn) 305d9ae7f2bSJakub Kicinski { 306d9ae7f2bSJakub Kicinski u64 insn; 307d9ae7f2bSJakub Kicinski 308d9ae7f2bSJakub Kicinski insn = OP_ALU_BASE | 309d9ae7f2bSJakub Kicinski FIELD_PREP(OP_ALU_A_SRC, areg) | 310d9ae7f2bSJakub Kicinski FIELD_PREP(OP_ALU_B_SRC, breg) | 311d9ae7f2bSJakub Kicinski FIELD_PREP(OP_ALU_DST, dst) | 312d9ae7f2bSJakub Kicinski FIELD_PREP(OP_ALU_SW, swap) | 313d9ae7f2bSJakub Kicinski FIELD_PREP(OP_ALU_OP, op) | 314d9ae7f2bSJakub Kicinski FIELD_PREP(OP_ALU_DST_AB, dst_ab) | 315995e101fSJakub Kicinski FIELD_PREP(OP_ALU_WR_AB, wr_both) | 
316995e101fSJakub Kicinski FIELD_PREP(OP_ALU_SRC_LMEXTN, src_lmextn) | 317995e101fSJakub Kicinski FIELD_PREP(OP_ALU_DST_LMEXTN, dst_lmextn); 318d9ae7f2bSJakub Kicinski 319d9ae7f2bSJakub Kicinski nfp_prog_push(nfp_prog, insn); 320d9ae7f2bSJakub Kicinski } 321d9ae7f2bSJakub Kicinski 322d9ae7f2bSJakub Kicinski static void 323b3f868dfSJakub Kicinski emit_alu(struct nfp_prog *nfp_prog, swreg dst, 324b3f868dfSJakub Kicinski swreg lreg, enum alu_op op, swreg rreg) 325d9ae7f2bSJakub Kicinski { 326d9ae7f2bSJakub Kicinski struct nfp_insn_ur_regs reg; 327d9ae7f2bSJakub Kicinski int err; 328d9ae7f2bSJakub Kicinski 329d9ae7f2bSJakub Kicinski err = swreg_to_unrestricted(dst, lreg, rreg, ®); 330d9ae7f2bSJakub Kicinski if (err) { 331d9ae7f2bSJakub Kicinski nfp_prog->error = err; 332d9ae7f2bSJakub Kicinski return; 333d9ae7f2bSJakub Kicinski } 334d9ae7f2bSJakub Kicinski 335d9ae7f2bSJakub Kicinski __emit_alu(nfp_prog, reg.dst, reg.dst_ab, 336995e101fSJakub Kicinski reg.areg, op, reg.breg, reg.swap, reg.wr_both, 337995e101fSJakub Kicinski reg.dst_lmextn, reg.src_lmextn); 338d9ae7f2bSJakub Kicinski } 339d9ae7f2bSJakub Kicinski 340d9ae7f2bSJakub Kicinski static void 341d9ae7f2bSJakub Kicinski __emit_ld_field(struct nfp_prog *nfp_prog, enum shf_sc sc, 342d9ae7f2bSJakub Kicinski u8 areg, u8 bmask, u8 breg, u8 shift, bool imm8, 343995e101fSJakub Kicinski bool zero, bool swap, bool wr_both, 344995e101fSJakub Kicinski bool dst_lmextn, bool src_lmextn) 345d9ae7f2bSJakub Kicinski { 346d9ae7f2bSJakub Kicinski u64 insn; 347d9ae7f2bSJakub Kicinski 348d9ae7f2bSJakub Kicinski insn = OP_LDF_BASE | 349d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_A_SRC, areg) | 350d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_SC, sc) | 351d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_B_SRC, breg) | 352d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_I8, imm8) | 353d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_SW, swap) | 354d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_ZF, zero) | 355d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_BMASK, bmask) | 
356d9ae7f2bSJakub Kicinski FIELD_PREP(OP_LDF_SHF, shift) | 357995e101fSJakub Kicinski FIELD_PREP(OP_LDF_WR_AB, wr_both) | 358995e101fSJakub Kicinski FIELD_PREP(OP_LDF_SRC_LMEXTN, src_lmextn) | 359995e101fSJakub Kicinski FIELD_PREP(OP_LDF_DST_LMEXTN, dst_lmextn); 360d9ae7f2bSJakub Kicinski 361d9ae7f2bSJakub Kicinski nfp_prog_push(nfp_prog, insn); 362d9ae7f2bSJakub Kicinski } 363d9ae7f2bSJakub Kicinski 364d9ae7f2bSJakub Kicinski static void 365bc8c80a8SJakub Kicinski emit_ld_field_any(struct nfp_prog *nfp_prog, swreg dst, u8 bmask, swreg src, 366bc8c80a8SJakub Kicinski enum shf_sc sc, u8 shift, bool zero) 367d9ae7f2bSJakub Kicinski { 368d9ae7f2bSJakub Kicinski struct nfp_insn_re_regs reg; 369d9ae7f2bSJakub Kicinski int err; 370d9ae7f2bSJakub Kicinski 3712de1be1dSJakub Kicinski /* Note: ld_field is special as it uses one of the src regs as dst */ 3722de1be1dSJakub Kicinski err = swreg_to_restricted(dst, dst, src, ®, true); 373d9ae7f2bSJakub Kicinski if (err) { 374d9ae7f2bSJakub Kicinski nfp_prog->error = err; 375d9ae7f2bSJakub Kicinski return; 376d9ae7f2bSJakub Kicinski } 377d9ae7f2bSJakub Kicinski 378d9ae7f2bSJakub Kicinski __emit_ld_field(nfp_prog, sc, reg.areg, bmask, reg.breg, shift, 379995e101fSJakub Kicinski reg.i8, zero, reg.swap, reg.wr_both, 380995e101fSJakub Kicinski reg.dst_lmextn, reg.src_lmextn); 381d9ae7f2bSJakub Kicinski } 382d9ae7f2bSJakub Kicinski 383d9ae7f2bSJakub Kicinski static void 384b3f868dfSJakub Kicinski emit_ld_field(struct nfp_prog *nfp_prog, swreg dst, u8 bmask, swreg src, 385d9ae7f2bSJakub Kicinski enum shf_sc sc, u8 shift) 386d9ae7f2bSJakub Kicinski { 387bc8c80a8SJakub Kicinski emit_ld_field_any(nfp_prog, dst, bmask, src, sc, shift, false); 388d9ae7f2bSJakub Kicinski } 389d9ae7f2bSJakub Kicinski 3902df03a50SJakub Kicinski static void 3912df03a50SJakub Kicinski __emit_lcsr(struct nfp_prog *nfp_prog, u16 areg, u16 breg, bool wr, u16 addr, 3922df03a50SJakub Kicinski bool dst_lmextn, bool src_lmextn) 3932df03a50SJakub Kicinski { 
3942df03a50SJakub Kicinski u64 insn; 3952df03a50SJakub Kicinski 3962df03a50SJakub Kicinski insn = OP_LCSR_BASE | 3972df03a50SJakub Kicinski FIELD_PREP(OP_LCSR_A_SRC, areg) | 3982df03a50SJakub Kicinski FIELD_PREP(OP_LCSR_B_SRC, breg) | 3992df03a50SJakub Kicinski FIELD_PREP(OP_LCSR_WRITE, wr) | 4002df03a50SJakub Kicinski FIELD_PREP(OP_LCSR_ADDR, addr) | 4012df03a50SJakub Kicinski FIELD_PREP(OP_LCSR_SRC_LMEXTN, src_lmextn) | 4022df03a50SJakub Kicinski FIELD_PREP(OP_LCSR_DST_LMEXTN, dst_lmextn); 4032df03a50SJakub Kicinski 4042df03a50SJakub Kicinski nfp_prog_push(nfp_prog, insn); 4052df03a50SJakub Kicinski } 4062df03a50SJakub Kicinski 4072df03a50SJakub Kicinski static void emit_csr_wr(struct nfp_prog *nfp_prog, swreg src, u16 addr) 4082df03a50SJakub Kicinski { 4092df03a50SJakub Kicinski struct nfp_insn_ur_regs reg; 4102df03a50SJakub Kicinski int err; 4112df03a50SJakub Kicinski 4122df03a50SJakub Kicinski /* This instruction takes immeds instead of reg_none() for the ignored 4132df03a50SJakub Kicinski * operand, but we can't encode 2 immeds in one instr with our normal 4142df03a50SJakub Kicinski * swreg infra so if param is an immed, we encode as reg_none() and 4152df03a50SJakub Kicinski * copy the immed to both operands. 
4162df03a50SJakub Kicinski */ 4172df03a50SJakub Kicinski if (swreg_type(src) == NN_REG_IMM) { 4182df03a50SJakub Kicinski err = swreg_to_unrestricted(reg_none(), src, reg_none(), ®); 4192df03a50SJakub Kicinski reg.breg = reg.areg; 4202df03a50SJakub Kicinski } else { 4212df03a50SJakub Kicinski err = swreg_to_unrestricted(reg_none(), src, reg_imm(0), ®); 4222df03a50SJakub Kicinski } 4232df03a50SJakub Kicinski if (err) { 4242df03a50SJakub Kicinski nfp_prog->error = err; 4252df03a50SJakub Kicinski return; 4262df03a50SJakub Kicinski } 4272df03a50SJakub Kicinski 4282df03a50SJakub Kicinski __emit_lcsr(nfp_prog, reg.areg, reg.breg, true, addr / 4, 4292df03a50SJakub Kicinski false, reg.src_lmextn); 4302df03a50SJakub Kicinski } 4312df03a50SJakub Kicinski 4321c03e03fSJakub Kicinski static void emit_nop(struct nfp_prog *nfp_prog) 4331c03e03fSJakub Kicinski { 4341c03e03fSJakub Kicinski __emit_immed(nfp_prog, UR_REG_IMM, UR_REG_IMM, 0, 0, 0, 0, 0, 0, 0); 4351c03e03fSJakub Kicinski } 4361c03e03fSJakub Kicinski 437d9ae7f2bSJakub Kicinski /* --- Wrappers --- */ 438d9ae7f2bSJakub Kicinski static bool pack_immed(u32 imm, u16 *val, enum immed_shift *shift) 439d9ae7f2bSJakub Kicinski { 440d9ae7f2bSJakub Kicinski if (!(imm & 0xffff0000)) { 441d9ae7f2bSJakub Kicinski *val = imm; 442d9ae7f2bSJakub Kicinski *shift = IMMED_SHIFT_0B; 443d9ae7f2bSJakub Kicinski } else if (!(imm & 0xff0000ff)) { 444d9ae7f2bSJakub Kicinski *val = imm >> 8; 445d9ae7f2bSJakub Kicinski *shift = IMMED_SHIFT_1B; 446d9ae7f2bSJakub Kicinski } else if (!(imm & 0x0000ffff)) { 447d9ae7f2bSJakub Kicinski *val = imm >> 16; 448d9ae7f2bSJakub Kicinski *shift = IMMED_SHIFT_2B; 449d9ae7f2bSJakub Kicinski } else { 450d9ae7f2bSJakub Kicinski return false; 451d9ae7f2bSJakub Kicinski } 452d9ae7f2bSJakub Kicinski 453d9ae7f2bSJakub Kicinski return true; 454d9ae7f2bSJakub Kicinski } 455d9ae7f2bSJakub Kicinski 456b3f868dfSJakub Kicinski static void wrp_immed(struct nfp_prog *nfp_prog, swreg dst, u32 imm) 457d9ae7f2bSJakub Kicinski { 
458d9ae7f2bSJakub Kicinski enum immed_shift shift; 459d9ae7f2bSJakub Kicinski u16 val; 460d9ae7f2bSJakub Kicinski 461d9ae7f2bSJakub Kicinski if (pack_immed(imm, &val, &shift)) { 462d9ae7f2bSJakub Kicinski emit_immed(nfp_prog, dst, val, IMMED_WIDTH_ALL, false, shift); 463d9ae7f2bSJakub Kicinski } else if (pack_immed(~imm, &val, &shift)) { 464d9ae7f2bSJakub Kicinski emit_immed(nfp_prog, dst, val, IMMED_WIDTH_ALL, true, shift); 465d9ae7f2bSJakub Kicinski } else { 466d9ae7f2bSJakub Kicinski emit_immed(nfp_prog, dst, imm & 0xffff, IMMED_WIDTH_ALL, 467d9ae7f2bSJakub Kicinski false, IMMED_SHIFT_0B); 468d9ae7f2bSJakub Kicinski emit_immed(nfp_prog, dst, imm >> 16, IMMED_WIDTH_WORD, 469d9ae7f2bSJakub Kicinski false, IMMED_SHIFT_2B); 470d9ae7f2bSJakub Kicinski } 471d9ae7f2bSJakub Kicinski } 472d9ae7f2bSJakub Kicinski 473d9ae7f2bSJakub Kicinski /* ur_load_imm_any() - encode immediate or use tmp register (unrestricted) 474d9ae7f2bSJakub Kicinski * If the @imm is small enough encode it directly in operand and return 475d9ae7f2bSJakub Kicinski * otherwise load @imm to a spare register and return its encoding. 476d9ae7f2bSJakub Kicinski */ 477b3f868dfSJakub Kicinski static swreg ur_load_imm_any(struct nfp_prog *nfp_prog, u32 imm, swreg tmp_reg) 478d9ae7f2bSJakub Kicinski { 479d9ae7f2bSJakub Kicinski if (FIELD_FIT(UR_REG_IMM_MAX, imm)) 480d9ae7f2bSJakub Kicinski return reg_imm(imm); 481d9ae7f2bSJakub Kicinski 482d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, tmp_reg, imm); 483d9ae7f2bSJakub Kicinski return tmp_reg; 484d9ae7f2bSJakub Kicinski } 485d9ae7f2bSJakub Kicinski 486d9ae7f2bSJakub Kicinski /* re_load_imm_any() - encode immediate or use tmp register (restricted) 487d9ae7f2bSJakub Kicinski * If the @imm is small enough encode it directly in operand and return 488d9ae7f2bSJakub Kicinski * otherwise load @imm to a spare register and return its encoding. 
489d9ae7f2bSJakub Kicinski */ 490b3f868dfSJakub Kicinski static swreg re_load_imm_any(struct nfp_prog *nfp_prog, u32 imm, swreg tmp_reg) 491d9ae7f2bSJakub Kicinski { 492d9ae7f2bSJakub Kicinski if (FIELD_FIT(RE_REG_IMM_MAX, imm)) 493d9ae7f2bSJakub Kicinski return reg_imm(imm); 494d9ae7f2bSJakub Kicinski 495d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, tmp_reg, imm); 496d9ae7f2bSJakub Kicinski return tmp_reg; 497d9ae7f2bSJakub Kicinski } 498d9ae7f2bSJakub Kicinski 499ff42bb9fSJakub Kicinski static void wrp_nops(struct nfp_prog *nfp_prog, unsigned int count) 500ff42bb9fSJakub Kicinski { 501ff42bb9fSJakub Kicinski while (count--) 502ff42bb9fSJakub Kicinski emit_nop(nfp_prog); 503ff42bb9fSJakub Kicinski } 504ff42bb9fSJakub Kicinski 505d9ae7f2bSJakub Kicinski static void 506d9ae7f2bSJakub Kicinski wrp_br_special(struct nfp_prog *nfp_prog, enum br_mask mask, 507d9ae7f2bSJakub Kicinski enum br_special special) 508d9ae7f2bSJakub Kicinski { 509d9ae7f2bSJakub Kicinski emit_br(nfp_prog, mask, 0, 0); 510d9ae7f2bSJakub Kicinski 511d9ae7f2bSJakub Kicinski nfp_prog->prog[nfp_prog->prog_len - 1] |= 512d9ae7f2bSJakub Kicinski FIELD_PREP(OP_BR_SPECIAL, special); 513d9ae7f2bSJakub Kicinski } 514d9ae7f2bSJakub Kicinski 515c000dfb5SJakub Kicinski static void wrp_mov(struct nfp_prog *nfp_prog, swreg dst, swreg src) 516c000dfb5SJakub Kicinski { 517c000dfb5SJakub Kicinski emit_alu(nfp_prog, dst, reg_none(), ALU_OP_NONE, src); 518c000dfb5SJakub Kicinski } 519c000dfb5SJakub Kicinski 520d9ae7f2bSJakub Kicinski static void wrp_reg_mov(struct nfp_prog *nfp_prog, u16 dst, u16 src) 521d9ae7f2bSJakub Kicinski { 522c000dfb5SJakub Kicinski wrp_mov(nfp_prog, reg_both(dst), reg_b(src)); 523d9ae7f2bSJakub Kicinski } 524d9ae7f2bSJakub Kicinski 5259879a381SJiong Wang /* wrp_reg_subpart() - load @field_len bytes from @offset of @src, write the 5269879a381SJiong Wang * result to @dst from low end. 
5279879a381SJiong Wang */ 5289879a381SJiong Wang static void 5299879a381SJiong Wang wrp_reg_subpart(struct nfp_prog *nfp_prog, swreg dst, swreg src, u8 field_len, 5309879a381SJiong Wang u8 offset) 5319879a381SJiong Wang { 5329879a381SJiong Wang enum shf_sc sc = offset ? SHF_SC_R_SHF : SHF_SC_NONE; 5339879a381SJiong Wang u8 mask = (1 << field_len) - 1; 5349879a381SJiong Wang 5359879a381SJiong Wang emit_ld_field_any(nfp_prog, dst, mask, src, sc, offset * 8, true); 5369879a381SJiong Wang } 5379879a381SJiong Wang 5389879a381SJiong Wang /* NFP has Command Push Pull bus which supports bluk memory operations. */ 5399879a381SJiong Wang static int nfp_cpp_memcpy(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 5409879a381SJiong Wang { 5419879a381SJiong Wang bool descending_seq = meta->ldst_gather_len < 0; 5429879a381SJiong Wang s16 len = abs(meta->ldst_gather_len); 5439879a381SJiong Wang swreg src_base, off; 5449879a381SJiong Wang unsigned int i; 5459879a381SJiong Wang u8 xfer_num; 5469879a381SJiong Wang 5479879a381SJiong Wang off = re_load_imm_any(nfp_prog, meta->insn.off, imm_b(nfp_prog)); 5489879a381SJiong Wang src_base = reg_a(meta->insn.src_reg * 2); 5499879a381SJiong Wang xfer_num = round_up(len, 4) / 4; 5509879a381SJiong Wang 5518c900538SJiong Wang /* Setup PREV_ALU fields to override memory read length. */ 5528c900538SJiong Wang if (len > 32) 5538c900538SJiong Wang wrp_immed(nfp_prog, reg_none(), 5548c900538SJiong Wang CMD_OVE_LEN | FIELD_PREP(CMD_OV_LEN, xfer_num - 1)); 5558c900538SJiong Wang 5569879a381SJiong Wang /* Memory read from source addr into transfer-in registers. */ 5578c900538SJiong Wang emit_cmd_any(nfp_prog, CMD_TGT_READ32_SWAP, CMD_MODE_32b, 0, src_base, 5588c900538SJiong Wang off, xfer_num - 1, true, len > 32); 5599879a381SJiong Wang 5609879a381SJiong Wang /* Move from transfer-in to transfer-out. 
*/ 5619879a381SJiong Wang for (i = 0; i < xfer_num; i++) 5629879a381SJiong Wang wrp_mov(nfp_prog, reg_xfer(i), reg_xfer(i)); 5639879a381SJiong Wang 5649879a381SJiong Wang off = re_load_imm_any(nfp_prog, meta->paired_st->off, imm_b(nfp_prog)); 5659879a381SJiong Wang 5669879a381SJiong Wang if (len <= 8) { 5679879a381SJiong Wang /* Use single direct_ref write8. */ 5689879a381SJiong Wang emit_cmd(nfp_prog, CMD_TGT_WRITE8_SWAP, CMD_MODE_32b, 0, 5699879a381SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, len - 1, 5709879a381SJiong Wang true); 5718c900538SJiong Wang } else if (len <= 32 && IS_ALIGNED(len, 4)) { 5729879a381SJiong Wang /* Use single direct_ref write32. */ 5739879a381SJiong Wang emit_cmd(nfp_prog, CMD_TGT_WRITE32_SWAP, CMD_MODE_32b, 0, 5749879a381SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, xfer_num - 1, 5759879a381SJiong Wang true); 5768c900538SJiong Wang } else if (len <= 32) { 5779879a381SJiong Wang /* Use single indirect_ref write8. */ 5789879a381SJiong Wang wrp_immed(nfp_prog, reg_none(), 5799879a381SJiong Wang CMD_OVE_LEN | FIELD_PREP(CMD_OV_LEN, len - 1)); 5809879a381SJiong Wang emit_cmd_indir(nfp_prog, CMD_TGT_WRITE8_SWAP, CMD_MODE_32b, 0, 5819879a381SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, 5829879a381SJiong Wang len - 1, true); 5838c900538SJiong Wang } else if (IS_ALIGNED(len, 4)) { 5848c900538SJiong Wang /* Use single indirect_ref write32. */ 5858c900538SJiong Wang wrp_immed(nfp_prog, reg_none(), 5868c900538SJiong Wang CMD_OVE_LEN | FIELD_PREP(CMD_OV_LEN, xfer_num - 1)); 5878c900538SJiong Wang emit_cmd_indir(nfp_prog, CMD_TGT_WRITE32_SWAP, CMD_MODE_32b, 0, 5888c900538SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, 5898c900538SJiong Wang xfer_num - 1, true); 5908c900538SJiong Wang } else if (len <= 40) { 5918c900538SJiong Wang /* Use one direct_ref write32 to write the first 32-bytes, then 5928c900538SJiong Wang * another direct_ref write8 to write the remaining bytes. 
5938c900538SJiong Wang */ 5948c900538SJiong Wang emit_cmd(nfp_prog, CMD_TGT_WRITE32_SWAP, CMD_MODE_32b, 0, 5958c900538SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, 7, 5968c900538SJiong Wang true); 5978c900538SJiong Wang 5988c900538SJiong Wang off = re_load_imm_any(nfp_prog, meta->paired_st->off + 32, 5998c900538SJiong Wang imm_b(nfp_prog)); 6008c900538SJiong Wang emit_cmd(nfp_prog, CMD_TGT_WRITE8_SWAP, CMD_MODE_32b, 8, 6018c900538SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, len - 33, 6028c900538SJiong Wang true); 6038c900538SJiong Wang } else { 6048c900538SJiong Wang /* Use one indirect_ref write32 to write 4-bytes aligned length, 6058c900538SJiong Wang * then another direct_ref write8 to write the remaining bytes. 6068c900538SJiong Wang */ 6078c900538SJiong Wang u8 new_off; 6088c900538SJiong Wang 6098c900538SJiong Wang wrp_immed(nfp_prog, reg_none(), 6108c900538SJiong Wang CMD_OVE_LEN | FIELD_PREP(CMD_OV_LEN, xfer_num - 2)); 6118c900538SJiong Wang emit_cmd_indir(nfp_prog, CMD_TGT_WRITE32_SWAP, CMD_MODE_32b, 0, 6128c900538SJiong Wang reg_a(meta->paired_st->dst_reg * 2), off, 6138c900538SJiong Wang xfer_num - 2, true); 6148c900538SJiong Wang new_off = meta->paired_st->off + (xfer_num - 1) * 4; 6158c900538SJiong Wang off = re_load_imm_any(nfp_prog, new_off, imm_b(nfp_prog)); 6168c900538SJiong Wang emit_cmd(nfp_prog, CMD_TGT_WRITE8_SWAP, CMD_MODE_32b, 6178c900538SJiong Wang xfer_num - 1, reg_a(meta->paired_st->dst_reg * 2), off, 6188c900538SJiong Wang (len & 0x3) - 1, true); 6199879a381SJiong Wang } 6209879a381SJiong Wang 6219879a381SJiong Wang /* TODO: The following extra load is to make sure data flow be identical 6229879a381SJiong Wang * before and after we do memory copy optimization. 6239879a381SJiong Wang * 6249879a381SJiong Wang * The load destination register is not guaranteed to be dead, so we 6259879a381SJiong Wang * need to make sure it is loaded with the value the same as before 6269879a381SJiong Wang * this transformation. 
6279879a381SJiong Wang * 6289879a381SJiong Wang * These extra loads could be removed once we have accurate register 6299879a381SJiong Wang * usage information. 6309879a381SJiong Wang */ 6319879a381SJiong Wang if (descending_seq) 6329879a381SJiong Wang xfer_num = 0; 6339879a381SJiong Wang else if (BPF_SIZE(meta->insn.code) != BPF_DW) 6349879a381SJiong Wang xfer_num = xfer_num - 1; 6359879a381SJiong Wang else 6369879a381SJiong Wang xfer_num = xfer_num - 2; 6379879a381SJiong Wang 6389879a381SJiong Wang switch (BPF_SIZE(meta->insn.code)) { 6399879a381SJiong Wang case BPF_B: 6409879a381SJiong Wang wrp_reg_subpart(nfp_prog, reg_both(meta->insn.dst_reg * 2), 6419879a381SJiong Wang reg_xfer(xfer_num), 1, 6429879a381SJiong Wang IS_ALIGNED(len, 4) ? 3 : (len & 3) - 1); 6439879a381SJiong Wang break; 6449879a381SJiong Wang case BPF_H: 6459879a381SJiong Wang wrp_reg_subpart(nfp_prog, reg_both(meta->insn.dst_reg * 2), 6469879a381SJiong Wang reg_xfer(xfer_num), 2, (len & 3) ^ 2); 6479879a381SJiong Wang break; 6489879a381SJiong Wang case BPF_W: 6499879a381SJiong Wang wrp_mov(nfp_prog, reg_both(meta->insn.dst_reg * 2), 6509879a381SJiong Wang reg_xfer(0)); 6519879a381SJiong Wang break; 6529879a381SJiong Wang case BPF_DW: 6539879a381SJiong Wang wrp_mov(nfp_prog, reg_both(meta->insn.dst_reg * 2), 6549879a381SJiong Wang reg_xfer(xfer_num)); 6559879a381SJiong Wang wrp_mov(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), 6569879a381SJiong Wang reg_xfer(xfer_num + 1)); 6579879a381SJiong Wang break; 6589879a381SJiong Wang } 6599879a381SJiong Wang 6609879a381SJiong Wang if (BPF_SIZE(meta->insn.code) != BPF_DW) 6619879a381SJiong Wang wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), 0); 6629879a381SJiong Wang 6639879a381SJiong Wang return 0; 6649879a381SJiong Wang } 6659879a381SJiong Wang 666d9ae7f2bSJakub Kicinski static int 6670a793977SJakub Kicinski data_ld(struct nfp_prog *nfp_prog, swreg offset, u8 dst_gpr, int size) 668d9ae7f2bSJakub Kicinski { 669d9ae7f2bSJakub Kicinski 
unsigned int i; 670d9ae7f2bSJakub Kicinski u16 shift, sz; 671d9ae7f2bSJakub Kicinski 672d9ae7f2bSJakub Kicinski /* We load the value from the address indicated in @offset and then 673d9ae7f2bSJakub Kicinski * shift out the data we don't need. Note: this is big endian! 674d9ae7f2bSJakub Kicinski */ 6750a793977SJakub Kicinski sz = max(size, 4); 676d9ae7f2bSJakub Kicinski shift = size < 4 ? 4 - size : 0; 677d9ae7f2bSJakub Kicinski 6780a793977SJakub Kicinski emit_cmd(nfp_prog, CMD_TGT_READ8, CMD_MODE_32b, 0, 6790a793977SJakub Kicinski pptr_reg(nfp_prog), offset, sz - 1, true); 6800a793977SJakub Kicinski 6810a793977SJakub Kicinski i = 0; 6820a793977SJakub Kicinski if (shift) 6830a793977SJakub Kicinski emit_shf(nfp_prog, reg_both(dst_gpr), reg_none(), SHF_OP_NONE, 6840a793977SJakub Kicinski reg_xfer(0), SHF_SC_R_SHF, shift * 8); 6850a793977SJakub Kicinski else 6860a793977SJakub Kicinski for (; i * 4 < size; i++) 6870a793977SJakub Kicinski wrp_mov(nfp_prog, reg_both(dst_gpr + i), reg_xfer(i)); 6880a793977SJakub Kicinski 6890a793977SJakub Kicinski if (i < 2) 6900a793977SJakub Kicinski wrp_immed(nfp_prog, reg_both(dst_gpr + 1), 0); 6910a793977SJakub Kicinski 6920a793977SJakub Kicinski return 0; 6930a793977SJakub Kicinski } 6940a793977SJakub Kicinski 6950a793977SJakub Kicinski static int 6962ca71441SJakub Kicinski data_ld_host_order(struct nfp_prog *nfp_prog, u8 src_gpr, swreg offset, 6972ca71441SJakub Kicinski u8 dst_gpr, int size) 6982ca71441SJakub Kicinski { 6992ca71441SJakub Kicinski unsigned int i; 7002ca71441SJakub Kicinski u8 mask, sz; 7012ca71441SJakub Kicinski 7022ca71441SJakub Kicinski /* We load the value from the address indicated in @offset and then 7032ca71441SJakub Kicinski * mask out the data we don't need. Note: this is little endian! 7042ca71441SJakub Kicinski */ 7052ca71441SJakub Kicinski sz = max(size, 4); 7062ca71441SJakub Kicinski mask = size < 4 ? 
GENMASK(size - 1, 0) : 0; 7072ca71441SJakub Kicinski 7082ca71441SJakub Kicinski emit_cmd(nfp_prog, CMD_TGT_READ32_SWAP, CMD_MODE_32b, 0, 7092ca71441SJakub Kicinski reg_a(src_gpr), offset, sz / 4 - 1, true); 7102ca71441SJakub Kicinski 7112ca71441SJakub Kicinski i = 0; 7122ca71441SJakub Kicinski if (mask) 7132ca71441SJakub Kicinski emit_ld_field_any(nfp_prog, reg_both(dst_gpr), mask, 7142ca71441SJakub Kicinski reg_xfer(0), SHF_SC_NONE, 0, true); 7152ca71441SJakub Kicinski else 7162ca71441SJakub Kicinski for (; i * 4 < size; i++) 7172ca71441SJakub Kicinski wrp_mov(nfp_prog, reg_both(dst_gpr + i), reg_xfer(i)); 7182ca71441SJakub Kicinski 7192ca71441SJakub Kicinski if (i < 2) 7202ca71441SJakub Kicinski wrp_immed(nfp_prog, reg_both(dst_gpr + 1), 0); 7212ca71441SJakub Kicinski 7222ca71441SJakub Kicinski return 0; 7232ca71441SJakub Kicinski } 7242ca71441SJakub Kicinski 7252ca71441SJakub Kicinski static int 7260a793977SJakub Kicinski construct_data_ind_ld(struct nfp_prog *nfp_prog, u16 offset, u16 src, u8 size) 7270a793977SJakub Kicinski { 7280a793977SJakub Kicinski swreg tmp_reg; 7290a793977SJakub Kicinski 730d9ae7f2bSJakub Kicinski /* Calculate the true offset (src_reg + imm) */ 731d9ae7f2bSJakub Kicinski tmp_reg = ur_load_imm_any(nfp_prog, offset, imm_b(nfp_prog)); 7320a793977SJakub Kicinski emit_alu(nfp_prog, imm_both(nfp_prog), reg_a(src), ALU_OP_ADD, tmp_reg); 7330a793977SJakub Kicinski 734d9ae7f2bSJakub Kicinski /* Check packet length (size guaranteed to fit b/c it's u8) */ 735d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, imm_a(nfp_prog), 736d9ae7f2bSJakub Kicinski imm_a(nfp_prog), ALU_OP_ADD, reg_imm(size)); 737d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), 73818e53b6cSJakub Kicinski plen_reg(nfp_prog), ALU_OP_SUB, imm_a(nfp_prog)); 739d9ae7f2bSJakub Kicinski wrp_br_special(nfp_prog, BR_BLO, OP_BR_GO_ABORT); 7400a793977SJakub Kicinski 741d9ae7f2bSJakub Kicinski /* Load data */ 7420a793977SJakub Kicinski return data_ld(nfp_prog, imm_b(nfp_prog), 0, size); 
743d9ae7f2bSJakub Kicinski } 744d9ae7f2bSJakub Kicinski 745d9ae7f2bSJakub Kicinski static int construct_data_ld(struct nfp_prog *nfp_prog, u16 offset, u8 size) 746d9ae7f2bSJakub Kicinski { 7470a793977SJakub Kicinski swreg tmp_reg; 7480a793977SJakub Kicinski 7490a793977SJakub Kicinski /* Check packet length */ 7500a793977SJakub Kicinski tmp_reg = ur_load_imm_any(nfp_prog, offset + size, imm_a(nfp_prog)); 7510a793977SJakub Kicinski emit_alu(nfp_prog, reg_none(), plen_reg(nfp_prog), ALU_OP_SUB, tmp_reg); 7520a793977SJakub Kicinski wrp_br_special(nfp_prog, BR_BLO, OP_BR_GO_ABORT); 7530a793977SJakub Kicinski 7540a793977SJakub Kicinski /* Load data */ 7550a793977SJakub Kicinski tmp_reg = re_load_imm_any(nfp_prog, offset, imm_b(nfp_prog)); 7560a793977SJakub Kicinski return data_ld(nfp_prog, tmp_reg, 0, size); 757d9ae7f2bSJakub Kicinski } 758d9ae7f2bSJakub Kicinski 759e663fe38SJakub Kicinski static int 760e663fe38SJakub Kicinski data_stx_host_order(struct nfp_prog *nfp_prog, u8 dst_gpr, swreg offset, 761e663fe38SJakub Kicinski u8 src_gpr, u8 size) 762e663fe38SJakub Kicinski { 763e663fe38SJakub Kicinski unsigned int i; 764e663fe38SJakub Kicinski 765e663fe38SJakub Kicinski for (i = 0; i * 4 < size; i++) 766e663fe38SJakub Kicinski wrp_mov(nfp_prog, reg_xfer(i), reg_a(src_gpr + i)); 767e663fe38SJakub Kicinski 768e663fe38SJakub Kicinski emit_cmd(nfp_prog, CMD_TGT_WRITE8_SWAP, CMD_MODE_32b, 0, 769e663fe38SJakub Kicinski reg_a(dst_gpr), offset, size - 1, true); 770e663fe38SJakub Kicinski 771e663fe38SJakub Kicinski return 0; 772e663fe38SJakub Kicinski } 773e663fe38SJakub Kicinski 774e663fe38SJakub Kicinski static int 775e663fe38SJakub Kicinski data_st_host_order(struct nfp_prog *nfp_prog, u8 dst_gpr, swreg offset, 776e663fe38SJakub Kicinski u64 imm, u8 size) 777e663fe38SJakub Kicinski { 778e663fe38SJakub Kicinski wrp_immed(nfp_prog, reg_xfer(0), imm); 779e663fe38SJakub Kicinski if (size == 8) 780e663fe38SJakub Kicinski wrp_immed(nfp_prog, reg_xfer(1), imm >> 32); 781e663fe38SJakub 
Kicinski 782e663fe38SJakub Kicinski emit_cmd(nfp_prog, CMD_TGT_WRITE8_SWAP, CMD_MODE_32b, 0, 783e663fe38SJakub Kicinski reg_a(dst_gpr), offset, size - 1, true); 784e663fe38SJakub Kicinski 785e663fe38SJakub Kicinski return 0; 786e663fe38SJakub Kicinski } 787e663fe38SJakub Kicinski 788ee9133a8SJakub Kicinski typedef int 789ee9133a8SJakub Kicinski (*lmem_step)(struct nfp_prog *nfp_prog, u8 gpr, u8 gpr_byte, s32 off, 7902df03a50SJakub Kicinski unsigned int size, bool first, bool new_gpr, bool last, bool lm3, 7912df03a50SJakub Kicinski bool needs_inc); 792a82b23fbSJakub Kicinski 793a82b23fbSJakub Kicinski static int 794a82b23fbSJakub Kicinski wrp_lmem_load(struct nfp_prog *nfp_prog, u8 dst, u8 dst_byte, s32 off, 7952df03a50SJakub Kicinski unsigned int size, bool first, bool new_gpr, bool last, bool lm3, 7962df03a50SJakub Kicinski bool needs_inc) 797a82b23fbSJakub Kicinski { 7982df03a50SJakub Kicinski bool should_inc = needs_inc && new_gpr && !last; 799a82b23fbSJakub Kicinski u32 idx, src_byte; 800a82b23fbSJakub Kicinski enum shf_sc sc; 801a82b23fbSJakub Kicinski swreg reg; 802a82b23fbSJakub Kicinski int shf; 803a82b23fbSJakub Kicinski u8 mask; 804a82b23fbSJakub Kicinski 805a82b23fbSJakub Kicinski if (WARN_ON_ONCE(dst_byte + size > 4 || off % 4 + size > 4)) 806a82b23fbSJakub Kicinski return -EOPNOTSUPP; 807a82b23fbSJakub Kicinski 808a82b23fbSJakub Kicinski idx = off / 4; 809a82b23fbSJakub Kicinski 810a82b23fbSJakub Kicinski /* Move the entire word */ 811a82b23fbSJakub Kicinski if (size == 4) { 8122df03a50SJakub Kicinski wrp_mov(nfp_prog, reg_both(dst), 8132df03a50SJakub Kicinski should_inc ? reg_lm_inc(3) : reg_lm(lm3 ? 
3 : 0, idx)); 814a82b23fbSJakub Kicinski return 0; 815a82b23fbSJakub Kicinski } 816a82b23fbSJakub Kicinski 8172df03a50SJakub Kicinski if (WARN_ON_ONCE(lm3 && idx > RE_REG_LM_IDX_MAX)) 8182df03a50SJakub Kicinski return -EOPNOTSUPP; 8192df03a50SJakub Kicinski 820a82b23fbSJakub Kicinski src_byte = off % 4; 821a82b23fbSJakub Kicinski 822a82b23fbSJakub Kicinski mask = (1 << size) - 1; 823a82b23fbSJakub Kicinski mask <<= dst_byte; 824a82b23fbSJakub Kicinski 825a82b23fbSJakub Kicinski if (WARN_ON_ONCE(mask > 0xf)) 826a82b23fbSJakub Kicinski return -EOPNOTSUPP; 827a82b23fbSJakub Kicinski 828a82b23fbSJakub Kicinski shf = abs(src_byte - dst_byte) * 8; 829a82b23fbSJakub Kicinski if (src_byte == dst_byte) { 830a82b23fbSJakub Kicinski sc = SHF_SC_NONE; 831a82b23fbSJakub Kicinski } else if (src_byte < dst_byte) { 832a82b23fbSJakub Kicinski shf = 32 - shf; 833a82b23fbSJakub Kicinski sc = SHF_SC_L_SHF; 834a82b23fbSJakub Kicinski } else { 835a82b23fbSJakub Kicinski sc = SHF_SC_R_SHF; 836a82b23fbSJakub Kicinski } 837a82b23fbSJakub Kicinski 838a82b23fbSJakub Kicinski /* ld_field can address fewer indexes, if offset too large do RMW. 839a82b23fbSJakub Kicinski * Because we RMV twice we waste 2 cycles on unaligned 8 byte writes. 840a82b23fbSJakub Kicinski */ 841a82b23fbSJakub Kicinski if (idx <= RE_REG_LM_IDX_MAX) { 8422df03a50SJakub Kicinski reg = reg_lm(lm3 ? 3 : 0, idx); 843a82b23fbSJakub Kicinski } else { 844a82b23fbSJakub Kicinski reg = imm_a(nfp_prog); 8459a90c83cSJakub Kicinski /* If it's not the first part of the load and we start a new GPR 8469a90c83cSJakub Kicinski * that means we are loading a second part of the LMEM word into 8479a90c83cSJakub Kicinski * a new GPR. IOW we've already looked that LMEM word and 8489a90c83cSJakub Kicinski * therefore it has been loaded into imm_a(). 
8499a90c83cSJakub Kicinski */ 8509a90c83cSJakub Kicinski if (first || !new_gpr) 851a82b23fbSJakub Kicinski wrp_mov(nfp_prog, reg, reg_lm(0, idx)); 852a82b23fbSJakub Kicinski } 853a82b23fbSJakub Kicinski 854a82b23fbSJakub Kicinski emit_ld_field_any(nfp_prog, reg_both(dst), mask, reg, sc, shf, new_gpr); 855a82b23fbSJakub Kicinski 8562df03a50SJakub Kicinski if (should_inc) 8572df03a50SJakub Kicinski wrp_mov(nfp_prog, reg_none(), reg_lm_inc(3)); 8582df03a50SJakub Kicinski 859a82b23fbSJakub Kicinski return 0; 860a82b23fbSJakub Kicinski } 861ee9133a8SJakub Kicinski 862ee9133a8SJakub Kicinski static int 863ee9133a8SJakub Kicinski wrp_lmem_store(struct nfp_prog *nfp_prog, u8 src, u8 src_byte, s32 off, 8642df03a50SJakub Kicinski unsigned int size, bool first, bool new_gpr, bool last, bool lm3, 8652df03a50SJakub Kicinski bool needs_inc) 866ee9133a8SJakub Kicinski { 8672df03a50SJakub Kicinski bool should_inc = needs_inc && new_gpr && !last; 868ee9133a8SJakub Kicinski u32 idx, dst_byte; 869ee9133a8SJakub Kicinski enum shf_sc sc; 870ee9133a8SJakub Kicinski swreg reg; 871ee9133a8SJakub Kicinski int shf; 872ee9133a8SJakub Kicinski u8 mask; 873ee9133a8SJakub Kicinski 874ee9133a8SJakub Kicinski if (WARN_ON_ONCE(src_byte + size > 4 || off % 4 + size > 4)) 875ee9133a8SJakub Kicinski return -EOPNOTSUPP; 876ee9133a8SJakub Kicinski 877ee9133a8SJakub Kicinski idx = off / 4; 878ee9133a8SJakub Kicinski 879ee9133a8SJakub Kicinski /* Move the entire word */ 880ee9133a8SJakub Kicinski if (size == 4) { 8812df03a50SJakub Kicinski wrp_mov(nfp_prog, 8822df03a50SJakub Kicinski should_inc ? reg_lm_inc(3) : reg_lm(lm3 ? 
3 : 0, idx), 8832df03a50SJakub Kicinski reg_b(src)); 884ee9133a8SJakub Kicinski return 0; 885ee9133a8SJakub Kicinski } 886ee9133a8SJakub Kicinski 8872df03a50SJakub Kicinski if (WARN_ON_ONCE(lm3 && idx > RE_REG_LM_IDX_MAX)) 8882df03a50SJakub Kicinski return -EOPNOTSUPP; 8892df03a50SJakub Kicinski 890ee9133a8SJakub Kicinski dst_byte = off % 4; 891ee9133a8SJakub Kicinski 892ee9133a8SJakub Kicinski mask = (1 << size) - 1; 893ee9133a8SJakub Kicinski mask <<= dst_byte; 894ee9133a8SJakub Kicinski 895ee9133a8SJakub Kicinski if (WARN_ON_ONCE(mask > 0xf)) 896ee9133a8SJakub Kicinski return -EOPNOTSUPP; 897ee9133a8SJakub Kicinski 898ee9133a8SJakub Kicinski shf = abs(src_byte - dst_byte) * 8; 899ee9133a8SJakub Kicinski if (src_byte == dst_byte) { 900ee9133a8SJakub Kicinski sc = SHF_SC_NONE; 901ee9133a8SJakub Kicinski } else if (src_byte < dst_byte) { 902ee9133a8SJakub Kicinski shf = 32 - shf; 903ee9133a8SJakub Kicinski sc = SHF_SC_L_SHF; 904ee9133a8SJakub Kicinski } else { 905ee9133a8SJakub Kicinski sc = SHF_SC_R_SHF; 906ee9133a8SJakub Kicinski } 907ee9133a8SJakub Kicinski 908ee9133a8SJakub Kicinski /* ld_field can address fewer indexes, if offset too large do RMW. 909ee9133a8SJakub Kicinski * Because we RMV twice we waste 2 cycles on unaligned 8 byte writes. 910ee9133a8SJakub Kicinski */ 911ee9133a8SJakub Kicinski if (idx <= RE_REG_LM_IDX_MAX) { 9122df03a50SJakub Kicinski reg = reg_lm(lm3 ? 3 : 0, idx); 913ee9133a8SJakub Kicinski } else { 914ee9133a8SJakub Kicinski reg = imm_a(nfp_prog); 9159a90c83cSJakub Kicinski /* Only first and last LMEM locations are going to need RMW, 9169a90c83cSJakub Kicinski * the middle location will be overwritten fully. 
9179a90c83cSJakub Kicinski */ 9189a90c83cSJakub Kicinski if (first || last) 919ee9133a8SJakub Kicinski wrp_mov(nfp_prog, reg, reg_lm(0, idx)); 920ee9133a8SJakub Kicinski } 921ee9133a8SJakub Kicinski 922ee9133a8SJakub Kicinski emit_ld_field(nfp_prog, reg, mask, reg_b(src), sc, shf); 923ee9133a8SJakub Kicinski 9249a90c83cSJakub Kicinski if (new_gpr || last) { 925ee9133a8SJakub Kicinski if (idx > RE_REG_LM_IDX_MAX) 926ee9133a8SJakub Kicinski wrp_mov(nfp_prog, reg_lm(0, idx), reg); 9272df03a50SJakub Kicinski if (should_inc) 9282df03a50SJakub Kicinski wrp_mov(nfp_prog, reg_none(), reg_lm_inc(3)); 9299a90c83cSJakub Kicinski } 930ee9133a8SJakub Kicinski 931ee9133a8SJakub Kicinski return 0; 932ee9133a8SJakub Kicinski } 933ee9133a8SJakub Kicinski 934ee9133a8SJakub Kicinski static int 935ee9133a8SJakub Kicinski mem_op_stack(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 936b14157eeSJakub Kicinski unsigned int size, unsigned int ptr_off, u8 gpr, u8 ptr_gpr, 937b14157eeSJakub Kicinski bool clr_gpr, lmem_step step) 938ee9133a8SJakub Kicinski { 939d3488480SJakub Kicinski s32 off = nfp_prog->stack_depth + meta->insn.off + ptr_off; 9409a90c83cSJakub Kicinski bool first = true, last; 9412df03a50SJakub Kicinski bool needs_inc = false; 9422df03a50SJakub Kicinski swreg stack_off_reg; 943a82b23fbSJakub Kicinski u8 prev_gpr = 255; 944ee9133a8SJakub Kicinski u32 gpr_byte = 0; 9452df03a50SJakub Kicinski bool lm3 = true; 946ee9133a8SJakub Kicinski int ret; 947ee9133a8SJakub Kicinski 948b14157eeSJakub Kicinski if (meta->ptr_not_const) { 949b14157eeSJakub Kicinski /* Use of the last encountered ptr_off is OK, they all have 950b14157eeSJakub Kicinski * the same alignment. Depend on low bits of value being 951b14157eeSJakub Kicinski * discarded when written to LMaddr register. 
952b14157eeSJakub Kicinski */ 953b14157eeSJakub Kicinski stack_off_reg = ur_load_imm_any(nfp_prog, meta->insn.off, 954b14157eeSJakub Kicinski stack_imm(nfp_prog)); 955b14157eeSJakub Kicinski 956b14157eeSJakub Kicinski emit_alu(nfp_prog, imm_b(nfp_prog), 957b14157eeSJakub Kicinski reg_a(ptr_gpr), ALU_OP_ADD, stack_off_reg); 958b14157eeSJakub Kicinski 959b14157eeSJakub Kicinski needs_inc = true; 960b14157eeSJakub Kicinski } else if (off + size <= 64) { 9612df03a50SJakub Kicinski /* We can reach bottom 64B with LMaddr0 */ 9622df03a50SJakub Kicinski lm3 = false; 9632df03a50SJakub Kicinski } else if (round_down(off, 32) == round_down(off + size - 1, 32)) { 9642df03a50SJakub Kicinski /* We have to set up a new pointer. If we know the offset 9652df03a50SJakub Kicinski * and the entire access falls into a single 32 byte aligned 9662df03a50SJakub Kicinski * window we won't have to increment the LM pointer. 9672df03a50SJakub Kicinski * The 32 byte alignment is imporant because offset is ORed in 9682df03a50SJakub Kicinski * not added when doing *l$indexN[off]. 
9692df03a50SJakub Kicinski */ 9702df03a50SJakub Kicinski stack_off_reg = ur_load_imm_any(nfp_prog, round_down(off, 32), 9712df03a50SJakub Kicinski stack_imm(nfp_prog)); 9722df03a50SJakub Kicinski emit_alu(nfp_prog, imm_b(nfp_prog), 9732df03a50SJakub Kicinski stack_reg(nfp_prog), ALU_OP_ADD, stack_off_reg); 9742df03a50SJakub Kicinski 9752df03a50SJakub Kicinski off %= 32; 9762df03a50SJakub Kicinski } else { 9772df03a50SJakub Kicinski stack_off_reg = ur_load_imm_any(nfp_prog, round_down(off, 4), 9782df03a50SJakub Kicinski stack_imm(nfp_prog)); 9792df03a50SJakub Kicinski 9802df03a50SJakub Kicinski emit_alu(nfp_prog, imm_b(nfp_prog), 9812df03a50SJakub Kicinski stack_reg(nfp_prog), ALU_OP_ADD, stack_off_reg); 9822df03a50SJakub Kicinski 9832df03a50SJakub Kicinski needs_inc = true; 9842df03a50SJakub Kicinski } 9852df03a50SJakub Kicinski if (lm3) { 9862df03a50SJakub Kicinski emit_csr_wr(nfp_prog, imm_b(nfp_prog), NFP_CSR_ACT_LM_ADDR3); 9872df03a50SJakub Kicinski /* For size < 4 one slot will be filled by zeroing of upper. */ 9882df03a50SJakub Kicinski wrp_nops(nfp_prog, clr_gpr && size < 8 ? 
2 : 3); 9892df03a50SJakub Kicinski } 9902df03a50SJakub Kicinski 991a82b23fbSJakub Kicinski if (clr_gpr && size < 8) 992a82b23fbSJakub Kicinski wrp_immed(nfp_prog, reg_both(gpr + 1), 0); 993a82b23fbSJakub Kicinski 994ee9133a8SJakub Kicinski while (size) { 995ee9133a8SJakub Kicinski u32 slice_end; 996ee9133a8SJakub Kicinski u8 slice_size; 997ee9133a8SJakub Kicinski 998ee9133a8SJakub Kicinski slice_size = min(size, 4 - gpr_byte); 999ee9133a8SJakub Kicinski slice_end = min(off + slice_size, round_up(off + 1, 4)); 1000ee9133a8SJakub Kicinski slice_size = slice_end - off; 1001ee9133a8SJakub Kicinski 10029a90c83cSJakub Kicinski last = slice_size == size; 10039a90c83cSJakub Kicinski 10042df03a50SJakub Kicinski if (needs_inc) 10052df03a50SJakub Kicinski off %= 4; 10062df03a50SJakub Kicinski 1007a82b23fbSJakub Kicinski ret = step(nfp_prog, gpr, gpr_byte, off, slice_size, 10082df03a50SJakub Kicinski first, gpr != prev_gpr, last, lm3, needs_inc); 1009ee9133a8SJakub Kicinski if (ret) 1010ee9133a8SJakub Kicinski return ret; 1011ee9133a8SJakub Kicinski 1012a82b23fbSJakub Kicinski prev_gpr = gpr; 10139a90c83cSJakub Kicinski first = false; 10149a90c83cSJakub Kicinski 1015ee9133a8SJakub Kicinski gpr_byte += slice_size; 1016ee9133a8SJakub Kicinski if (gpr_byte >= 4) { 1017ee9133a8SJakub Kicinski gpr_byte -= 4; 1018ee9133a8SJakub Kicinski gpr++; 1019ee9133a8SJakub Kicinski } 1020ee9133a8SJakub Kicinski 1021ee9133a8SJakub Kicinski size -= slice_size; 1022ee9133a8SJakub Kicinski off += slice_size; 1023ee9133a8SJakub Kicinski } 1024ee9133a8SJakub Kicinski 1025ee9133a8SJakub Kicinski return 0; 1026ee9133a8SJakub Kicinski } 1027ee9133a8SJakub Kicinski 1028d9ae7f2bSJakub Kicinski static void 1029d9ae7f2bSJakub Kicinski wrp_alu_imm(struct nfp_prog *nfp_prog, u8 dst, enum alu_op alu_op, u32 imm) 1030d9ae7f2bSJakub Kicinski { 1031b3f868dfSJakub Kicinski swreg tmp_reg; 1032d9ae7f2bSJakub Kicinski 1033d9ae7f2bSJakub Kicinski if (alu_op == ALU_OP_AND) { 1034d9ae7f2bSJakub Kicinski if (!imm) 
1035d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(dst), 0); 1036d9ae7f2bSJakub Kicinski if (!imm || !~imm) 1037d9ae7f2bSJakub Kicinski return; 1038d9ae7f2bSJakub Kicinski } 1039d9ae7f2bSJakub Kicinski if (alu_op == ALU_OP_OR) { 1040d9ae7f2bSJakub Kicinski if (!~imm) 1041d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(dst), ~0U); 1042d9ae7f2bSJakub Kicinski if (!imm || !~imm) 1043d9ae7f2bSJakub Kicinski return; 1044d9ae7f2bSJakub Kicinski } 1045d9ae7f2bSJakub Kicinski if (alu_op == ALU_OP_XOR) { 1046d9ae7f2bSJakub Kicinski if (!~imm) 1047d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(dst), reg_none(), 10485d42ced1SJiong Wang ALU_OP_NOT, reg_b(dst)); 1049d9ae7f2bSJakub Kicinski if (!imm || !~imm) 1050d9ae7f2bSJakub Kicinski return; 1051d9ae7f2bSJakub Kicinski } 1052d9ae7f2bSJakub Kicinski 1053d9ae7f2bSJakub Kicinski tmp_reg = ur_load_imm_any(nfp_prog, imm, imm_b(nfp_prog)); 1054d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(dst), reg_a(dst), alu_op, tmp_reg); 1055d9ae7f2bSJakub Kicinski } 1056d9ae7f2bSJakub Kicinski 1057d9ae7f2bSJakub Kicinski static int 1058d9ae7f2bSJakub Kicinski wrp_alu64_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1059d9ae7f2bSJakub Kicinski enum alu_op alu_op, bool skip) 1060d9ae7f2bSJakub Kicinski { 1061d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1062d9ae7f2bSJakub Kicinski u64 imm = insn->imm; /* sign extend */ 1063d9ae7f2bSJakub Kicinski 1064d9ae7f2bSJakub Kicinski if (skip) { 1065d9ae7f2bSJakub Kicinski meta->skip = true; 1066d9ae7f2bSJakub Kicinski return 0; 1067d9ae7f2bSJakub Kicinski } 1068d9ae7f2bSJakub Kicinski 1069d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2, alu_op, imm & ~0U); 1070d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2 + 1, alu_op, imm >> 32); 1071d9ae7f2bSJakub Kicinski 1072d9ae7f2bSJakub Kicinski return 0; 1073d9ae7f2bSJakub Kicinski } 1074d9ae7f2bSJakub Kicinski 1075d9ae7f2bSJakub Kicinski static int 1076d9ae7f2bSJakub Kicinski 
wrp_alu64_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1077d9ae7f2bSJakub Kicinski enum alu_op alu_op) 1078d9ae7f2bSJakub Kicinski { 1079d9ae7f2bSJakub Kicinski u8 dst = meta->insn.dst_reg * 2, src = meta->insn.src_reg * 2; 1080d9ae7f2bSJakub Kicinski 1081d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(dst), reg_a(dst), alu_op, reg_b(src)); 1082d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(dst + 1), 1083d9ae7f2bSJakub Kicinski reg_a(dst + 1), alu_op, reg_b(src + 1)); 1084d9ae7f2bSJakub Kicinski 1085d9ae7f2bSJakub Kicinski return 0; 1086d9ae7f2bSJakub Kicinski } 1087d9ae7f2bSJakub Kicinski 1088d9ae7f2bSJakub Kicinski static int 1089d9ae7f2bSJakub Kicinski wrp_alu32_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1090d9ae7f2bSJakub Kicinski enum alu_op alu_op, bool skip) 1091d9ae7f2bSJakub Kicinski { 1092d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1093d9ae7f2bSJakub Kicinski 1094d9ae7f2bSJakub Kicinski if (skip) { 1095d9ae7f2bSJakub Kicinski meta->skip = true; 1096d9ae7f2bSJakub Kicinski return 0; 1097d9ae7f2bSJakub Kicinski } 1098d9ae7f2bSJakub Kicinski 1099d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2, alu_op, insn->imm); 1100d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(insn->dst_reg * 2 + 1), 0); 1101d9ae7f2bSJakub Kicinski 1102d9ae7f2bSJakub Kicinski return 0; 1103d9ae7f2bSJakub Kicinski } 1104d9ae7f2bSJakub Kicinski 1105d9ae7f2bSJakub Kicinski static int 1106d9ae7f2bSJakub Kicinski wrp_alu32_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1107d9ae7f2bSJakub Kicinski enum alu_op alu_op) 1108d9ae7f2bSJakub Kicinski { 1109d9ae7f2bSJakub Kicinski u8 dst = meta->insn.dst_reg * 2, src = meta->insn.src_reg * 2; 1110d9ae7f2bSJakub Kicinski 1111d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(dst), reg_a(dst), alu_op, reg_b(src)); 1112d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), 0); 1113d9ae7f2bSJakub Kicinski 1114d9ae7f2bSJakub Kicinski 
return 0; 1115d9ae7f2bSJakub Kicinski } 1116d9ae7f2bSJakub Kicinski 1117d9ae7f2bSJakub Kicinski static void 1118d9ae7f2bSJakub Kicinski wrp_test_reg_one(struct nfp_prog *nfp_prog, u8 dst, enum alu_op alu_op, u8 src, 1119d9ae7f2bSJakub Kicinski enum br_mask br_mask, u16 off) 1120d9ae7f2bSJakub Kicinski { 1121d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), reg_a(dst), alu_op, reg_b(src)); 1122d9ae7f2bSJakub Kicinski emit_br(nfp_prog, br_mask, off, 0); 1123d9ae7f2bSJakub Kicinski } 1124d9ae7f2bSJakub Kicinski 1125d9ae7f2bSJakub Kicinski static int 1126d9ae7f2bSJakub Kicinski wrp_test_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1127d9ae7f2bSJakub Kicinski enum alu_op alu_op, enum br_mask br_mask) 1128d9ae7f2bSJakub Kicinski { 1129d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1130d9ae7f2bSJakub Kicinski 1131d9ae7f2bSJakub Kicinski wrp_test_reg_one(nfp_prog, insn->dst_reg * 2, alu_op, 1132d9ae7f2bSJakub Kicinski insn->src_reg * 2, br_mask, insn->off); 1133d9ae7f2bSJakub Kicinski wrp_test_reg_one(nfp_prog, insn->dst_reg * 2 + 1, alu_op, 1134d9ae7f2bSJakub Kicinski insn->src_reg * 2 + 1, br_mask, insn->off); 1135d9ae7f2bSJakub Kicinski 1136d9ae7f2bSJakub Kicinski return 0; 1137d9ae7f2bSJakub Kicinski } 1138d9ae7f2bSJakub Kicinski 1139d9ae7f2bSJakub Kicinski static int 1140d9ae7f2bSJakub Kicinski wrp_cmp_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1141d9ae7f2bSJakub Kicinski enum br_mask br_mask, bool swap) 1142d9ae7f2bSJakub Kicinski { 1143d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1144d9ae7f2bSJakub Kicinski u64 imm = insn->imm; /* sign extend */ 1145d9ae7f2bSJakub Kicinski u8 reg = insn->dst_reg * 2; 1146b3f868dfSJakub Kicinski swreg tmp_reg; 1147d9ae7f2bSJakub Kicinski 1148d9ae7f2bSJakub Kicinski tmp_reg = ur_load_imm_any(nfp_prog, imm & ~0U, imm_b(nfp_prog)); 1149d9ae7f2bSJakub Kicinski if (!swap) 1150d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), reg_a(reg), ALU_OP_SUB, tmp_reg); 
1151d9ae7f2bSJakub Kicinski else 1152d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), tmp_reg, ALU_OP_SUB, reg_a(reg)); 1153d9ae7f2bSJakub Kicinski 1154d9ae7f2bSJakub Kicinski tmp_reg = ur_load_imm_any(nfp_prog, imm >> 32, imm_b(nfp_prog)); 1155d9ae7f2bSJakub Kicinski if (!swap) 1156d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), 1157d9ae7f2bSJakub Kicinski reg_a(reg + 1), ALU_OP_SUB_C, tmp_reg); 1158d9ae7f2bSJakub Kicinski else 1159d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), 1160d9ae7f2bSJakub Kicinski tmp_reg, ALU_OP_SUB_C, reg_a(reg + 1)); 1161d9ae7f2bSJakub Kicinski 1162d9ae7f2bSJakub Kicinski emit_br(nfp_prog, br_mask, insn->off, 0); 1163d9ae7f2bSJakub Kicinski 1164d9ae7f2bSJakub Kicinski return 0; 1165d9ae7f2bSJakub Kicinski } 1166d9ae7f2bSJakub Kicinski 1167d9ae7f2bSJakub Kicinski static int 1168d9ae7f2bSJakub Kicinski wrp_cmp_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1169d9ae7f2bSJakub Kicinski enum br_mask br_mask, bool swap) 1170d9ae7f2bSJakub Kicinski { 1171d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 117226fa818dSJakub Kicinski u8 areg, breg; 117326fa818dSJakub Kicinski 117426fa818dSJakub Kicinski areg = insn->dst_reg * 2; 117526fa818dSJakub Kicinski breg = insn->src_reg * 2; 1176d9ae7f2bSJakub Kicinski 1177d9ae7f2bSJakub Kicinski if (swap) { 1178d9ae7f2bSJakub Kicinski areg ^= breg; 1179d9ae7f2bSJakub Kicinski breg ^= areg; 1180d9ae7f2bSJakub Kicinski areg ^= breg; 1181d9ae7f2bSJakub Kicinski } 1182d9ae7f2bSJakub Kicinski 1183d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), reg_a(areg), ALU_OP_SUB, reg_b(breg)); 1184d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_none(), 1185d9ae7f2bSJakub Kicinski reg_a(areg + 1), ALU_OP_SUB_C, reg_b(breg + 1)); 1186d9ae7f2bSJakub Kicinski emit_br(nfp_prog, br_mask, insn->off, 0); 1187d9ae7f2bSJakub Kicinski 1188d9ae7f2bSJakub Kicinski return 0; 1189d9ae7f2bSJakub Kicinski } 1190d9ae7f2bSJakub Kicinski 11913119d1fdSJakub Kicinski static void 
wrp_end32(struct nfp_prog *nfp_prog, swreg reg_in, u8 gpr_out) 11923119d1fdSJakub Kicinski { 11933119d1fdSJakub Kicinski emit_ld_field(nfp_prog, reg_both(gpr_out), 0xf, reg_in, 11943119d1fdSJakub Kicinski SHF_SC_R_ROT, 8); 11953119d1fdSJakub Kicinski emit_ld_field(nfp_prog, reg_both(gpr_out), 0x5, reg_a(gpr_out), 11963119d1fdSJakub Kicinski SHF_SC_R_ROT, 16); 11973119d1fdSJakub Kicinski } 11983119d1fdSJakub Kicinski 1199d9ae7f2bSJakub Kicinski /* --- Callbacks --- */ 1200d9ae7f2bSJakub Kicinski static int mov_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1201d9ae7f2bSJakub Kicinski { 1202d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1203b14157eeSJakub Kicinski u8 dst = insn->dst_reg * 2; 1204b14157eeSJakub Kicinski u8 src = insn->src_reg * 2; 1205d9ae7f2bSJakub Kicinski 1206b14157eeSJakub Kicinski if (insn->src_reg == BPF_REG_10) { 1207b14157eeSJakub Kicinski swreg stack_depth_reg; 1208b14157eeSJakub Kicinski 1209b14157eeSJakub Kicinski stack_depth_reg = ur_load_imm_any(nfp_prog, 1210b14157eeSJakub Kicinski nfp_prog->stack_depth, 1211b14157eeSJakub Kicinski stack_imm(nfp_prog)); 1212b14157eeSJakub Kicinski emit_alu(nfp_prog, reg_both(dst), 1213b14157eeSJakub Kicinski stack_reg(nfp_prog), ALU_OP_ADD, stack_depth_reg); 1214b14157eeSJakub Kicinski wrp_immed(nfp_prog, reg_both(dst + 1), 0); 1215b14157eeSJakub Kicinski } else { 1216b14157eeSJakub Kicinski wrp_reg_mov(nfp_prog, dst, src); 1217b14157eeSJakub Kicinski wrp_reg_mov(nfp_prog, dst + 1, src + 1); 1218b14157eeSJakub Kicinski } 1219d9ae7f2bSJakub Kicinski 1220d9ae7f2bSJakub Kicinski return 0; 1221d9ae7f2bSJakub Kicinski } 1222d9ae7f2bSJakub Kicinski 1223d9ae7f2bSJakub Kicinski static int mov_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1224d9ae7f2bSJakub Kicinski { 1225d9ae7f2bSJakub Kicinski u64 imm = meta->insn.imm; /* sign extend */ 1226d9ae7f2bSJakub Kicinski 1227d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2), imm & ~0U); 
1228d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), imm >> 32); 1229d9ae7f2bSJakub Kicinski 1230d9ae7f2bSJakub Kicinski return 0; 1231d9ae7f2bSJakub Kicinski } 1232d9ae7f2bSJakub Kicinski 1233d9ae7f2bSJakub Kicinski static int xor_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1234d9ae7f2bSJakub Kicinski { 1235d9ae7f2bSJakub Kicinski return wrp_alu64_reg(nfp_prog, meta, ALU_OP_XOR); 1236d9ae7f2bSJakub Kicinski } 1237d9ae7f2bSJakub Kicinski 1238d9ae7f2bSJakub Kicinski static int xor_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1239d9ae7f2bSJakub Kicinski { 1240d9ae7f2bSJakub Kicinski return wrp_alu64_imm(nfp_prog, meta, ALU_OP_XOR, !meta->insn.imm); 1241d9ae7f2bSJakub Kicinski } 1242d9ae7f2bSJakub Kicinski 1243d9ae7f2bSJakub Kicinski static int and_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1244d9ae7f2bSJakub Kicinski { 1245d9ae7f2bSJakub Kicinski return wrp_alu64_reg(nfp_prog, meta, ALU_OP_AND); 1246d9ae7f2bSJakub Kicinski } 1247d9ae7f2bSJakub Kicinski 1248d9ae7f2bSJakub Kicinski static int and_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1249d9ae7f2bSJakub Kicinski { 1250d9ae7f2bSJakub Kicinski return wrp_alu64_imm(nfp_prog, meta, ALU_OP_AND, !~meta->insn.imm); 1251d9ae7f2bSJakub Kicinski } 1252d9ae7f2bSJakub Kicinski 1253d9ae7f2bSJakub Kicinski static int or_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1254d9ae7f2bSJakub Kicinski { 1255d9ae7f2bSJakub Kicinski return wrp_alu64_reg(nfp_prog, meta, ALU_OP_OR); 1256d9ae7f2bSJakub Kicinski } 1257d9ae7f2bSJakub Kicinski 1258d9ae7f2bSJakub Kicinski static int or_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1259d9ae7f2bSJakub Kicinski { 1260d9ae7f2bSJakub Kicinski return wrp_alu64_imm(nfp_prog, meta, ALU_OP_OR, !meta->insn.imm); 1261d9ae7f2bSJakub Kicinski } 1262d9ae7f2bSJakub Kicinski 1263d9ae7f2bSJakub Kicinski static int add_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 
1264d9ae7f2bSJakub Kicinski { 1265d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1266d9ae7f2bSJakub Kicinski 1267d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(insn->dst_reg * 2), 1268d9ae7f2bSJakub Kicinski reg_a(insn->dst_reg * 2), ALU_OP_ADD, 1269d9ae7f2bSJakub Kicinski reg_b(insn->src_reg * 2)); 1270d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(insn->dst_reg * 2 + 1), 1271d9ae7f2bSJakub Kicinski reg_a(insn->dst_reg * 2 + 1), ALU_OP_ADD_C, 1272d9ae7f2bSJakub Kicinski reg_b(insn->src_reg * 2 + 1)); 1273d9ae7f2bSJakub Kicinski 1274d9ae7f2bSJakub Kicinski return 0; 1275d9ae7f2bSJakub Kicinski } 1276d9ae7f2bSJakub Kicinski 1277d9ae7f2bSJakub Kicinski static int add_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1278d9ae7f2bSJakub Kicinski { 1279d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1280d9ae7f2bSJakub Kicinski u64 imm = insn->imm; /* sign extend */ 1281d9ae7f2bSJakub Kicinski 1282d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2, ALU_OP_ADD, imm & ~0U); 1283d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2 + 1, ALU_OP_ADD_C, imm >> 32); 1284d9ae7f2bSJakub Kicinski 1285d9ae7f2bSJakub Kicinski return 0; 1286d9ae7f2bSJakub Kicinski } 1287d9ae7f2bSJakub Kicinski 1288d9ae7f2bSJakub Kicinski static int sub_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1289d9ae7f2bSJakub Kicinski { 1290d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1291d9ae7f2bSJakub Kicinski 1292d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(insn->dst_reg * 2), 1293d9ae7f2bSJakub Kicinski reg_a(insn->dst_reg * 2), ALU_OP_SUB, 1294d9ae7f2bSJakub Kicinski reg_b(insn->src_reg * 2)); 1295d9ae7f2bSJakub Kicinski emit_alu(nfp_prog, reg_both(insn->dst_reg * 2 + 1), 1296d9ae7f2bSJakub Kicinski reg_a(insn->dst_reg * 2 + 1), ALU_OP_SUB_C, 1297d9ae7f2bSJakub Kicinski reg_b(insn->src_reg * 2 + 1)); 1298d9ae7f2bSJakub Kicinski 1299d9ae7f2bSJakub Kicinski return 0; 
1300d9ae7f2bSJakub Kicinski } 1301d9ae7f2bSJakub Kicinski 1302d9ae7f2bSJakub Kicinski static int sub_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1303d9ae7f2bSJakub Kicinski { 1304d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1305d9ae7f2bSJakub Kicinski u64 imm = insn->imm; /* sign extend */ 1306d9ae7f2bSJakub Kicinski 1307d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2, ALU_OP_SUB, imm & ~0U); 1308d9ae7f2bSJakub Kicinski wrp_alu_imm(nfp_prog, insn->dst_reg * 2 + 1, ALU_OP_SUB_C, imm >> 32); 1309d9ae7f2bSJakub Kicinski 1310d9ae7f2bSJakub Kicinski return 0; 1311d9ae7f2bSJakub Kicinski } 1312d9ae7f2bSJakub Kicinski 1313254ef4d7SJiong Wang static int neg_reg64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1314254ef4d7SJiong Wang { 1315254ef4d7SJiong Wang const struct bpf_insn *insn = &meta->insn; 1316254ef4d7SJiong Wang 1317254ef4d7SJiong Wang emit_alu(nfp_prog, reg_both(insn->dst_reg * 2), reg_imm(0), 1318254ef4d7SJiong Wang ALU_OP_SUB, reg_b(insn->dst_reg * 2)); 1319254ef4d7SJiong Wang emit_alu(nfp_prog, reg_both(insn->dst_reg * 2 + 1), reg_imm(0), 1320254ef4d7SJiong Wang ALU_OP_SUB_C, reg_b(insn->dst_reg * 2 + 1)); 1321254ef4d7SJiong Wang 1322254ef4d7SJiong Wang return 0; 1323254ef4d7SJiong Wang } 1324254ef4d7SJiong Wang 1325d9ae7f2bSJakub Kicinski static int shl_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1326d9ae7f2bSJakub Kicinski { 1327d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 13283cae1319SJakub Kicinski u8 dst = insn->dst_reg * 2; 1329d9ae7f2bSJakub Kicinski 13303cae1319SJakub Kicinski if (insn->imm < 32) { 13313cae1319SJakub Kicinski emit_shf(nfp_prog, reg_both(dst + 1), 13323cae1319SJakub Kicinski reg_a(dst + 1), SHF_OP_NONE, reg_b(dst), 13333cae1319SJakub Kicinski SHF_SC_R_DSHF, 32 - insn->imm); 13343cae1319SJakub Kicinski emit_shf(nfp_prog, reg_both(dst), 13353cae1319SJakub Kicinski reg_none(), SHF_OP_NONE, reg_b(dst), 13363cae1319SJakub Kicinski 
SHF_SC_L_SHF, insn->imm); 13373cae1319SJakub Kicinski } else if (insn->imm == 32) { 13383cae1319SJakub Kicinski wrp_reg_mov(nfp_prog, dst + 1, dst); 13393cae1319SJakub Kicinski wrp_immed(nfp_prog, reg_both(dst), 0); 13403cae1319SJakub Kicinski } else if (insn->imm > 32) { 13413cae1319SJakub Kicinski emit_shf(nfp_prog, reg_both(dst + 1), 13423cae1319SJakub Kicinski reg_none(), SHF_OP_NONE, reg_b(dst), 13433cae1319SJakub Kicinski SHF_SC_L_SHF, insn->imm - 32); 13443cae1319SJakub Kicinski wrp_immed(nfp_prog, reg_both(dst), 0); 13453cae1319SJakub Kicinski } 1346d9ae7f2bSJakub Kicinski 1347d9ae7f2bSJakub Kicinski return 0; 1348d9ae7f2bSJakub Kicinski } 1349d9ae7f2bSJakub Kicinski 1350d9ae7f2bSJakub Kicinski static int shr_imm64(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1351d9ae7f2bSJakub Kicinski { 1352d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 13533cae1319SJakub Kicinski u8 dst = insn->dst_reg * 2; 1354d9ae7f2bSJakub Kicinski 13553cae1319SJakub Kicinski if (insn->imm < 32) { 13563cae1319SJakub Kicinski emit_shf(nfp_prog, reg_both(dst), 13573cae1319SJakub Kicinski reg_a(dst + 1), SHF_OP_NONE, reg_b(dst), 13583cae1319SJakub Kicinski SHF_SC_R_DSHF, insn->imm); 13593cae1319SJakub Kicinski emit_shf(nfp_prog, reg_both(dst + 1), 13603cae1319SJakub Kicinski reg_none(), SHF_OP_NONE, reg_b(dst + 1), 13613cae1319SJakub Kicinski SHF_SC_R_SHF, insn->imm); 13623cae1319SJakub Kicinski } else if (insn->imm == 32) { 13633cae1319SJakub Kicinski wrp_reg_mov(nfp_prog, dst, dst + 1); 13643cae1319SJakub Kicinski wrp_immed(nfp_prog, reg_both(dst + 1), 0); 13653cae1319SJakub Kicinski } else if (insn->imm > 32) { 13663cae1319SJakub Kicinski emit_shf(nfp_prog, reg_both(dst), 13673cae1319SJakub Kicinski reg_none(), SHF_OP_NONE, reg_b(dst + 1), 13683cae1319SJakub Kicinski SHF_SC_R_SHF, insn->imm - 32); 13693cae1319SJakub Kicinski wrp_immed(nfp_prog, reg_both(dst + 1), 0); 13703cae1319SJakub Kicinski } 1371d9ae7f2bSJakub Kicinski 1372d9ae7f2bSJakub Kicinski 
return 0; 1373d9ae7f2bSJakub Kicinski } 1374d9ae7f2bSJakub Kicinski 1375d9ae7f2bSJakub Kicinski static int mov_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1376d9ae7f2bSJakub Kicinski { 1377d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1378d9ae7f2bSJakub Kicinski 1379d9ae7f2bSJakub Kicinski wrp_reg_mov(nfp_prog, insn->dst_reg * 2, insn->src_reg * 2); 1380d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(insn->dst_reg * 2 + 1), 0); 1381d9ae7f2bSJakub Kicinski 1382d9ae7f2bSJakub Kicinski return 0; 1383d9ae7f2bSJakub Kicinski } 1384d9ae7f2bSJakub Kicinski 1385d9ae7f2bSJakub Kicinski static int mov_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1386d9ae7f2bSJakub Kicinski { 1387d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1388d9ae7f2bSJakub Kicinski 1389d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(insn->dst_reg * 2), insn->imm); 1390d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(insn->dst_reg * 2 + 1), 0); 1391d9ae7f2bSJakub Kicinski 1392d9ae7f2bSJakub Kicinski return 0; 1393d9ae7f2bSJakub Kicinski } 1394d9ae7f2bSJakub Kicinski 1395d9ae7f2bSJakub Kicinski static int xor_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1396d9ae7f2bSJakub Kicinski { 1397d9ae7f2bSJakub Kicinski return wrp_alu32_reg(nfp_prog, meta, ALU_OP_XOR); 1398d9ae7f2bSJakub Kicinski } 1399d9ae7f2bSJakub Kicinski 1400d9ae7f2bSJakub Kicinski static int xor_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1401d9ae7f2bSJakub Kicinski { 1402d9ae7f2bSJakub Kicinski return wrp_alu32_imm(nfp_prog, meta, ALU_OP_XOR, !~meta->insn.imm); 1403d9ae7f2bSJakub Kicinski } 1404d9ae7f2bSJakub Kicinski 1405d9ae7f2bSJakub Kicinski static int and_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1406d9ae7f2bSJakub Kicinski { 1407d9ae7f2bSJakub Kicinski return wrp_alu32_reg(nfp_prog, meta, ALU_OP_AND); 1408d9ae7f2bSJakub Kicinski } 1409d9ae7f2bSJakub Kicinski 1410d9ae7f2bSJakub Kicinski static int 
and_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1411d9ae7f2bSJakub Kicinski { 1412d9ae7f2bSJakub Kicinski return wrp_alu32_imm(nfp_prog, meta, ALU_OP_AND, !~meta->insn.imm); 1413d9ae7f2bSJakub Kicinski } 1414d9ae7f2bSJakub Kicinski 1415d9ae7f2bSJakub Kicinski static int or_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1416d9ae7f2bSJakub Kicinski { 1417d9ae7f2bSJakub Kicinski return wrp_alu32_reg(nfp_prog, meta, ALU_OP_OR); 1418d9ae7f2bSJakub Kicinski } 1419d9ae7f2bSJakub Kicinski 1420d9ae7f2bSJakub Kicinski static int or_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1421d9ae7f2bSJakub Kicinski { 1422d9ae7f2bSJakub Kicinski return wrp_alu32_imm(nfp_prog, meta, ALU_OP_OR, !meta->insn.imm); 1423d9ae7f2bSJakub Kicinski } 1424d9ae7f2bSJakub Kicinski 1425d9ae7f2bSJakub Kicinski static int add_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1426d9ae7f2bSJakub Kicinski { 1427d9ae7f2bSJakub Kicinski return wrp_alu32_reg(nfp_prog, meta, ALU_OP_ADD); 1428d9ae7f2bSJakub Kicinski } 1429d9ae7f2bSJakub Kicinski 1430d9ae7f2bSJakub Kicinski static int add_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1431d9ae7f2bSJakub Kicinski { 1432d9ae7f2bSJakub Kicinski return wrp_alu32_imm(nfp_prog, meta, ALU_OP_ADD, !meta->insn.imm); 1433d9ae7f2bSJakub Kicinski } 1434d9ae7f2bSJakub Kicinski 1435d9ae7f2bSJakub Kicinski static int sub_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1436d9ae7f2bSJakub Kicinski { 1437d9ae7f2bSJakub Kicinski return wrp_alu32_reg(nfp_prog, meta, ALU_OP_SUB); 1438d9ae7f2bSJakub Kicinski } 1439d9ae7f2bSJakub Kicinski 1440d9ae7f2bSJakub Kicinski static int sub_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1441d9ae7f2bSJakub Kicinski { 1442d9ae7f2bSJakub Kicinski return wrp_alu32_imm(nfp_prog, meta, ALU_OP_SUB, !meta->insn.imm); 1443d9ae7f2bSJakub Kicinski } 1444d9ae7f2bSJakub Kicinski 1445254ef4d7SJiong Wang static int neg_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 
1446254ef4d7SJiong Wang { 1447254ef4d7SJiong Wang u8 dst = meta->insn.dst_reg * 2; 1448254ef4d7SJiong Wang 1449254ef4d7SJiong Wang emit_alu(nfp_prog, reg_both(dst), reg_imm(0), ALU_OP_SUB, reg_b(dst)); 1450254ef4d7SJiong Wang wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), 0); 1451254ef4d7SJiong Wang 1452254ef4d7SJiong Wang return 0; 1453254ef4d7SJiong Wang } 1454254ef4d7SJiong Wang 1455d9ae7f2bSJakub Kicinski static int shl_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1456d9ae7f2bSJakub Kicinski { 1457d9ae7f2bSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 1458d9ae7f2bSJakub Kicinski 1459d9ae7f2bSJakub Kicinski if (!insn->imm) 1460d9ae7f2bSJakub Kicinski return 1; /* TODO: zero shift means indirect */ 1461d9ae7f2bSJakub Kicinski 1462d9ae7f2bSJakub Kicinski emit_shf(nfp_prog, reg_both(insn->dst_reg * 2), 1463d9ae7f2bSJakub Kicinski reg_none(), SHF_OP_NONE, reg_b(insn->dst_reg * 2), 1464d9ae7f2bSJakub Kicinski SHF_SC_L_SHF, insn->imm); 1465d9ae7f2bSJakub Kicinski wrp_immed(nfp_prog, reg_both(insn->dst_reg * 2 + 1), 0); 1466d9ae7f2bSJakub Kicinski 1467d9ae7f2bSJakub Kicinski return 0; 1468d9ae7f2bSJakub Kicinski } 1469d9ae7f2bSJakub Kicinski 14703119d1fdSJakub Kicinski static int end_reg32(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 14713119d1fdSJakub Kicinski { 14723119d1fdSJakub Kicinski const struct bpf_insn *insn = &meta->insn; 14733119d1fdSJakub Kicinski u8 gpr = insn->dst_reg * 2; 14743119d1fdSJakub Kicinski 14753119d1fdSJakub Kicinski switch (insn->imm) { 14763119d1fdSJakub Kicinski case 16: 14773119d1fdSJakub Kicinski emit_ld_field(nfp_prog, reg_both(gpr), 0x9, reg_b(gpr), 14783119d1fdSJakub Kicinski SHF_SC_R_ROT, 8); 14793119d1fdSJakub Kicinski emit_ld_field(nfp_prog, reg_both(gpr), 0xe, reg_a(gpr), 14803119d1fdSJakub Kicinski SHF_SC_R_SHF, 16); 14813119d1fdSJakub Kicinski 14823119d1fdSJakub Kicinski wrp_immed(nfp_prog, reg_both(gpr + 1), 0); 14833119d1fdSJakub Kicinski break; 14843119d1fdSJakub Kicinski case 32: 
14853119d1fdSJakub Kicinski wrp_end32(nfp_prog, reg_a(gpr), gpr); 14863119d1fdSJakub Kicinski wrp_immed(nfp_prog, reg_both(gpr + 1), 0); 14873119d1fdSJakub Kicinski break; 14883119d1fdSJakub Kicinski case 64: 14893119d1fdSJakub Kicinski wrp_mov(nfp_prog, imm_a(nfp_prog), reg_b(gpr + 1)); 14903119d1fdSJakub Kicinski 14913119d1fdSJakub Kicinski wrp_end32(nfp_prog, reg_a(gpr), gpr + 1); 14923119d1fdSJakub Kicinski wrp_end32(nfp_prog, imm_a(nfp_prog), gpr); 14933119d1fdSJakub Kicinski break; 14943119d1fdSJakub Kicinski } 14953119d1fdSJakub Kicinski 14963119d1fdSJakub Kicinski return 0; 14973119d1fdSJakub Kicinski } 14983119d1fdSJakub Kicinski 1499d9ae7f2bSJakub Kicinski static int imm_ld8_part2(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1500d9ae7f2bSJakub Kicinski { 15019f16c8abSJakub Kicinski struct nfp_insn_meta *prev = nfp_meta_prev(meta); 15029f16c8abSJakub Kicinski u32 imm_lo, imm_hi; 15039f16c8abSJakub Kicinski u8 dst; 15049f16c8abSJakub Kicinski 15059f16c8abSJakub Kicinski dst = prev->insn.dst_reg * 2; 15069f16c8abSJakub Kicinski imm_lo = prev->insn.imm; 15079f16c8abSJakub Kicinski imm_hi = meta->insn.imm; 15089f16c8abSJakub Kicinski 15099f16c8abSJakub Kicinski wrp_immed(nfp_prog, reg_both(dst), imm_lo); 15109f16c8abSJakub Kicinski 15119f16c8abSJakub Kicinski /* mov is always 1 insn, load imm may be two, so try to use mov */ 15129f16c8abSJakub Kicinski if (imm_hi == imm_lo) 15139f16c8abSJakub Kicinski wrp_mov(nfp_prog, reg_both(dst + 1), reg_a(dst)); 15149f16c8abSJakub Kicinski else 15159f16c8abSJakub Kicinski wrp_immed(nfp_prog, reg_both(dst + 1), imm_hi); 1516d9ae7f2bSJakub Kicinski 1517d9ae7f2bSJakub Kicinski return 0; 1518d9ae7f2bSJakub Kicinski } 1519d9ae7f2bSJakub Kicinski 1520d9ae7f2bSJakub Kicinski static int imm_ld8(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1521d9ae7f2bSJakub Kicinski { 1522d9ae7f2bSJakub Kicinski meta->double_cb = imm_ld8_part2; 1523d9ae7f2bSJakub Kicinski return 0; 1524d9ae7f2bSJakub Kicinski } 
1525d9ae7f2bSJakub Kicinski 1526d9ae7f2bSJakub Kicinski static int data_ld1(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1527d9ae7f2bSJakub Kicinski { 1528d9ae7f2bSJakub Kicinski return construct_data_ld(nfp_prog, meta->insn.imm, 1); 1529d9ae7f2bSJakub Kicinski } 1530d9ae7f2bSJakub Kicinski 1531d9ae7f2bSJakub Kicinski static int data_ld2(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1532d9ae7f2bSJakub Kicinski { 1533d9ae7f2bSJakub Kicinski return construct_data_ld(nfp_prog, meta->insn.imm, 2); 1534d9ae7f2bSJakub Kicinski } 1535d9ae7f2bSJakub Kicinski 1536d9ae7f2bSJakub Kicinski static int data_ld4(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1537d9ae7f2bSJakub Kicinski { 1538d9ae7f2bSJakub Kicinski return construct_data_ld(nfp_prog, meta->insn.imm, 4); 1539d9ae7f2bSJakub Kicinski } 1540d9ae7f2bSJakub Kicinski 1541d9ae7f2bSJakub Kicinski static int data_ind_ld1(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1542d9ae7f2bSJakub Kicinski { 1543d9ae7f2bSJakub Kicinski return construct_data_ind_ld(nfp_prog, meta->insn.imm, 15440a793977SJakub Kicinski meta->insn.src_reg * 2, 1); 1545d9ae7f2bSJakub Kicinski } 1546d9ae7f2bSJakub Kicinski 1547d9ae7f2bSJakub Kicinski static int data_ind_ld2(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1548d9ae7f2bSJakub Kicinski { 1549d9ae7f2bSJakub Kicinski return construct_data_ind_ld(nfp_prog, meta->insn.imm, 15500a793977SJakub Kicinski meta->insn.src_reg * 2, 2); 1551d9ae7f2bSJakub Kicinski } 1552d9ae7f2bSJakub Kicinski 1553d9ae7f2bSJakub Kicinski static int data_ind_ld4(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1554d9ae7f2bSJakub Kicinski { 1555d9ae7f2bSJakub Kicinski return construct_data_ind_ld(nfp_prog, meta->insn.imm, 15560a793977SJakub Kicinski meta->insn.src_reg * 2, 4); 1557d9ae7f2bSJakub Kicinski } 1558d9ae7f2bSJakub Kicinski 1559a82b23fbSJakub Kicinski static int 1560a82b23fbSJakub Kicinski mem_ldx_stack(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 
1561d3488480SJakub Kicinski unsigned int size, unsigned int ptr_off) 1562a82b23fbSJakub Kicinski { 1563d3488480SJakub Kicinski return mem_op_stack(nfp_prog, meta, size, ptr_off, 1564b14157eeSJakub Kicinski meta->insn.dst_reg * 2, meta->insn.src_reg * 2, 1565b14157eeSJakub Kicinski true, wrp_lmem_load); 1566a82b23fbSJakub Kicinski } 1567a82b23fbSJakub Kicinski 1568943c57b9SJakub Kicinski static int mem_ldx_skb(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1569943c57b9SJakub Kicinski u8 size) 1570d9ae7f2bSJakub Kicinski { 1571bfddbc8aSJakub Kicinski swreg dst = reg_both(meta->insn.dst_reg * 2); 1572bfddbc8aSJakub Kicinski 1573943c57b9SJakub Kicinski switch (meta->insn.off) { 1574c6c580d7SJakub Kicinski case offsetof(struct __sk_buff, len): 1575c6c580d7SJakub Kicinski if (size != FIELD_SIZEOF(struct __sk_buff, len)) 1576943c57b9SJakub Kicinski return -EOPNOTSUPP; 1577bfddbc8aSJakub Kicinski wrp_mov(nfp_prog, dst, plen_reg(nfp_prog)); 1578bfddbc8aSJakub Kicinski break; 1579c6c580d7SJakub Kicinski case offsetof(struct __sk_buff, data): 1580c6c580d7SJakub Kicinski if (size != FIELD_SIZEOF(struct __sk_buff, data)) 1581bfddbc8aSJakub Kicinski return -EOPNOTSUPP; 1582bfddbc8aSJakub Kicinski wrp_mov(nfp_prog, dst, pptr_reg(nfp_prog)); 1583bfddbc8aSJakub Kicinski break; 1584c6c580d7SJakub Kicinski case offsetof(struct __sk_buff, data_end): 1585c6c580d7SJakub Kicinski if (size != FIELD_SIZEOF(struct __sk_buff, data_end)) 1586bfddbc8aSJakub Kicinski return -EOPNOTSUPP; 1587bfddbc8aSJakub Kicinski emit_alu(nfp_prog, dst, 1588bfddbc8aSJakub Kicinski plen_reg(nfp_prog), ALU_OP_ADD, pptr_reg(nfp_prog)); 1589943c57b9SJakub Kicinski break; 1590943c57b9SJakub Kicinski default: 1591d9ae7f2bSJakub Kicinski return -EOPNOTSUPP; 1592943c57b9SJakub Kicinski } 1593943c57b9SJakub Kicinski 1594943c57b9SJakub Kicinski wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), 0); 1595d9ae7f2bSJakub Kicinski 1596d9ae7f2bSJakub Kicinski return 0; 1597d9ae7f2bSJakub Kicinski } 
1598d9ae7f2bSJakub Kicinski 1599943c57b9SJakub Kicinski static int mem_ldx_xdp(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1600943c57b9SJakub Kicinski u8 size) 1601d9ae7f2bSJakub Kicinski { 1602b3f868dfSJakub Kicinski swreg dst = reg_both(meta->insn.dst_reg * 2); 1603d9ae7f2bSJakub Kicinski 1604943c57b9SJakub Kicinski switch (meta->insn.off) { 1605c6c580d7SJakub Kicinski case offsetof(struct xdp_md, data): 1606c6c580d7SJakub Kicinski if (size != FIELD_SIZEOF(struct xdp_md, data)) 1607c6c580d7SJakub Kicinski return -EOPNOTSUPP; 1608c000dfb5SJakub Kicinski wrp_mov(nfp_prog, dst, pptr_reg(nfp_prog)); 1609943c57b9SJakub Kicinski break; 1610c6c580d7SJakub Kicinski case offsetof(struct xdp_md, data_end): 1611c6c580d7SJakub Kicinski if (size != FIELD_SIZEOF(struct xdp_md, data_end)) 1612c6c580d7SJakub Kicinski return -EOPNOTSUPP; 1613943c57b9SJakub Kicinski emit_alu(nfp_prog, dst, 1614943c57b9SJakub Kicinski plen_reg(nfp_prog), ALU_OP_ADD, pptr_reg(nfp_prog)); 1615943c57b9SJakub Kicinski break; 1616943c57b9SJakub Kicinski default: 1617943c57b9SJakub Kicinski return -EOPNOTSUPP; 1618943c57b9SJakub Kicinski } 1619d9ae7f2bSJakub Kicinski 1620943c57b9SJakub Kicinski wrp_immed(nfp_prog, reg_both(meta->insn.dst_reg * 2 + 1), 0); 1621d9ae7f2bSJakub Kicinski 1622d9ae7f2bSJakub Kicinski return 0; 1623d9ae7f2bSJakub Kicinski } 1624d9ae7f2bSJakub Kicinski 16252ca71441SJakub Kicinski static int 16262ca71441SJakub Kicinski mem_ldx_data(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 16272ca71441SJakub Kicinski unsigned int size) 16282ca71441SJakub Kicinski { 16292ca71441SJakub Kicinski swreg tmp_reg; 16302ca71441SJakub Kicinski 16312ca71441SJakub Kicinski tmp_reg = re_load_imm_any(nfp_prog, meta->insn.off, imm_b(nfp_prog)); 16322ca71441SJakub Kicinski 16332ca71441SJakub Kicinski return data_ld_host_order(nfp_prog, meta->insn.src_reg * 2, tmp_reg, 16342ca71441SJakub Kicinski meta->insn.dst_reg * 2, size); 16352ca71441SJakub Kicinski } 16362ca71441SJakub Kicinski 
16372ca71441SJakub Kicinski static int 16382ca71441SJakub Kicinski mem_ldx(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 16392ca71441SJakub Kicinski unsigned int size) 16402ca71441SJakub Kicinski { 16419879a381SJiong Wang if (meta->ldst_gather_len) 16429879a381SJiong Wang return nfp_cpp_memcpy(nfp_prog, meta); 16439879a381SJiong Wang 16442ca71441SJakub Kicinski if (meta->ptr.type == PTR_TO_CTX) { 1645012bb8a8SJakub Kicinski if (nfp_prog->type == BPF_PROG_TYPE_XDP) 16462ca71441SJakub Kicinski return mem_ldx_xdp(nfp_prog, meta, size); 16472ca71441SJakub Kicinski else 16482ca71441SJakub Kicinski return mem_ldx_skb(nfp_prog, meta, size); 16492ca71441SJakub Kicinski } 16502ca71441SJakub Kicinski 16512ca71441SJakub Kicinski if (meta->ptr.type == PTR_TO_PACKET) 16522ca71441SJakub Kicinski return mem_ldx_data(nfp_prog, meta, size); 16532ca71441SJakub Kicinski 1654a82b23fbSJakub Kicinski if (meta->ptr.type == PTR_TO_STACK) 1655d3488480SJakub Kicinski return mem_ldx_stack(nfp_prog, meta, size, 1656d3488480SJakub Kicinski meta->ptr.off + meta->ptr.var_off.value); 1657a82b23fbSJakub Kicinski 16582ca71441SJakub Kicinski return -EOPNOTSUPP; 16592ca71441SJakub Kicinski } 16602ca71441SJakub Kicinski 16612ca71441SJakub Kicinski static int mem_ldx1(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 16622ca71441SJakub Kicinski { 16632ca71441SJakub Kicinski return mem_ldx(nfp_prog, meta, 1); 16642ca71441SJakub Kicinski } 16652ca71441SJakub Kicinski 16662ca71441SJakub Kicinski static int mem_ldx2(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 16672ca71441SJakub Kicinski { 16682ca71441SJakub Kicinski return mem_ldx(nfp_prog, meta, 2); 16692ca71441SJakub Kicinski } 16702ca71441SJakub Kicinski 1671d9ae7f2bSJakub Kicinski static int mem_ldx4(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1672d9ae7f2bSJakub Kicinski { 16732ca71441SJakub Kicinski return mem_ldx(nfp_prog, meta, 4); 16742ca71441SJakub Kicinski } 16752ca71441SJakub Kicinski 16762ca71441SJakub 
Kicinski static int mem_ldx8(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 16772ca71441SJakub Kicinski { 16782ca71441SJakub Kicinski return mem_ldx(nfp_prog, meta, 8); 1679d9ae7f2bSJakub Kicinski } 1680d9ae7f2bSJakub Kicinski 1681e663fe38SJakub Kicinski static int 1682e663fe38SJakub Kicinski mem_st_data(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1683e663fe38SJakub Kicinski unsigned int size) 1684d9ae7f2bSJakub Kicinski { 1685e663fe38SJakub Kicinski u64 imm = meta->insn.imm; /* sign extend */ 1686e663fe38SJakub Kicinski swreg off_reg; 1687e663fe38SJakub Kicinski 1688e663fe38SJakub Kicinski off_reg = re_load_imm_any(nfp_prog, meta->insn.off, imm_b(nfp_prog)); 1689e663fe38SJakub Kicinski 1690e663fe38SJakub Kicinski return data_st_host_order(nfp_prog, meta->insn.dst_reg * 2, off_reg, 1691e663fe38SJakub Kicinski imm, size); 1692e663fe38SJakub Kicinski } 1693e663fe38SJakub Kicinski 1694e663fe38SJakub Kicinski static int mem_st(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1695e663fe38SJakub Kicinski unsigned int size) 1696e663fe38SJakub Kicinski { 1697e663fe38SJakub Kicinski if (meta->ptr.type == PTR_TO_PACKET) 1698e663fe38SJakub Kicinski return mem_st_data(nfp_prog, meta, size); 1699e663fe38SJakub Kicinski 1700d9ae7f2bSJakub Kicinski return -EOPNOTSUPP; 1701d9ae7f2bSJakub Kicinski } 1702d9ae7f2bSJakub Kicinski 1703e663fe38SJakub Kicinski static int mem_st1(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1704d9ae7f2bSJakub Kicinski { 1705e663fe38SJakub Kicinski return mem_st(nfp_prog, meta, 1); 1706e663fe38SJakub Kicinski } 1707e663fe38SJakub Kicinski 1708e663fe38SJakub Kicinski static int mem_st2(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1709e663fe38SJakub Kicinski { 1710e663fe38SJakub Kicinski return mem_st(nfp_prog, meta, 2); 1711e663fe38SJakub Kicinski } 1712e663fe38SJakub Kicinski 1713e663fe38SJakub Kicinski static int mem_st4(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1714e663fe38SJakub Kicinski { 
1715e663fe38SJakub Kicinski return mem_st(nfp_prog, meta, 4); 1716e663fe38SJakub Kicinski } 1717e663fe38SJakub Kicinski 1718e663fe38SJakub Kicinski static int mem_st8(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta) 1719e663fe38SJakub Kicinski { 1720e663fe38SJakub Kicinski return mem_st(nfp_prog, meta, 8); 1721e663fe38SJakub Kicinski } 1722e663fe38SJakub Kicinski 1723e663fe38SJakub Kicinski static int 1724e663fe38SJakub Kicinski mem_stx_data(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1725e663fe38SJakub Kicinski unsigned int size) 1726e663fe38SJakub Kicinski { 1727e663fe38SJakub Kicinski swreg off_reg; 1728e663fe38SJakub Kicinski 1729e663fe38SJakub Kicinski off_reg = re_load_imm_any(nfp_prog, meta->insn.off, imm_b(nfp_prog)); 1730e663fe38SJakub Kicinski 1731e663fe38SJakub Kicinski return data_stx_host_order(nfp_prog, meta->insn.dst_reg * 2, off_reg, 1732e663fe38SJakub Kicinski meta->insn.src_reg * 2, size); 1733e663fe38SJakub Kicinski } 1734e663fe38SJakub Kicinski 1735e663fe38SJakub Kicinski static int 1736ee9133a8SJakub Kicinski mem_stx_stack(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1737d3488480SJakub Kicinski unsigned int size, unsigned int ptr_off) 1738ee9133a8SJakub Kicinski { 1739d3488480SJakub Kicinski return mem_op_stack(nfp_prog, meta, size, ptr_off, 1740b14157eeSJakub Kicinski meta->insn.src_reg * 2, meta->insn.dst_reg * 2, 1741b14157eeSJakub Kicinski false, wrp_lmem_store); 1742ee9133a8SJakub Kicinski } 1743ee9133a8SJakub Kicinski 1744ee9133a8SJakub Kicinski static int 1745e663fe38SJakub Kicinski mem_stx(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta, 1746e663fe38SJakub Kicinski unsigned int size) 1747e663fe38SJakub Kicinski { 1748e663fe38SJakub Kicinski if (meta->ptr.type == PTR_TO_PACKET) 1749e663fe38SJakub Kicinski return mem_stx_data(nfp_prog, meta, size); 1750e663fe38SJakub Kicinski 1751ee9133a8SJakub Kicinski if (meta->ptr.type == PTR_TO_STACK) 1752d3488480SJakub Kicinski return mem_stx_stack(nfp_prog, meta, 
size,
				     meta->ptr.off + meta->ptr.var_off.value);

	return -EOPNOTSUPP;
}

/* BPF_STX | BPF_MEM handlers (see instr_cb[]).  Each one is a thin wrapper
 * which forwards to mem_stx() with the access size: 1 for BPF_B, 2 for
 * BPF_H, 4 for BPF_W and 8 for BPF_DW.
 */
static int mem_stx1(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return mem_stx(nfp_prog, meta, 1);
}

static int mem_stx2(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return mem_stx(nfp_prog, meta, 2);
}

static int mem_stx4(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return mem_stx(nfp_prog, meta, 4);
}

static int mem_stx8(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return mem_stx(nfp_prog, meta, 8);
}

/* BPF_JMP | BPF_JA: emit an unconditional branch (BR_UNC).
 *
 * The BPF jump offset is only passed through here; the address fields of
 * the emitted branch are rewritten by nfp_fixup_branches() once the offsets
 * of all translated instructions are known.
 *
 * Always returns 0.
 */
static int jump(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	emit_br(nfp_prog, BR_UNC, meta->insn.off, 0);

	return 0;
}

/* BPF_JMP | BPF_JEQ | BPF_K: compare the 64-bit dst register with the
 * sign-extended 32-bit immediate.
 *
 * A BPF register is addressed as two 32-bit halves: index dst_reg * 2 is
 * paired with the low 32 bits of the immediate and dst_reg * 2 + 1 with the
 * high 32 bits.  Each half is XORed with the matching half of the immediate
 * and the two results are ORed; the OR only sets condition codes
 * (destination is reg_none()) and is followed by a BR_BEQ branch.
 *
 * Always returns 0.
 */
static int jeq_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	const struct bpf_insn *insn = &meta->insn;
	u64 imm = insn->imm; /* sign extend */
	swreg or1, or2, tmp_reg;

	/* Default to ORing the raw register halves; a half is only replaced
	 * by an XOR result when the matching half of the immediate is
	 * non-zero (XOR with zero would leave the register value unchanged).
	 */
	or1 = reg_a(insn->dst_reg * 2);
	or2 = reg_b(insn->dst_reg * 2 + 1);

	if (imm & ~0U) {
		tmp_reg = ur_load_imm_any(nfp_prog, imm & ~0U, imm_b(nfp_prog));
		emit_alu(nfp_prog, imm_a(nfp_prog),
			 reg_a(insn->dst_reg * 2), ALU_OP_XOR, tmp_reg);
		or1 = imm_a(nfp_prog);
	}

	if (imm >> 32) {
		tmp_reg = ur_load_imm_any(nfp_prog, imm >> 32, imm_b(nfp_prog));
		emit_alu(nfp_prog, imm_b(nfp_prog),
			 reg_a(insn->dst_reg * 2 + 1), ALU_OP_XOR, tmp_reg);
		or2 = imm_b(nfp_prog);
	}

	emit_alu(nfp_prog, reg_none(), or1, ALU_OP_OR, or2);
	emit_br(nfp_prog, BR_BEQ, insn->off, 0);

	return 0;
}

/* BPF_JGT/JGE/JLT/JLE | BPF_K handlers.  All four delegate to wrp_cmp_imm()
 * and differ only in the branch condition and in the trailing flag.
 * NOTE(review): the flag presumably asks wrp_cmp_imm() to swap the compare
 * operands (JGT reuses BR_BLO and JLE reuses BR_BHS with the flag set) -
 * confirm against wrp_cmp_imm().
 */
static int jgt_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_imm(nfp_prog, meta, BR_BLO, true);
}

static int jge_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_imm(nfp_prog, meta, BR_BHS, false);
}

static int jlt_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_imm(nfp_prog, meta, BR_BLO, false);
}

static int jle_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_imm(nfp_prog, meta, BR_BHS, true);
}

/* BPF_JMP | BPF_JSET | BPF_K: branch on the AND of the dst register and the
 * sign-extended immediate.
 *
 * For every non-zero 32-bit half of the immediate an AND with the matching
 * register half is emitted (condition codes only), each followed by its own
 * BR_BNE branch.
 *
 * Always returns 0.
 */
static int jset_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	const struct bpf_insn *insn = &meta->insn;
	u64 imm = insn->imm; /* sign extend */
	swreg tmp_reg;

	/* AND with zero can never produce a set bit: emit nothing and mark
	 * the instruction as skipped.
	 */
	if (!imm) {
		meta->skip = true;
		return 0;
	}

	if (imm & ~0U) {
		tmp_reg = ur_load_imm_any(nfp_prog, imm & ~0U, imm_b(nfp_prog));
		emit_alu(nfp_prog, reg_none(),
			 reg_a(insn->dst_reg * 2), ALU_OP_AND, tmp_reg);
		emit_br(nfp_prog, BR_BNE, insn->off, 0);
	}

	if (imm >> 32) {
		tmp_reg = ur_load_imm_any(nfp_prog, imm >> 32, imm_b(nfp_prog));
		emit_alu(nfp_prog, reg_none(),
			 reg_a(insn->dst_reg * 2 + 1), ALU_OP_AND, tmp_reg);
		emit_br(nfp_prog, BR_BNE, insn->off, 0);
	}

	return 0;
}

/* BPF_JMP | BPF_JNE | BPF_K: compare the dst register with the sign-extended
 * immediate and branch with BR_BNE.
 *
 * Always returns 0.
 */
static int jne_imm(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	const struct bpf_insn *insn = &meta->insn;
	u64 imm = insn->imm; /* sign extend */
	swreg tmp_reg;

	/* Comparing against zero needs no immediate load: OR the two halves
	 * of the register together and branch on the result.
	 */
	if (!imm) {
		emit_alu(nfp_prog, reg_none(), reg_a(insn->dst_reg * 2),
			 ALU_OP_OR, reg_b(insn->dst_reg * 2 + 1));
		emit_br(nfp_prog, BR_BNE, insn->off, 0);
		return 0;
	}

	/* Otherwise test each half separately, a branch follows each XOR */
	tmp_reg = ur_load_imm_any(nfp_prog, imm & ~0U, imm_b(nfp_prog));
	emit_alu(nfp_prog, reg_none(),
		 reg_a(insn->dst_reg * 2), ALU_OP_XOR, tmp_reg);
	emit_br(nfp_prog, BR_BNE, insn->off, 0);

	tmp_reg = ur_load_imm_any(nfp_prog, imm >> 32, imm_b(nfp_prog));
	emit_alu(nfp_prog, reg_none(),
		 reg_a(insn->dst_reg * 2 + 1), ALU_OP_XOR, tmp_reg);
	emit_br(nfp_prog, BR_BNE, insn->off, 0);

	return 0;
}

/* BPF_JMP | BPF_JEQ | BPF_X: XOR the matching halves of the dst and src
 * registers into imm_a/imm_b, OR the two results (condition codes only) and
 * emit a BR_BEQ branch.
 *
 * Always returns 0.
 */
static int jeq_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	const struct bpf_insn *insn = &meta->insn;

	emit_alu(nfp_prog, imm_a(nfp_prog), reg_a(insn->dst_reg * 2),
		 ALU_OP_XOR, reg_b(insn->src_reg * 2));
	emit_alu(nfp_prog, imm_b(nfp_prog), reg_a(insn->dst_reg * 2 + 1),
		 ALU_OP_XOR, reg_b(insn->src_reg * 2 + 1));
	emit_alu(nfp_prog, reg_none(),
		 imm_a(nfp_prog), ALU_OP_OR, imm_b(nfp_prog));
	emit_br(nfp_prog, BR_BEQ, insn->off, 0);

	return 0;
}

/* BPF_JGT/JGE/JLT/JLE | BPF_X handlers.  Register counterparts of the
 * *_imm handlers above, using the same condition/flag pairs but delegating
 * to wrp_cmp_reg().
 */
static int jgt_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_reg(nfp_prog, meta, BR_BLO, true);
}

static int jge_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_reg(nfp_prog, meta, BR_BHS, false);
}

static int jlt_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_reg(nfp_prog, meta, BR_BLO, false);
}

static int jle_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_cmp_reg(nfp_prog, meta, BR_BHS, true);
}

/* BPF_JMP | BPF_JSET | BPF_X: delegate to wrp_test_reg() with an AND test
 * and a BR_BNE branch.
 */
static int jset_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_test_reg(nfp_prog, meta, ALU_OP_AND, BR_BNE);
}

/* BPF_JMP | BPF_JNE | BPF_X: delegate to wrp_test_reg() with an XOR test
 * and a BR_BNE branch.
 */
static int jne_reg(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	return wrp_test_reg(nfp_prog, meta, ALU_OP_XOR, BR_BNE);
}

/* BPF_JMP | BPF_EXIT: emit an unconditional branch tagged OP_BR_GO_OUT.
 * nfp_fixup_branches() later points every such branch at nfp_prog->tgt_out.
 *
 * Always returns 0.
 */
static int goto_out(struct nfp_prog *nfp_prog, struct nfp_insn_meta *meta)
{
	wrp_br_special(nfp_prog, BR_UNC, OP_BR_GO_OUT);

	return 0;
}

/* Translation callbacks, indexed by the BPF opcode byte (insn.code).
 * Opcodes which are not listed are left NULL; nfp_translate() fails with
 * -ENOENT when it ends up with a NULL callback.
 */
static const instr_cb_t instr_cb[256] = {
	[BPF_ALU64 | BPF_MOV | BPF_X] =	mov_reg64,
	[BPF_ALU64 | BPF_MOV | BPF_K] =	mov_imm64,
	[BPF_ALU64 | BPF_XOR | BPF_X] =	xor_reg64,
	[BPF_ALU64 | BPF_XOR | BPF_K] =	xor_imm64,
	[BPF_ALU64 | BPF_AND | BPF_X] =	and_reg64,
	[BPF_ALU64 | BPF_AND | BPF_K] =	and_imm64,
	[BPF_ALU64 | BPF_OR | BPF_X] =	or_reg64,
	[BPF_ALU64 | BPF_OR | BPF_K] =	or_imm64,
	[BPF_ALU64 | BPF_ADD | BPF_X] =	add_reg64,
	[BPF_ALU64 | BPF_ADD | BPF_K] =	add_imm64,
	[BPF_ALU64 | BPF_SUB | BPF_X] =	sub_reg64,
	[BPF_ALU64 | BPF_SUB | BPF_K] =	sub_imm64,
	[BPF_ALU64 | BPF_NEG] =		neg_reg64,
	[BPF_ALU64 | BPF_LSH | BPF_K] =	shl_imm64,
	[BPF_ALU64 | BPF_RSH | BPF_K] =	shr_imm64,
	[BPF_ALU | BPF_MOV | BPF_X] =	mov_reg,
	[BPF_ALU | BPF_MOV | BPF_K] =	mov_imm,
	[BPF_ALU | BPF_XOR | BPF_X] =	xor_reg,
	[BPF_ALU | BPF_XOR | BPF_K] =	xor_imm,
	[BPF_ALU | BPF_AND | BPF_X] =	and_reg,
	[BPF_ALU | BPF_AND | BPF_K] =	and_imm,
	[BPF_ALU | BPF_OR | BPF_X] =	or_reg,
	[BPF_ALU | BPF_OR | BPF_K] =	or_imm,
	[BPF_ALU | BPF_ADD | BPF_X] =	add_reg,
	[BPF_ALU | BPF_ADD | BPF_K] =	add_imm,
	[BPF_ALU | BPF_SUB | BPF_X] =	sub_reg,
	[BPF_ALU | BPF_SUB | BPF_K] =	sub_imm,
	[BPF_ALU | BPF_NEG] =		neg_reg,
	[BPF_ALU | BPF_LSH | BPF_K] =	shl_imm,
	[BPF_ALU | BPF_END | BPF_X] =	end_reg32,
	[BPF_LD | BPF_IMM | BPF_DW] =	imm_ld8,
	[BPF_LD | BPF_ABS | BPF_B] =	data_ld1,
	[BPF_LD | BPF_ABS | BPF_H] =	data_ld2,
	[BPF_LD | BPF_ABS | BPF_W] =	data_ld4,
	[BPF_LD | BPF_IND | BPF_B] =	data_ind_ld1,
	[BPF_LD | BPF_IND | BPF_H] =	data_ind_ld2,
	[BPF_LD | BPF_IND | BPF_W] =	data_ind_ld4,
	[BPF_LDX | BPF_MEM | BPF_B] =	mem_ldx1,
	[BPF_LDX | BPF_MEM | BPF_H] =	mem_ldx2,
	[BPF_LDX | BPF_MEM | BPF_W] =	mem_ldx4,
	[BPF_LDX | BPF_MEM | BPF_DW] =	mem_ldx8,
	[BPF_STX | BPF_MEM | BPF_B] =	mem_stx1,
	[BPF_STX | BPF_MEM | BPF_H] =	mem_stx2,
	[BPF_STX | BPF_MEM | BPF_W] =	mem_stx4,
	[BPF_STX | BPF_MEM | BPF_DW] =	mem_stx8,
	[BPF_ST | BPF_MEM | BPF_B] =	mem_st1,
	[BPF_ST | BPF_MEM | BPF_H] =	mem_st2,
	[BPF_ST | BPF_MEM | BPF_W] =	mem_st4,
	[BPF_ST | BPF_MEM | BPF_DW] =	mem_st8,
	[BPF_JMP | BPF_JA | BPF_K] =	jump,
	[BPF_JMP | BPF_JEQ | BPF_K] =	jeq_imm,
	[BPF_JMP | BPF_JGT | BPF_K] =	jgt_imm,
	[BPF_JMP | BPF_JGE | BPF_K] =	jge_imm,
	[BPF_JMP | BPF_JLT | BPF_K] =	jlt_imm,
	[BPF_JMP | BPF_JLE | BPF_K] =	jle_imm,
	[BPF_JMP | BPF_JSET | BPF_K] =	jset_imm,
	[BPF_JMP | BPF_JNE | BPF_K] =	jne_imm,
	[BPF_JMP | BPF_JEQ | BPF_X] =	jeq_reg,
	[BPF_JMP | BPF_JGT | BPF_X] =	jgt_reg,
	[BPF_JMP | BPF_JGE | BPF_X] =	jge_reg,
	[BPF_JMP | BPF_JLT | BPF_X] =	jlt_reg,
	[BPF_JMP | BPF_JLE | BPF_X] =	jle_reg,
	[BPF_JMP | BPF_JSET | BPF_X] =	jset_reg,
	[BPF_JMP | BPF_JNE | BPF_X] =	jne_reg,
	[BPF_JMP | BPF_EXIT] =		goto_out,
};

/* --- Misc code --- */

/* Rewrite the target address fields of the branch instruction word @instr.
 *
 * The part of @offset which fits in the OP_BR_ADDR_LO field is stored there.
 * OP_BR_ADDR_HI is written as 1 when @offset did not fit in the LO field
 * (offset != addr_lo) and as 0 otherwise, i.e. it is treated as a flag here
 * rather than as a multi-bit value.
 */
static void br_set_offset(u64 *instr, u16 offset)
{
	u16 addr_lo, addr_hi;

	/* Shift the LO field mask down to bit 0 to mask the raw offset */
	addr_lo = offset & (OP_BR_ADDR_LO >> __bf_shf(OP_BR_ADDR_LO));
	addr_hi = offset != addr_lo;
	*instr &= ~(OP_BR_ADDR_HI | OP_BR_ADDR_LO);
	*instr |= FIELD_PREP(OP_BR_ADDR_HI, addr_hi);
	*instr |= FIELD_PREP(OP_BR_ADDR_LO, addr_lo);
}

/* --- Assembler logic --- */

/* Resolve the targets of all branches emitted during translation.
 *
 * First pass: for every non-skipped BPF_JMP class instruction, check that
 * the last instruction emitted for it is a branch and, unless that branch is
 * tagged as special, point every branch emitted for the instruction at the
 * offset of the recorded jump destination (meta->jmp_dst->off).
 *
 * Second pass: scan the whole program and point branches tagged
 * OP_BR_GO_OUT / OP_BR_GO_ABORT at tgt_out / tgt_abort, then clear the
 * OP_BR_SPECIAL tag.
 *
 * Returns 0 on success or -ELOOP when a jump does not end in a branch, has
 * no destination recorded, or lands on a skipped instruction.
 */
static int nfp_fixup_branches(struct nfp_prog *nfp_prog)
{
	struct nfp_insn_meta *meta, *jmp_dst;
	u32 idx, br_idx;

	list_for_each_entry(meta, &nfp_prog->insns, l) {
		if (meta->skip)
			continue;
		if (BPF_CLASS(meta->insn.code) != BPF_JMP)
			continue;

		/* Find the offset of the last instruction emitted for this
		 * BPF instruction: one before the start of the next BPF
		 * instruction, or last_bpf_off (set by nfp_translate()) if
		 * this is the final one.
		 */
		if (list_is_last(&meta->l, &nfp_prog->insns))
			idx = nfp_prog->last_bpf_off;
		else
			idx = list_next_entry(meta, l)->off - 1;

		br_idx = nfp_prog_offset_to_index(nfp_prog, idx);

		if (!nfp_is_br(nfp_prog->prog[br_idx])) {
			pr_err("Fixup found block not ending in branch %d %02x %016llx!!\n",
			       br_idx, meta->insn.code, nfp_prog->prog[br_idx]);
			return -ELOOP;
		}
		/* Leave special branches for later */
		if (FIELD_GET(OP_BR_SPECIAL, nfp_prog->prog[br_idx]))
			continue;

		if (!meta->jmp_dst) {
			pr_err("Non-exit jump doesn't have destination info recorded!!\n");
			return -ELOOP;
		}

		jmp_dst = meta->jmp_dst;

		if (jmp_dst->skip) {
			pr_err("Branch landing on removed instruction!!\n");
			return -ELOOP;
		}

		/* One BPF jump may have been translated into more than one
		 * branch (see e.g. jne_imm()), patch all of them.
		 */
		for (idx = nfp_prog_offset_to_index(nfp_prog, meta->off);
		     idx <= br_idx; idx++) {
			if (!nfp_is_br(nfp_prog->prog[idx]))
				continue;
			br_set_offset(&nfp_prog->prog[idx], jmp_dst->off);
		}
	}

	/* Fixup 'goto out's separately, they can be scattered around */
	for (br_idx = 0; br_idx < nfp_prog->prog_len; br_idx++) {
		enum br_special special;

		if ((nfp_prog->prog[br_idx] & OP_BR_BASE_MASK) != OP_BR_BASE)
			continue;

		special = FIELD_GET(OP_BR_SPECIAL, nfp_prog->prog[br_idx]);
		switch (special) {
		case OP_BR_NORMAL:
			break;
		case OP_BR_GO_OUT:
			br_set_offset(&nfp_prog->prog[br_idx],
				      nfp_prog->tgt_out);
			break;
		case OP_BR_GO_ABORT:
			br_set_offset(&nfp_prog->prog[br_idx],
				      nfp_prog->tgt_abort);
			break;
		}

		/* The tag has been consumed, clear it from the final code */
		nfp_prog->prog[br_idx] &= ~OP_BR_SPECIAL;
	}

	return 0;
}

/* Emit the program prologue: load GENMASK(13, 0) into the packet length
 * register and AND it with pv_len(), leaving the masked value in plen_reg().
 */
static void nfp_intro(struct nfp_prog *nfp_prog)
{
	wrp_immed(nfp_prog, plen_reg(nfp_prog), GENMASK(13, 0));
	emit_alu(nfp_prog, plen_reg(nfp_prog),
		 plen_reg(nfp_prog), ALU_OP_AND, pv_len(nfp_prog));
}

/* Emit the epilogue for TC direct-action programs and record the abort and
 * normal exit targets (tgt_abort, tgt_out) used by nfp_fixup_branches().
 * NOTE(review): the last argument of emit_br_def() is presumably the number
 * of defer slots - each call here is followed by exactly two instructions
 * which belong to that exit path - confirm against emit_br_def().
 */
static void nfp_outro_tc_da(struct nfp_prog *nfp_prog)
{
	/* TC direct-action mode:
	 *   0,1   ok        NOT SUPPORTED[1]
	 *   2   drop  0x22 -> drop,  count as stat1
	 *   4,5 nuke  0x02 -> drop
	 *   7  redir  0x44 -> redir, count as stat2
	 *   * unspec  0x11 -> pass,  count as stat0
	 *
	 * [1] We can't support OK and RECLASSIFY because we can't tell TC
	 *     the exact decision made.  We are forced to support UNSPEC
	 *     to handle aborts so that's the only one we handle for passing
	 *     packets up the stack.
	 */
	/* Target for aborts */
	nfp_prog->tgt_abort = nfp_prog_current_offset(nfp_prog);

	emit_br_def(nfp_prog, nfp_prog->tgt_done, 2);

	wrp_mov(nfp_prog, reg_a(0), NFP_BPF_ABI_FLAGS);
	emit_ld_field(nfp_prog, reg_a(0), 0xc, reg_imm(0x11), SHF_SC_L_SHF, 16);

	/* Target for normal exits */
	nfp_prog->tgt_out = nfp_prog_current_offset(nfp_prog);

	/* if R0 > 7 jump to abort */
	emit_alu(nfp_prog, reg_none(), reg_imm(7), ALU_OP_SUB, reg_b(0));
	emit_br(nfp_prog, BR_BLO, nfp_prog->tgt_abort, 0);
	wrp_mov(nfp_prog, reg_a(0), NFP_BPF_ABI_FLAGS);

	/* Two lookup tables with one nibble per return code.
	 * NOTE(review): presumably R0 * 4 (computed into reg_a(1) below) is
	 * used as an indirect shift amount to select the nibble - confirm.
	 */
	wrp_immed(nfp_prog, reg_b(2), 0x41221211);
	wrp_immed(nfp_prog, reg_b(3), 0x41001211);

	emit_shf(nfp_prog, reg_a(1),
		 reg_none(), SHF_OP_NONE, reg_b(0), SHF_SC_L_SHF, 2);

	emit_alu(nfp_prog, reg_none(), reg_a(1), ALU_OP_OR, reg_imm(0));
	emit_shf(nfp_prog, reg_a(2),
		 reg_imm(0xf), SHF_OP_AND, reg_b(2), SHF_SC_R_SHF, 0);

	emit_alu(nfp_prog, reg_none(), reg_a(1), ALU_OP_OR, reg_imm(0));
	emit_shf(nfp_prog, reg_b(2),
		 reg_imm(0xf), SHF_OP_AND, reg_b(3), SHF_SC_R_SHF, 0);

	emit_br_def(nfp_prog, nfp_prog->tgt_done, 2);

	emit_shf(nfp_prog, reg_b(2),
		 reg_a(2), SHF_OP_OR, reg_b(2), SHF_SC_L_SHF, 4);
	emit_ld_field(nfp_prog, reg_a(0), 0xc, reg_b(2), SHF_SC_L_SHF, 16);
}

/* Emit the epilogue for XDP programs and record the abort and normal exit
 * targets (tgt_abort, tgt_out) used by nfp_fixup_branches().
 */
static void nfp_outro_xdp(struct nfp_prog *nfp_prog)
{
	/* XDP return codes:
	 *   0 aborted  0x82 -> drop,  count as stat3
	 *   1    drop  0x22 -> drop,  count as stat1
	 *   2    pass  0x11 -> pass,  count as stat0
	 *   3      tx  0x44 -> redir, count as stat2
	 *   * unknown  0x82 -> drop,  count as stat3
	 */
	/* Target for aborts */
	nfp_prog->tgt_abort = nfp_prog_current_offset(nfp_prog);

	emit_br_def(nfp_prog, nfp_prog->tgt_done, 2);

	wrp_mov(nfp_prog, reg_a(0), NFP_BPF_ABI_FLAGS);
	emit_ld_field(nfp_prog, reg_a(0), 0xc, reg_imm(0x82), SHF_SC_L_SHF, 16);

	/* Target for normal exits */
	nfp_prog->tgt_out = nfp_prog_current_offset(nfp_prog);

	/* if R0 > 3 jump to abort */
	emit_alu(nfp_prog, reg_none(), reg_imm(3), ALU_OP_SUB, reg_b(0));
	emit_br(nfp_prog, BR_BLO, nfp_prog->tgt_abort, 0);

	/* Lookup table with one byte per return code, matching the table in
	 * the comment at the top of this function (code 0 in the low byte).
	 */
	wrp_immed(nfp_prog, reg_b(2), 0x44112282);

	emit_shf(nfp_prog, reg_a(1),
		 reg_none(), SHF_OP_NONE, reg_b(0), SHF_SC_L_SHF, 3);

	emit_alu(nfp_prog, reg_none(), reg_a(1), ALU_OP_OR, reg_imm(0));
	emit_shf(nfp_prog, reg_b(2),
		 reg_imm(0xff), SHF_OP_AND, reg_b(2), SHF_SC_R_SHF, 0);

	emit_br_def(nfp_prog, nfp_prog->tgt_done, 2);

	wrp_mov(nfp_prog, reg_a(0), NFP_BPF_ABI_FLAGS);
	emit_ld_field(nfp_prog, reg_a(0), 0xc, reg_b(2), SHF_SC_L_SHF, 16);
}

/* Emit the epilogue matching the program type.  Only SCHED_CLS and XDP are
 * handled, any other type triggers a WARN_ON() and emits nothing.
 */
static void nfp_outro(struct nfp_prog *nfp_prog)
{
	switch (nfp_prog->type) {
	case BPF_PROG_TYPE_SCHED_CLS:
		nfp_outro_tc_da(nfp_prog);
		break;
	case BPF_PROG_TYPE_XDP:
		nfp_outro_xdp(nfp_prog);
		break;
	default:
		WARN_ON(1);
	}
}

/* Translate the whole BPF program: prologue, one callback per instruction,
 * epilogue, trailing NOPs and finally branch fixup.
 *
 * Returns 0 on success, nfp_prog->error if one of the emit stages recorded
 * an error, -ENOENT if an instruction has no translation callback, or the
 * error returned by a callback or by nfp_fixup_branches().
 */
static int nfp_translate(struct nfp_prog *nfp_prog)
{
	struct nfp_insn_meta *meta;
	int err;

	nfp_intro(nfp_prog);
	if (nfp_prog->error)
		return nfp_prog->error;

	list_for_each_entry(meta, &nfp_prog->insns, l) {
		instr_cb_t cb = instr_cb[meta->insn.code];

		/* Record the offset even for skipped instructions,
		 * nfp_fixup_branches() reads the offset of the next entry.
		 */
		meta->off = nfp_prog_current_offset(nfp_prog);

		if (meta->skip) {
			nfp_prog->n_translated++;
			continue;
		}

		/* A callback registered by the previous instruction in
		 * double_cb takes precedence over the table entry.
		 */
		if (nfp_meta_has_prev(nfp_prog, meta) &&
		    nfp_meta_prev(meta)->double_cb)
			cb = nfp_meta_prev(meta)->double_cb;
		if (!cb)
			return -ENOENT;
		err = cb(nfp_prog, meta);
		if (err)
			return err;

		nfp_prog->n_translated++;
	}

	/* Offset of the last instruction emitted for the BPF program body */
	nfp_prog->last_bpf_off = nfp_prog_current_offset(nfp_prog) - 1;

	nfp_outro(nfp_prog);
	if (nfp_prog->error)
		return nfp_prog->error;

	wrp_nops(nfp_prog, NFP_USTORE_PREFETCH_WINDOW);
	if (nfp_prog->error)
		return nfp_prog->error;

	return nfp_fixup_branches(nfp_prog);
}

/* --- Optimizations --- */

/* Mark the "R6 = R1" moves at the very start of the program as skipped.
 * Leading "Rx ^= Rx" instructions are stepped over without being skipped;
 * the walk stops at the first instruction which is neither of the two
 * (unless that instruction was already marked as skipped).
 */
static void nfp_bpf_opt_reg_init(struct nfp_prog *nfp_prog)
{
	struct nfp_insn_meta *meta;

	list_for_each_entry(meta, &nfp_prog->insns, l) {
		struct bpf_insn insn = meta->insn;

		/* Programs converted from cBPF start with register xoring */
		if (insn.code == (BPF_ALU64 | BPF_XOR | BPF_X) &&
		    insn.src_reg == insn.dst_reg)
			continue;

		/* Programs start with R6 = R1 but we ignore the skb pointer */
		if (insn.code == (BPF_ALU64 | BPF_MOV | BPF_X) &&
		    insn.src_reg == 1 && insn.dst_reg == 6)
			meta->skip = true;

		/* Return as soon as something doesn't match */
		if (!meta->skip)
			return;
	}
}

/* Remove masking after load since our load guarantees this is not needed.
 *
 * Looks for a BPF_LD | BPF_ABS/BPF_IND load directly followed by a 64-bit
 * AND of R0 (src_reg and dst_reg both 0) with the all-ones mask matching
 * the load size, and marks the AND as skipped.  The AND is kept if it is a
 * jump destination, since it can then be reached without the load.
 */
static void nfp_bpf_opt_ld_mask(struct nfp_prog *nfp_prog)
{
	struct nfp_insn_meta *meta1, *meta2;
	/* Indexed by BPF_SIZE(); sizes without an entry read as 0 and are
	 * rejected below.  The table is signed because it is compared
	 * against insn.imm.
	 */
	const s32 exp_mask[] = {
		[BPF_B] = 0x000000ffU,
		[BPF_H] = 0x0000ffffU,
		[BPF_W] = 0xffffffffU,
	};

	nfp_for_each_insn_walk2(nfp_prog, meta1, meta2) {
		struct bpf_insn insn, next;

		insn = meta1->insn;
		next = meta2->insn;

		if (BPF_CLASS(insn.code) != BPF_LD)
			continue;
		if (BPF_MODE(insn.code) != BPF_ABS &&
		    BPF_MODE(insn.code) != BPF_IND)
			continue;

		if (next.code != (BPF_ALU64 | BPF_AND | BPF_K))
			continue;

		if (!exp_mask[BPF_SIZE(insn.code)])
			continue;
		if (exp_mask[BPF_SIZE(insn.code)] != next.imm)
			continue;

		if (next.src_reg || next.dst_reg)
			continue;

		if (meta2->flags & FLAG_INSN_IS_JUMP_DST)
			continue;

		meta2->skip = true;
	}
}

/* Remove a pair of 64-bit shifts by 32 in opposite directions (LSH then RSH,
 * or RSH then LSH) applied to R0 directly after a word-sized
 * BPF_LD | BPF_ABS/BPF_IND load.  Both shifts are marked as skipped, unless
 * either of them is a jump destination.
 */
static void nfp_bpf_opt_ld_shift(struct nfp_prog *nfp_prog)
{
	struct nfp_insn_meta *meta1, *meta2, *meta3;

	nfp_for_each_insn_walk3(nfp_prog, meta1, meta2, meta3) {
		struct bpf_insn insn, next1, next2;

		insn = meta1->insn;
		next1 = meta2->insn;
		next2 = meta3->insn;

		if (BPF_CLASS(insn.code) != BPF_LD)
			continue;
		if (BPF_MODE(insn.code) != BPF_ABS &&
		    BPF_MODE(insn.code) != BPF_IND)
			continue;
		if (BPF_SIZE(insn.code) != BPF_W)
			continue;

		if (!(next1.code == (BPF_LSH | BPF_K | BPF_ALU64) &&
		      next2.code == (BPF_RSH | BPF_K | BPF_ALU64)) &&
		    !(next1.code == (BPF_RSH | BPF_K | BPF_ALU64) &&
		      next2.code == (BPF_LSH | BPF_K | BPF_ALU64)))
			continue;

		if (next1.src_reg || next1.dst_reg ||
		    next2.src_reg || next2.dst_reg)
			continue;

		if (next1.imm != 0x20 || next2.imm != 0x20)
			continue;

		if (meta2->flags & FLAG_INSN_IS_JUMP_DST ||
		    meta3->flags & FLAG_INSN_IS_JUMP_DST)
			continue;

		meta2->skip = true;
		meta3->skip = true;
	}
}

/* load/store pair that forms memory copy should look like the following:
 *
 *   ld_width R, [addr_src + offset_src]
 *   st_width [addr_dest + offset_dest], R
 *
 * The destination register of load and source register of store should
 * be the same, load and store should also perform at the same width.
 * If either of addr_src or addr_dest is stack pointer, we don't do the
 * CPP optimization as stack is modelled by registers on NFP.
 */
static bool
curr_pair_is_memcpy(struct nfp_insn_meta *ld_meta,
		    struct nfp_insn_meta *st_meta)
{
	struct bpf_insn *ld = &ld_meta->insn;
	struct bpf_insn *st = &st_meta->insn;

	if (!is_mbpf_load(ld_meta) || !is_mbpf_store(st_meta))
		return false;

	/* Only packet to packet copies are accepted */
	if (ld_meta->ptr.type != PTR_TO_PACKET)
		return false;

	if (st_meta->ptr.type != PTR_TO_PACKET)
		return false;

	if (BPF_SIZE(ld->code) != BPF_SIZE(st->code))
		return false;

	if (ld->dst_reg != st->src_reg)
		return false;

	/* There is a jump to the store insn in this pair. */
	if (st_meta->flags & FLAG_INSN_IS_JUMP_DST)
		return false;

	return true;
}

/* Currently, we only support chaining load/store pairs if:
 *
 *  - Their address base registers are the same.
 *  - Their address offsets are in the same order.
 *  - They operate at the same memory width.
 *  - There is no jump into the middle of them.
 *
 * @prev_ld / @prev_st are the instructions of the previous pair; a NULL
 * @prev_ld means the current pair starts a new chain and is always accepted.
 */
static bool
curr_pair_chain_with_previous(struct nfp_insn_meta *ld_meta,
			      struct nfp_insn_meta *st_meta,
			      struct bpf_insn *prev_ld,
			      struct bpf_insn *prev_st)
{
	u8 prev_size, curr_size, prev_ld_base, prev_st_base, prev_ld_dst;
	struct bpf_insn *ld = &ld_meta->insn;
	struct bpf_insn *st = &st_meta->insn;
	s16 prev_ld_off, prev_st_off;

	/* This pair is the start pair. */
	if (!prev_ld)
		return true;

	prev_size = BPF_LDST_BYTES(prev_ld);
	curr_size = BPF_LDST_BYTES(ld);
	prev_ld_base = prev_ld->src_reg;
	prev_st_base = prev_st->dst_reg;
	prev_ld_dst = prev_ld->dst_reg;
	prev_ld_off = prev_ld->off;
	prev_st_off = prev_st->off;

	/* The same temporary register must carry the data in both pairs */
	if (ld->dst_reg != prev_ld_dst)
		return false;

	if (ld->src_reg != prev_ld_base || st->dst_reg != prev_st_base)
		return false;

	if (curr_size != prev_size)
		return false;

	/* There is a jump to the head of this pair. */
	if (ld_meta->flags & FLAG_INSN_IS_JUMP_DST)
		return false;

	/* Both in ascending order. */
	if (prev_ld_off + prev_size == ld->off &&
	    prev_st_off + prev_size == st->off)
		return true;

	/* Both in descending order. */
	if (ld->off + curr_size == prev_ld_off &&
	    st->off + curr_size == prev_st_off)
		return true;

	return false;
}

/* Return TRUE if cross memory access happens. Cross memory access means
 * store area is overlapping with load area that a later load might load
 * the value from previous store, for this case we can't treat the sequence
 * as a memory copy.
 *
 * @ld is the load being considered, @head_ld_meta / @head_st_meta describe
 * the first load/store pair of the sequence.
 */
static bool
cross_mem_access(struct bpf_insn *ld, struct nfp_insn_meta *head_ld_meta,
		 struct nfp_insn_meta *head_st_meta)
{
	s16 head_ld_off, head_st_off, ld_off;

	/* Different pointer types do not overlap. */
	if (head_ld_meta->ptr.type != head_st_meta->ptr.type)
		return false;

	/* load and store are both PTR_TO_PACKET, check ID info. */
	if (head_ld_meta->ptr.id != head_st_meta->ptr.id)
		return true;

	/* Canonicalize the offsets. Turn all of them against the original
	 * base register.
	 */
	head_ld_off = head_ld_meta->insn.off + head_ld_meta->ptr.off;
	head_st_off = head_st_meta->insn.off + head_st_meta->ptr.off;
	ld_off = ld->off + head_ld_meta->ptr.off;

	/* Ascending order cross. */
	if (ld_off > head_ld_off &&
	    head_ld_off < head_st_off && ld_off >= head_st_off)
		return true;

	/* Descending order cross. */
	if (ld_off < head_ld_off &&
	    head_ld_off > head_st_off && ld_off <= head_st_off)
		return true;

	return false;
}

/* This pass tries to identify the following instruction sequences.
 *
 *   load R, [regA + offA]
 *   store [regB + offB], R
 *   load R, [regA + offA + const_imm_A]
 *   store [regB + offB + const_imm_A], R
 *   load R, [regA + offA + 2 * const_imm_A]
 *   store [regB + offB + 2 * const_imm_A], R
 *   ...
 *
 * Above sequence is typically generated by compiler when lowering
 * memcpy. NFP prefers using CPP instructions to accelerate it.
25016bc7103cSJiong Wang */ 25026bc7103cSJiong Wang static void nfp_bpf_opt_ldst_gather(struct nfp_prog *nfp_prog) 25036bc7103cSJiong Wang { 25046bc7103cSJiong Wang struct nfp_insn_meta *head_ld_meta = NULL; 25056bc7103cSJiong Wang struct nfp_insn_meta *head_st_meta = NULL; 25066bc7103cSJiong Wang struct nfp_insn_meta *meta1, *meta2; 25076bc7103cSJiong Wang struct bpf_insn *prev_ld = NULL; 25086bc7103cSJiong Wang struct bpf_insn *prev_st = NULL; 25096bc7103cSJiong Wang u8 count = 0; 25106bc7103cSJiong Wang 25116bc7103cSJiong Wang nfp_for_each_insn_walk2(nfp_prog, meta1, meta2) { 25126bc7103cSJiong Wang struct bpf_insn *ld = &meta1->insn; 25136bc7103cSJiong Wang struct bpf_insn *st = &meta2->insn; 25146bc7103cSJiong Wang 25156bc7103cSJiong Wang /* Reset record status if any of the following if true: 25166bc7103cSJiong Wang * - The current insn pair is not load/store. 25176bc7103cSJiong Wang * - The load/store pair doesn't chain with previous one. 25186bc7103cSJiong Wang * - The chained load/store pair crossed with previous pair. 25196bc7103cSJiong Wang * - The chained load/store pair has a total size of memory 25206bc7103cSJiong Wang * copy beyond 128 bytes which is the maximum length a 25216bc7103cSJiong Wang * single NFP CPP command can transfer. 
25226bc7103cSJiong Wang */ 25236bc7103cSJiong Wang if (!curr_pair_is_memcpy(meta1, meta2) || 25246bc7103cSJiong Wang !curr_pair_chain_with_previous(meta1, meta2, prev_ld, 25256bc7103cSJiong Wang prev_st) || 25266bc7103cSJiong Wang (head_ld_meta && (cross_mem_access(ld, head_ld_meta, 25276bc7103cSJiong Wang head_st_meta) || 25286bc7103cSJiong Wang head_ld_meta->ldst_gather_len >= 128))) { 25296bc7103cSJiong Wang if (!count) 25306bc7103cSJiong Wang continue; 25316bc7103cSJiong Wang 25326bc7103cSJiong Wang if (count > 1) { 25336bc7103cSJiong Wang s16 prev_ld_off = prev_ld->off; 25346bc7103cSJiong Wang s16 prev_st_off = prev_st->off; 25356bc7103cSJiong Wang s16 head_ld_off = head_ld_meta->insn.off; 25366bc7103cSJiong Wang 25376bc7103cSJiong Wang if (prev_ld_off < head_ld_off) { 25386bc7103cSJiong Wang head_ld_meta->insn.off = prev_ld_off; 25396bc7103cSJiong Wang head_st_meta->insn.off = prev_st_off; 25406bc7103cSJiong Wang head_ld_meta->ldst_gather_len = 25416bc7103cSJiong Wang -head_ld_meta->ldst_gather_len; 25426bc7103cSJiong Wang } 25436bc7103cSJiong Wang 25446bc7103cSJiong Wang head_ld_meta->paired_st = &head_st_meta->insn; 25456bc7103cSJiong Wang head_st_meta->skip = true; 25466bc7103cSJiong Wang } else { 25476bc7103cSJiong Wang head_ld_meta->ldst_gather_len = 0; 25486bc7103cSJiong Wang } 25496bc7103cSJiong Wang 25506bc7103cSJiong Wang /* If the chain is ended by an load/store pair then this 25516bc7103cSJiong Wang * could serve as the new head of the the next chain. 
25526bc7103cSJiong Wang */ 25536bc7103cSJiong Wang if (curr_pair_is_memcpy(meta1, meta2)) { 25546bc7103cSJiong Wang head_ld_meta = meta1; 25556bc7103cSJiong Wang head_st_meta = meta2; 25566bc7103cSJiong Wang head_ld_meta->ldst_gather_len = 25576bc7103cSJiong Wang BPF_LDST_BYTES(ld); 25586bc7103cSJiong Wang meta1 = nfp_meta_next(meta1); 25596bc7103cSJiong Wang meta2 = nfp_meta_next(meta2); 25606bc7103cSJiong Wang prev_ld = ld; 25616bc7103cSJiong Wang prev_st = st; 25626bc7103cSJiong Wang count = 1; 25636bc7103cSJiong Wang } else { 25646bc7103cSJiong Wang head_ld_meta = NULL; 25656bc7103cSJiong Wang head_st_meta = NULL; 25666bc7103cSJiong Wang prev_ld = NULL; 25676bc7103cSJiong Wang prev_st = NULL; 25686bc7103cSJiong Wang count = 0; 25696bc7103cSJiong Wang } 25706bc7103cSJiong Wang 25716bc7103cSJiong Wang continue; 25726bc7103cSJiong Wang } 25736bc7103cSJiong Wang 25746bc7103cSJiong Wang if (!head_ld_meta) { 25756bc7103cSJiong Wang head_ld_meta = meta1; 25766bc7103cSJiong Wang head_st_meta = meta2; 25776bc7103cSJiong Wang } else { 25786bc7103cSJiong Wang meta1->skip = true; 25796bc7103cSJiong Wang meta2->skip = true; 25806bc7103cSJiong Wang } 25816bc7103cSJiong Wang 25826bc7103cSJiong Wang head_ld_meta->ldst_gather_len += BPF_LDST_BYTES(ld); 25836bc7103cSJiong Wang meta1 = nfp_meta_next(meta1); 25846bc7103cSJiong Wang meta2 = nfp_meta_next(meta2); 25856bc7103cSJiong Wang prev_ld = ld; 25866bc7103cSJiong Wang prev_st = st; 25876bc7103cSJiong Wang count++; 25886bc7103cSJiong Wang } 25896bc7103cSJiong Wang } 25906bc7103cSJiong Wang 2591d9ae7f2bSJakub Kicinski static int nfp_bpf_optimize(struct nfp_prog *nfp_prog) 2592d9ae7f2bSJakub Kicinski { 2593d9ae7f2bSJakub Kicinski nfp_bpf_opt_reg_init(nfp_prog); 2594d9ae7f2bSJakub Kicinski 2595d9ae7f2bSJakub Kicinski nfp_bpf_opt_ld_mask(nfp_prog); 2596d9ae7f2bSJakub Kicinski nfp_bpf_opt_ld_shift(nfp_prog); 25976bc7103cSJiong Wang nfp_bpf_opt_ldst_gather(nfp_prog); 2598d9ae7f2bSJakub Kicinski 2599d9ae7f2bSJakub Kicinski return 0; 
2600d9ae7f2bSJakub Kicinski } 2601d9ae7f2bSJakub Kicinski 26022e85d388SJakub Kicinski static int nfp_bpf_ustore_calc(struct nfp_prog *nfp_prog, __le64 *ustore) 2603fd068ddcSJakub Kicinski { 2604fd068ddcSJakub Kicinski int i; 2605fd068ddcSJakub Kicinski 2606fd068ddcSJakub Kicinski for (i = 0; i < nfp_prog->prog_len; i++) { 2607fd068ddcSJakub Kicinski int err; 2608fd068ddcSJakub Kicinski 2609fd068ddcSJakub Kicinski err = nfp_ustore_check_valid_no_ecc(nfp_prog->prog[i]); 2610fd068ddcSJakub Kicinski if (err) 2611fd068ddcSJakub Kicinski return err; 2612fd068ddcSJakub Kicinski 2613fd068ddcSJakub Kicinski nfp_prog->prog[i] = nfp_ustore_calc_ecc_insn(nfp_prog->prog[i]); 26142e85d388SJakub Kicinski 26152e85d388SJakub Kicinski ustore[i] = cpu_to_le64(nfp_prog->prog[i]); 2616fd068ddcSJakub Kicinski } 2617fd068ddcSJakub Kicinski 2618fd068ddcSJakub Kicinski return 0; 2619fd068ddcSJakub Kicinski } 2620fd068ddcSJakub Kicinski 2621c6c580d7SJakub Kicinski int nfp_bpf_jit(struct nfp_prog *nfp_prog) 2622d9ae7f2bSJakub Kicinski { 2623d9ae7f2bSJakub Kicinski int ret; 2624d9ae7f2bSJakub Kicinski 2625d9ae7f2bSJakub Kicinski ret = nfp_bpf_optimize(nfp_prog); 2626d9ae7f2bSJakub Kicinski if (ret) 26279314c442SJakub Kicinski return ret; 2628d9ae7f2bSJakub Kicinski 2629d9ae7f2bSJakub Kicinski ret = nfp_translate(nfp_prog); 2630d9ae7f2bSJakub Kicinski if (ret) { 2631d9ae7f2bSJakub Kicinski pr_err("Translation failed with error %d (translated: %u)\n", 2632d9ae7f2bSJakub Kicinski ret, nfp_prog->n_translated); 26339314c442SJakub Kicinski return -EINVAL; 2634d9ae7f2bSJakub Kicinski } 2635d9ae7f2bSJakub Kicinski 26369314c442SJakub Kicinski return nfp_bpf_ustore_calc(nfp_prog, (__force __le64 *)nfp_prog->prog); 2637d9ae7f2bSJakub Kicinski } 2638