2012-07-31 16:23:59 +02:00
/*
* BPF Jit compiler for s390 .
*
2015-04-01 16:08:32 +02:00
* Minimum build requirements :
*
* - HAVE_MARCH_Z196_FEATURES : laal , laalg
* - HAVE_MARCH_Z10_FEATURES : msfi , cgrj , clgrj
* - HAVE_MARCH_Z9_109_FEATURES : alfi , llilf , clfi , oilf , nilf
* - PACK_STACK
* - 64 BIT
*
* Copyright IBM Corp . 2012 , 2015
2012-07-31 16:23:59 +02:00
*
* Author ( s ) : Martin Schwidefsky < schwidefsky @ de . ibm . com >
2015-04-01 16:08:32 +02:00
* Michael Holzheu < holzheu @ linux . vnet . ibm . com >
2012-07-31 16:23:59 +02:00
*/
2015-04-01 16:08:32 +02:00
# define KMSG_COMPONENT "bpf_jit"
# define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
2012-07-31 16:23:59 +02:00
# include <linux/netdevice.h>
# include <linux/filter.h>
2013-07-17 14:26:50 +02:00
# include <linux/init.h>
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
# include <linux/bpf.h>
2012-07-31 16:23:59 +02:00
# include <asm/cacheflush.h>
2013-09-13 13:36:25 +02:00
# include <asm/dis.h>
2017-05-08 15:58:08 -07:00
# include <asm/set_memory.h>
2015-04-01 16:08:32 +02:00
# include "bpf_jit.h"
2012-07-31 16:23:59 +02:00
int bpf_jit_enable __read_mostly ;
2015-04-01 16:08:32 +02:00
struct bpf_jit {
u32 seen ; /* Flags to remember seen eBPF instructions */
u32 seen_reg [ 16 ] ; /* Array to remember which registers are used */
u32 * addrs ; /* Array with relative instruction addresses */
u8 * prg_buf ; /* Start of program */
int size ; /* Size of program and literal pool */
int size_prg ; /* Size of program */
int prg ; /* Current position in program */
int lit_start ; /* Start of literal pool */
int lit ; /* Current position in literal pool */
int base_ip ; /* Base address for literal pool */
int ret0_ip ; /* Address of return 0 */
int exit_ip ; /* Address of exit */
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
int tail_call_start ; /* Tail call start offset */
int labels [ 1 ] ; /* Labels for local jumps */
2015-04-01 16:08:32 +02:00
} ;
2016-05-12 18:10:48 +02:00
# define BPF_SIZE_MAX 0xffff /* Max size for program (16 bit branches) */
2015-04-01 16:08:32 +02:00
# define SEEN_SKB 1 /* skb access */
# define SEEN_MEM 2 /* use mem[] for temporary storage */
# define SEEN_RET0 4 /* ret0_ip points to a valid return 0 */
# define SEEN_LITERAL 8 /* code uses literals */
# define SEEN_FUNC 16 /* calls C functions */
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
# define SEEN_TAIL_CALL 32 /* code uses tail calls */
2015-07-29 21:15:18 +02:00
# define SEEN_SKB_CHANGE 64 /* code changes skb data */
2016-05-13 19:08:35 +02:00
# define SEEN_REG_AX 128 /* code uses constant blinding */
2015-04-01 16:08:32 +02:00
# define SEEN_STACK (SEEN_FUNC | SEEN_MEM | SEEN_SKB)
2012-07-31 16:23:59 +02:00
/*
2015-04-01 16:08:32 +02:00
* s390 registers
2012-07-31 16:23:59 +02:00
*/
2016-05-13 19:08:35 +02:00
# define REG_W0 (MAX_BPF_JIT_REG + 0) /* Work register 1 (even) */
# define REG_W1 (MAX_BPF_JIT_REG + 1) /* Work register 2 (odd) */
# define REG_SKB_DATA (MAX_BPF_JIT_REG + 2) /* SKB data register */
# define REG_L (MAX_BPF_JIT_REG + 3) /* Literal pool register */
# define REG_15 (MAX_BPF_JIT_REG + 4) /* Register 15 */
2015-04-01 16:08:32 +02:00
# define REG_0 REG_W0 /* Register 0 */
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
# define REG_1 REG_W1 /* Register 1 */
2015-04-01 16:08:32 +02:00
# define REG_2 BPF_REG_1 /* Register 2 */
# define REG_14 BPF_REG_0 /* Register 14 */
2012-07-31 16:23:59 +02:00
2015-04-01 16:08:32 +02:00
/*
* Mapping of BPF registers to s390 registers
*/
static const int reg2hex [ ] = {
/* Return code */
[ BPF_REG_0 ] = 14 ,
/* Function parameters */
[ BPF_REG_1 ] = 2 ,
[ BPF_REG_2 ] = 3 ,
[ BPF_REG_3 ] = 4 ,
[ BPF_REG_4 ] = 5 ,
[ BPF_REG_5 ] = 6 ,
/* Call saved registers */
[ BPF_REG_6 ] = 7 ,
[ BPF_REG_7 ] = 8 ,
[ BPF_REG_8 ] = 9 ,
[ BPF_REG_9 ] = 10 ,
/* BPF stack pointer */
[ BPF_REG_FP ] = 13 ,
2016-05-13 19:08:35 +02:00
/* Register for blinding (shared with REG_SKB_DATA) */
[ BPF_REG_AX ] = 12 ,
2015-04-01 16:08:32 +02:00
/* SKB data pointer */
[ REG_SKB_DATA ] = 12 ,
/* Work registers for s390x backend */
[ REG_W0 ] = 0 ,
[ REG_W1 ] = 1 ,
[ REG_L ] = 11 ,
[ REG_15 ] = 15 ,
2012-07-31 16:23:59 +02:00
} ;
2015-04-01 16:08:32 +02:00
static inline u32 reg ( u32 dst_reg , u32 src_reg )
{
return reg2hex [ dst_reg ] < < 4 | reg2hex [ src_reg ] ;
}
static inline u32 reg_high ( u32 reg )
{
return reg2hex [ reg ] < < 4 ;
}
static inline void reg_set_seen ( struct bpf_jit * jit , u32 b1 )
{
u32 r1 = reg2hex [ b1 ] ;
if ( ! jit - > seen_reg [ r1 ] & & r1 > = 6 & & r1 < = 15 )
jit - > seen_reg [ r1 ] = 1 ;
}
# define REG_SET_SEEN(b1) \
( { \
reg_set_seen ( jit , b1 ) ; \
} )
# define REG_SEEN(b1) jit->seen_reg[reg2hex[(b1)]]
/*
* EMIT macros for code generation
*/
# define _EMIT2(op) \
( { \
if ( jit - > prg_buf ) \
* ( u16 * ) ( jit - > prg_buf + jit - > prg ) = op ; \
jit - > prg + = 2 ; \
} )
2012-07-31 16:23:59 +02:00
2015-04-01 16:08:32 +02:00
# define EMIT2(op, b1, b2) \
( { \
_EMIT2 ( op | reg ( b1 , b2 ) ) ; \
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define _EMIT4(op) \
( { \
if ( jit - > prg_buf ) \
* ( u32 * ) ( jit - > prg_buf + jit - > prg ) = op ; \
jit - > prg + = 4 ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define EMIT4(op, b1, b2) \
( { \
_EMIT4 ( op | reg ( b1 , b2 ) ) ; \
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define EMIT4_RRF(op, b1, b2, b3) \
( { \
_EMIT4 ( op | reg_high ( b3 ) < < 8 | reg ( b1 , b2 ) ) ; \
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
REG_SET_SEEN ( b3 ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define _EMIT4_DISP(op, disp) \
( { \
unsigned int __disp = ( disp ) & 0xfff ; \
_EMIT4 ( op | __disp ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define EMIT4_DISP(op, b1, b2, disp) \
( { \
_EMIT4_DISP ( op | reg_high ( b1 ) < < 16 | \
reg_high ( b2 ) < < 8 , disp ) ; \
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define EMIT4_IMM(op, b1, imm) \
( { \
unsigned int __imm = ( imm ) & 0xffff ; \
_EMIT4 ( op | reg_high ( b1 ) < < 16 | __imm ) ; \
REG_SET_SEEN ( b1 ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define EMIT4_PCREL(op, pcrel) \
( { \
long __pcrel = ( ( pcrel ) > > 1 ) & 0xffff ; \
_EMIT4 ( op | __pcrel ) ; \
2012-08-28 15:36:14 +02:00
} )
2015-04-01 16:08:32 +02:00
# define _EMIT6(op1, op2) \
( { \
if ( jit - > prg_buf ) { \
* ( u32 * ) ( jit - > prg_buf + jit - > prg ) = op1 ; \
* ( u16 * ) ( jit - > prg_buf + jit - > prg + 4 ) = op2 ; \
} \
jit - > prg + = 6 ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define _EMIT6_DISP(op1, op2, disp) \
( { \
unsigned int __disp = ( disp ) & 0xfff ; \
_EMIT6 ( op1 | __disp , op2 ) ; \
2012-07-31 16:23:59 +02:00
} )
2015-04-01 16:08:32 +02:00
# define _EMIT6_DISP_LH(op1, op2, disp) \
( { \
2015-07-29 21:15:15 +02:00
u32 _disp = ( u32 ) disp ; \
unsigned int __disp_h = _disp & 0xff000 ; \
unsigned int __disp_l = _disp & 0x00fff ; \
2015-04-01 16:08:32 +02:00
_EMIT6 ( op1 | __disp_l , op2 | __disp_h > > 4 ) ; \
} )
# define EMIT6_DISP_LH(op1, op2, b1, b2, b3, disp) \
( { \
_EMIT6_DISP_LH ( op1 | reg ( b1 , b2 ) < < 16 | \
reg_high ( b3 ) < < 8 , op2 , disp ) ; \
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
REG_SET_SEEN ( b3 ) ; \
} )
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
# define EMIT6_PCREL_LABEL(op1, op2, b1, b2, label, mask) \
( { \
int rel = ( jit - > labels [ label ] - jit - > prg ) > > 1 ; \
_EMIT6 ( op1 | reg ( b1 , b2 ) < < 16 | ( rel & 0xffff ) , \
op2 | mask < < 12 ) ; \
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
} )
# define EMIT6_PCREL_IMM_LABEL(op1, op2, b1, imm, label, mask) \
( { \
int rel = ( jit - > labels [ label ] - jit - > prg ) > > 1 ; \
_EMIT6 ( op1 | ( reg_high ( b1 ) | mask ) < < 16 | \
( rel & 0xffff ) , op2 | ( imm & 0xff ) < < 8 ) ; \
REG_SET_SEEN ( b1 ) ; \
BUILD_BUG_ON ( ( ( unsigned long ) imm ) > 0xff ) ; \
} )
2015-04-01 16:08:32 +02:00
# define EMIT6_PCREL(op1, op2, b1, b2, i, off, mask) \
( { \
/* Branch instruction needs 6 bytes */ \
int rel = ( addrs [ i + off + 1 ] - ( addrs [ i + 1 ] - 6 ) ) / 2 ; \
2015-05-21 15:39:31 +02:00
_EMIT6 ( op1 | reg ( b1 , b2 ) < < 16 | ( rel & 0xffff ) , op2 | mask ) ; \
2015-04-01 16:08:32 +02:00
REG_SET_SEEN ( b1 ) ; \
REG_SET_SEEN ( b2 ) ; \
} )
# define _EMIT6_IMM(op, imm) \
( { \
unsigned int __imm = ( imm ) ; \
_EMIT6 ( op | ( __imm > > 16 ) , __imm & 0xffff ) ; \
} )
# define EMIT6_IMM(op, b1, imm) \
( { \
_EMIT6_IMM ( op | reg_high ( b1 ) < < 16 , imm ) ; \
REG_SET_SEEN ( b1 ) ; \
} )
# define EMIT_CONST_U32(val) \
( { \
unsigned int ret ; \
ret = jit - > lit - jit - > base_ip ; \
jit - > seen | = SEEN_LITERAL ; \
if ( jit - > prg_buf ) \
* ( u32 * ) ( jit - > prg_buf + jit - > lit ) = ( u32 ) val ; \
jit - > lit + = 4 ; \
ret ; \
} )
# define EMIT_CONST_U64(val) \
( { \
unsigned int ret ; \
ret = jit - > lit - jit - > base_ip ; \
jit - > seen | = SEEN_LITERAL ; \
if ( jit - > prg_buf ) \
* ( u64 * ) ( jit - > prg_buf + jit - > lit ) = ( u64 ) val ; \
jit - > lit + = 8 ; \
ret ; \
} )
# define EMIT_ZERO(b1) \
( { \
/* llgfr %dst,%dst (zero extend to 64 bit) */ \
EMIT4 ( 0xb9160000 , b1 , b1 ) ; \
REG_SET_SEEN ( b1 ) ; \
} )
/*
* Fill whole space with illegal instructions
*/
static void jit_fill_hole ( void * area , unsigned int size )
2014-09-08 08:04:47 +02:00
{
memset ( area , 0 , size ) ;
}
2015-04-01 16:08:32 +02:00
/*
* Save registers from " rs " ( register start ) to " re " ( register end ) on stack
*/
static void save_regs ( struct bpf_jit * jit , u32 rs , u32 re )
{
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
u32 off = STK_OFF_R6 + ( rs - 6 ) * 8 ;
2015-04-01 16:08:32 +02:00
if ( rs = = re )
/* stg %rs,off(%r15) */
_EMIT6 ( 0xe300f000 | rs < < 20 | off , 0x0024 ) ;
else
/* stmg %rs,%re,off(%r15) */
_EMIT6_DISP ( 0xeb00f000 | rs < < 20 | re < < 16 , 0x0024 , off ) ;
}
/*
* Restore registers from " rs " ( register start ) to " re " ( register end ) on stack
*/
static void restore_regs ( struct bpf_jit * jit , u32 rs , u32 re )
2012-07-31 16:23:59 +02:00
{
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
u32 off = STK_OFF_R6 + ( rs - 6 ) * 8 ;
2015-04-01 16:08:32 +02:00
if ( jit - > seen & SEEN_STACK )
off + = STK_OFF ;
if ( rs = = re )
/* lg %rs,off(%r15) */
_EMIT6 ( 0xe300f000 | rs < < 20 | off , 0x0004 ) ;
else
/* lmg %rs,%re,off(%r15) */
_EMIT6_DISP ( 0xeb00f000 | rs < < 20 | re < < 16 , 0x0004 , off ) ;
}
2012-07-31 16:23:59 +02:00
2015-04-01 16:08:32 +02:00
/*
* Return first seen register ( from start )
*/
static int get_start ( struct bpf_jit * jit , int start )
{
int i ;
for ( i = start ; i < = 15 ; i + + ) {
if ( jit - > seen_reg [ i ] )
return i ;
}
return 0 ;
}
/*
* Return last seen register ( from start ) ( gap > = 2 )
*/
static int get_end ( struct bpf_jit * jit , int start )
{
int i ;
for ( i = start ; i < 15 ; i + + ) {
if ( ! jit - > seen_reg [ i ] & & ! jit - > seen_reg [ i + 1 ] )
return i - 1 ;
}
return jit - > seen_reg [ 15 ] ? 15 : 14 ;
}
# define REGS_SAVE 1
# define REGS_RESTORE 0
/*
* Save and restore clobbered registers ( 6 - 15 ) on stack .
* We save / restore registers in chunks with gap > = 2 registers .
*/
static void save_restore_regs ( struct bpf_jit * jit , int op )
{
int re = 6 , rs ;
do {
rs = get_start ( jit , re ) ;
if ( ! rs )
break ;
re = get_end ( jit , rs + 1 ) ;
if ( op = = REGS_SAVE )
save_regs ( jit , rs , re ) ;
else
restore_regs ( jit , rs , re ) ;
re + + ;
} while ( re < = 15 ) ;
}
2015-07-29 21:15:18 +02:00
/*
* For SKB access % b1 contains the SKB pointer . For " bpf_jit.S "
* we store the SKB header length on the stack and the SKB data
2016-05-13 19:08:35 +02:00
* pointer in REG_SKB_DATA if BPF_REG_AX is not used .
2015-07-29 21:15:18 +02:00
*/
static void emit_load_skb_data_hlen ( struct bpf_jit * jit )
{
/* Header length: llgf %w1,<len>(%b1) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0016 , REG_W1 , REG_0 , BPF_REG_1 ,
offsetof ( struct sk_buff , len ) ) ;
/* s %w1,<data_len>(%b1) */
EMIT4_DISP ( 0x5b000000 , REG_W1 , BPF_REG_1 ,
offsetof ( struct sk_buff , data_len ) ) ;
/* stg %w1,ST_OFF_HLEN(%r0,%r15) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0024 , REG_W1 , REG_0 , REG_15 , STK_OFF_HLEN ) ;
2016-05-13 19:08:35 +02:00
if ( ! ( jit - > seen & SEEN_REG_AX ) )
/* lg %skb_data,data_off(%b1) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , REG_SKB_DATA , REG_0 ,
BPF_REG_1 , offsetof ( struct sk_buff , data ) ) ;
2015-07-29 21:15:18 +02:00
}
2015-04-01 16:08:32 +02:00
/*
* Emit function prologue
*
* Save registers and create stack frame if necessary .
* See stack frame layout desription in " bpf_jit.h " !
*/
bpf: move clearing of A/X into classic to eBPF migration prologue
Back in the days where eBPF (or back then "internal BPF" ;->) was not
exposed to user space, and only the classic BPF programs internally
translated into eBPF programs, we missed the fact that for classic BPF
A and X needed to be cleared. It was fixed back then via 83d5b7ef99c9
("net: filter: initialize A and X registers"), and thus classic BPF
specifics were added to the eBPF interpreter core to work around it.
This added some confusion for JIT developers later on that take the
eBPF interpreter code as an example for deriving their JIT. F.e. in
f75298f5c3fe ("s390/bpf: clear correct BPF accumulator register"), at
least X could leak stack memory. Furthermore, since this is only needed
for classic BPF translations and not for eBPF (verifier takes care
that read access to regs cannot be done uninitialized), more complexity
is added to JITs as they need to determine whether they deal with
migrations or native eBPF where they can just omit clearing A/X in
their prologue and thus reduce image size a bit, see f.e. cde66c2d88da
("s390/bpf: Only clear A and X for converted BPF programs"). In other
cases (x86, arm64), A and X is being cleared in the prologue also for
eBPF case, which is unnecessary.
Lets move this into the BPF migration in bpf_convert_filter() where it
actually belongs as long as the number of eBPF JITs are still few. It
can thus be done generically; allowing us to remove the quirk from
__bpf_prog_run() and to slightly reduce JIT image size in case of eBPF,
while reducing code duplication on this matter in current(/future) eBPF
JITs.
Signed-off-by: Daniel Borkmann <daniel@iogearbox.net>
Acked-by: Alexei Starovoitov <ast@kernel.org>
Reviewed-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Tested-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Cc: Zi Shen Lim <zlim.lnx@gmail.com>
Cc: Yang Shi <yang.shi@linaro.org>
Acked-by: Yang Shi <yang.shi@linaro.org>
Acked-by: Zi Shen Lim <zlim.lnx@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-12-17 23:51:54 +01:00
static void bpf_jit_prologue ( struct bpf_jit * jit )
2015-04-01 16:08:32 +02:00
{
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
if ( jit - > seen & SEEN_TAIL_CALL ) {
/* xc STK_OFF_TCCNT(4,%r15),STK_OFF_TCCNT(%r15) */
_EMIT6 ( 0xd703f000 | STK_OFF_TCCNT , 0xf000 | STK_OFF_TCCNT ) ;
} else {
/* j tail_call_start: NOP if no tail calls are used */
EMIT4_PCREL ( 0xa7f40000 , 6 ) ;
_EMIT2 ( 0 ) ;
}
/* Tail calls have to skip above initialization */
jit - > tail_call_start = jit - > prg ;
2015-04-01 16:08:32 +02:00
/* Save registers */
save_restore_regs ( jit , REGS_SAVE ) ;
2012-07-31 16:23:59 +02:00
/* Setup literal pool */
if ( jit - > seen & SEEN_LITERAL ) {
/* basr %r13,0 */
2015-04-01 16:08:32 +02:00
EMIT2 ( 0x0d00 , REG_L , REG_0 ) ;
2012-07-31 16:23:59 +02:00
jit - > base_ip = jit - > prg ;
}
2015-04-01 16:08:32 +02:00
/* Setup stack and backchain */
if ( jit - > seen & SEEN_STACK ) {
2015-06-01 22:48:35 -07:00
if ( jit - > seen & SEEN_FUNC )
/* lgr %w1,%r15 (backchain) */
EMIT4 ( 0xb9040000 , REG_W1 , REG_15 ) ;
/* la %bfp,STK_160_UNUSED(%r15) (BPF frame pointer) */
EMIT4_DISP ( 0x41000000 , BPF_REG_FP , REG_15 , STK_160_UNUSED ) ;
2015-04-01 16:08:32 +02:00
/* aghi %r15,-STK_OFF */
EMIT4_IMM ( 0xa70b0000 , REG_15 , - STK_OFF ) ;
if ( jit - > seen & SEEN_FUNC )
2015-06-01 22:48:35 -07:00
/* stg %w1,152(%r15) (backchain) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0024 , REG_W1 , REG_0 ,
2015-04-01 16:08:32 +02:00
REG_15 , 152 ) ;
}
2015-07-29 21:15:18 +02:00
if ( jit - > seen & SEEN_SKB )
emit_load_skb_data_hlen ( jit ) ;
if ( jit - > seen & SEEN_SKB_CHANGE )
/* stg %b1,ST_OFF_SKBP(%r0,%r15) */
2016-05-11 21:13:13 +02:00
EMIT6_DISP_LH ( 0xe3000000 , 0x0024 , BPF_REG_1 , REG_0 , REG_15 ,
2015-07-29 21:15:18 +02:00
STK_OFF_SKBP ) ;
2012-07-31 16:23:59 +02:00
}
2015-04-01 16:08:32 +02:00
/*
* Function epilogue
*/
2012-07-31 16:23:59 +02:00
static void bpf_jit_epilogue ( struct bpf_jit * jit )
{
/* Return 0 */
if ( jit - > seen & SEEN_RET0 ) {
jit - > ret0_ip = jit - > prg ;
2015-04-01 16:08:32 +02:00
/* lghi %b0,0 */
EMIT4_IMM ( 0xa7090000 , BPF_REG_0 , 0 ) ;
2012-07-31 16:23:59 +02:00
}
jit - > exit_ip = jit - > prg ;
2015-04-01 16:08:32 +02:00
/* Load exit code: lgr %r2,%b0 */
EMIT4 ( 0xb9040000 , REG_2 , BPF_REG_0 ) ;
2012-07-31 16:23:59 +02:00
/* Restore registers */
2015-04-01 16:08:32 +02:00
save_restore_regs ( jit , REGS_RESTORE ) ;
2012-07-31 16:23:59 +02:00
/* br %r14 */
2015-04-01 16:08:32 +02:00
_EMIT2 ( 0x07fe ) ;
2012-07-31 16:23:59 +02:00
}
/*
2015-04-01 16:08:32 +02:00
* Compile one eBPF instruction into s390x code
s390/bpf: Fix gcov stack space problem
When compiling the kernel for GCOV (CONFIG_GCOV_KERNEL,-fprofile-arcs),
gcc allocates a lot of stack space because of the large switch statement
in bpf_jit_insn().
This leads to the following compile warning:
arch/s390/net/bpf_jit_comp.c: In function 'bpf_jit_prog':
arch/s390/net/bpf_jit_comp.c:1144:1: warning: frame size of
function 'bpf_jit_prog' is 12592 bytes which is more than
half the stack size. The dynamic check would not be reliable.
No check emitted for this function.
arch/s390/net/bpf_jit_comp.c:1144:1: warning: the frame size of 12504
bytes is larger than 1024 bytes [-Wframe-larger-than=]
And indead gcc allocates 12592 bytes of stack space:
# objdump -d arch/s390/net/bpf_jit_comp.o
...
0000000000000c60 <bpf_jit_prog>:
c60: eb 6f f0 48 00 24 stmg %r6,%r15,72(%r15)
c66: b9 04 00 ef lgr %r14,%r15
c6a: e3 f0 fe d0 fc 71 lay %r15,-12592(%r15)
As a workaround of that problem we now define bpf_jit_insn() as
noinline which then reduces the stack space.
# objdump -d arch/s390/net/bpf_jit_comp.o
...
0000000000000070 <bpf_jit_insn>:
70: eb 6f f0 48 00 24 stmg %r6,%r15,72(%r15)
76: c0 d0 00 00 00 00 larl %r13,76 <bpf_jit_insn+0x6>
7c: a7 f1 3f 80 tmll %r15,16256
80: b9 04 00 ef lgr %r14,%r15
84: e3 f0 ff a0 ff 71 lay %r15,-96(%r15)
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2015-04-29 18:45:03 +02:00
*
* NOTE : Use noinline because for gcov ( - fprofile - arcs ) gcc allocates a lot of
* stack space for the large switch statement .
2012-07-31 16:23:59 +02:00
*/
s390/bpf: Fix gcov stack space problem
When compiling the kernel for GCOV (CONFIG_GCOV_KERNEL,-fprofile-arcs),
gcc allocates a lot of stack space because of the large switch statement
in bpf_jit_insn().
This leads to the following compile warning:
arch/s390/net/bpf_jit_comp.c: In function 'bpf_jit_prog':
arch/s390/net/bpf_jit_comp.c:1144:1: warning: frame size of
function 'bpf_jit_prog' is 12592 bytes which is more than
half the stack size. The dynamic check would not be reliable.
No check emitted for this function.
arch/s390/net/bpf_jit_comp.c:1144:1: warning: the frame size of 12504
bytes is larger than 1024 bytes [-Wframe-larger-than=]
And indead gcc allocates 12592 bytes of stack space:
# objdump -d arch/s390/net/bpf_jit_comp.o
...
0000000000000c60 <bpf_jit_prog>:
c60: eb 6f f0 48 00 24 stmg %r6,%r15,72(%r15)
c66: b9 04 00 ef lgr %r14,%r15
c6a: e3 f0 fe d0 fc 71 lay %r15,-12592(%r15)
As a workaround of that problem we now define bpf_jit_insn() as
noinline which then reduces the stack space.
# objdump -d arch/s390/net/bpf_jit_comp.o
...
0000000000000070 <bpf_jit_insn>:
70: eb 6f f0 48 00 24 stmg %r6,%r15,72(%r15)
76: c0 d0 00 00 00 00 larl %r13,76 <bpf_jit_insn+0x6>
7c: a7 f1 3f 80 tmll %r15,16256
80: b9 04 00 ef lgr %r14,%r15
84: e3 f0 ff a0 ff 71 lay %r15,-96(%r15)
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
2015-04-29 18:45:03 +02:00
static noinline int bpf_jit_insn ( struct bpf_jit * jit , struct bpf_prog * fp , int i )
2012-07-31 16:23:59 +02:00
{
2015-04-01 16:08:32 +02:00
struct bpf_insn * insn = & fp - > insnsi [ i ] ;
int jmp_off , last , insn_count = 1 ;
unsigned int func_addr , mask ;
u32 dst_reg = insn - > dst_reg ;
u32 src_reg = insn - > src_reg ;
u32 * addrs = jit - > addrs ;
s32 imm = insn - > imm ;
s16 off = insn - > off ;
2012-07-31 16:23:59 +02:00
2016-05-13 19:08:35 +02:00
if ( dst_reg = = BPF_REG_AX | | src_reg = = BPF_REG_AX )
jit - > seen | = SEEN_REG_AX ;
2015-04-01 16:08:32 +02:00
switch ( insn - > code ) {
/*
* BPF_MOV
*/
case BPF_ALU | BPF_MOV | BPF_X : /* dst = (u32) src */
/* llgfr %dst,%src */
EMIT4 ( 0xb9160000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU64 | BPF_MOV | BPF_X : /* dst = src */
/* lgr %dst,%src */
EMIT4 ( 0xb9040000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU | BPF_MOV | BPF_K : /* dst = (u32) imm */
/* llilf %dst,imm */
EMIT6_IMM ( 0xc00f0000 , dst_reg , imm ) ;
break ;
case BPF_ALU64 | BPF_MOV | BPF_K : /* dst = imm */
/* lgfi %dst,imm */
EMIT6_IMM ( 0xc0010000 , dst_reg , imm ) ;
break ;
/*
* BPF_LD 64
*/
case BPF_LD | BPF_IMM | BPF_DW : /* dst = (u64) imm */
{
/* 16 byte instruction that uses two 'struct bpf_insn' */
u64 imm64 ;
imm64 = ( u64 ) ( u32 ) insn [ 0 ] . imm | ( ( u64 ) ( u32 ) insn [ 1 ] . imm ) < < 32 ;
/* lg %dst,<d(imm)>(%l) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , dst_reg , REG_0 , REG_L ,
EMIT_CONST_U64 ( imm64 ) ) ;
insn_count = 2 ;
break ;
}
/*
* BPF_ADD
*/
case BPF_ALU | BPF_ADD | BPF_X : /* dst = (u32) dst + (u32) src */
/* ar %dst,%src */
EMIT2 ( 0x1a00 , dst_reg , src_reg ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_ADD | BPF_X : /* dst = dst + src */
/* agr %dst,%src */
EMIT4 ( 0xb9080000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU | BPF_ADD | BPF_K : /* dst = (u32) dst + (u32) imm */
if ( ! imm )
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
/* alfi %dst,imm */
EMIT6_IMM ( 0xc20b0000 , dst_reg , imm ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_ADD | BPF_K : /* dst = dst + imm */
if ( ! imm )
break ;
/* agfi %dst,imm */
EMIT6_IMM ( 0xc2080000 , dst_reg , imm ) ;
break ;
/*
* BPF_SUB
*/
case BPF_ALU | BPF_SUB | BPF_X : /* dst = (u32) dst - (u32) src */
/* sr %dst,%src */
EMIT2 ( 0x1b00 , dst_reg , src_reg ) ;
EMIT_ZERO ( dst_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU64 | BPF_SUB | BPF_X : /* dst = dst - src */
/* sgr %dst,%src */
EMIT4 ( 0xb9090000 , dst_reg , src_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU | BPF_SUB | BPF_K : /* dst = (u32) dst - (u32) imm */
if ( ! imm )
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
/* alfi %dst,-imm */
EMIT6_IMM ( 0xc20b0000 , dst_reg , - imm ) ;
EMIT_ZERO ( dst_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU64 | BPF_SUB | BPF_K : /* dst = dst - imm */
if ( ! imm )
break ;
/* agfi %dst,-imm */
EMIT6_IMM ( 0xc2080000 , dst_reg , - imm ) ;
break ;
/*
* BPF_MUL
*/
case BPF_ALU | BPF_MUL | BPF_X : /* dst = (u32) dst * (u32) src */
/* msr %dst,%src */
EMIT4 ( 0xb2520000 , dst_reg , src_reg ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_MUL | BPF_X : /* dst = dst * src */
/* msgr %dst,%src */
EMIT4 ( 0xb90c0000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU | BPF_MUL | BPF_K : /* dst = (u32) dst * (u32) imm */
if ( imm = = 1 )
break ;
/* msfi %r5,imm */
EMIT6_IMM ( 0xc2010000 , dst_reg , imm ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_MUL | BPF_K : /* dst = dst * imm */
if ( imm = = 1 )
2014-01-15 06:50:07 -08:00
break ;
2015-04-01 16:08:32 +02:00
/* msgfi %dst,imm */
EMIT6_IMM ( 0xc2000000 , dst_reg , imm ) ;
break ;
/*
* BPF_DIV / BPF_MOD
*/
case BPF_ALU | BPF_DIV | BPF_X : /* dst = (u32) dst / (u32) src */
case BPF_ALU | BPF_MOD | BPF_X : /* dst = (u32) dst % (u32) src */
{
int rc_reg = BPF_OP ( insn - > code ) = = BPF_DIV ? REG_W1 : REG_W0 ;
jit - > seen | = SEEN_RET0 ;
/* ltr %src,%src (if src == 0 goto fail) */
EMIT2 ( 0x1200 , src_reg , src_reg ) ;
/* jz <ret0> */
EMIT4_PCREL ( 0xa7840000 , jit - > ret0_ip - jit - > prg ) ;
/* lhi %w0,0 */
EMIT4_IMM ( 0xa7080000 , REG_W0 , 0 ) ;
/* lr %w1,%dst */
EMIT2 ( 0x1800 , REG_W1 , dst_reg ) ;
/* dlr %w0,%src */
EMIT4 ( 0xb9970000 , REG_W0 , src_reg ) ;
/* llgfr %dst,%rc */
EMIT4 ( 0xb9160000 , dst_reg , rc_reg ) ;
break ;
}
2015-04-27 11:12:25 +02:00
case BPF_ALU64 | BPF_DIV | BPF_X : /* dst = dst / src */
case BPF_ALU64 | BPF_MOD | BPF_X : /* dst = dst % src */
2015-04-01 16:08:32 +02:00
{
int rc_reg = BPF_OP ( insn - > code ) = = BPF_DIV ? REG_W1 : REG_W0 ;
jit - > seen | = SEEN_RET0 ;
/* ltgr %src,%src (if src == 0 goto fail) */
EMIT4 ( 0xb9020000 , src_reg , src_reg ) ;
2012-12-01 12:29:08 +01:00
/* jz <ret0> */
2015-04-01 16:08:32 +02:00
EMIT4_PCREL ( 0xa7840000 , jit - > ret0_ip - jit - > prg ) ;
/* lghi %w0,0 */
EMIT4_IMM ( 0xa7090000 , REG_W0 , 0 ) ;
/* lgr %w1,%dst */
EMIT4 ( 0xb9040000 , REG_W1 , dst_reg ) ;
/* dlgr %w0,%dst */
2015-04-27 11:12:25 +02:00
EMIT4 ( 0xb9870000 , REG_W0 , src_reg ) ;
2015-04-01 16:08:32 +02:00
/* lgr %dst,%rc */
EMIT4 ( 0xb9040000 , dst_reg , rc_reg ) ;
break ;
}
case BPF_ALU | BPF_DIV | BPF_K : /* dst = (u32) dst / (u32) imm */
case BPF_ALU | BPF_MOD | BPF_K : /* dst = (u32) dst % (u32) imm */
{
int rc_reg = BPF_OP ( insn - > code ) = = BPF_DIV ? REG_W1 : REG_W0 ;
if ( imm = = 1 ) {
if ( BPF_OP ( insn - > code ) = = BPF_MOD )
/* lhgi %dst,0 */
EMIT4_IMM ( 0xa7090000 , dst_reg , 0 ) ;
2014-01-15 06:50:07 -08:00
break ;
}
2015-04-01 16:08:32 +02:00
/* lhi %w0,0 */
EMIT4_IMM ( 0xa7080000 , REG_W0 , 0 ) ;
/* lr %w1,%dst */
EMIT2 ( 0x1800 , REG_W1 , dst_reg ) ;
/* dl %w0,<d(imm)>(%l) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0097 , REG_W0 , REG_0 , REG_L ,
EMIT_CONST_U32 ( imm ) ) ;
/* llgfr %dst,%rc */
EMIT4 ( 0xb9160000 , dst_reg , rc_reg ) ;
break ;
}
2015-04-27 11:12:25 +02:00
case BPF_ALU64 | BPF_DIV | BPF_K : /* dst = dst / imm */
case BPF_ALU64 | BPF_MOD | BPF_K : /* dst = dst % imm */
2015-04-01 16:08:32 +02:00
{
int rc_reg = BPF_OP ( insn - > code ) = = BPF_DIV ? REG_W1 : REG_W0 ;
if ( imm = = 1 ) {
if ( BPF_OP ( insn - > code ) = = BPF_MOD )
/* lhgi %dst,0 */
EMIT4_IMM ( 0xa7090000 , dst_reg , 0 ) ;
break ;
}
/* lghi %w0,0 */
EMIT4_IMM ( 0xa7090000 , REG_W0 , 0 ) ;
/* lgr %w1,%dst */
EMIT4 ( 0xb9040000 , REG_W1 , dst_reg ) ;
/* dlg %w0,<d(imm)>(%l) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0087 , REG_W0 , REG_0 , REG_L ,
2015-04-27 11:12:25 +02:00
EMIT_CONST_U64 ( imm ) ) ;
2015-04-01 16:08:32 +02:00
/* lgr %dst,%rc */
EMIT4 ( 0xb9040000 , dst_reg , rc_reg ) ;
break ;
}
/*
* BPF_AND
*/
case BPF_ALU | BPF_AND | BPF_X : /* dst = (u32) dst & (u32) src */
/* nr %dst,%src */
EMIT2 ( 0x1400 , dst_reg , src_reg ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_AND | BPF_X : /* dst = dst & src */
/* ngr %dst,%src */
EMIT4 ( 0xb9800000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU | BPF_AND | BPF_K : /* dst = (u32) dst & (u32) imm */
/* nilf %dst,imm */
EMIT6_IMM ( 0xc00b0000 , dst_reg , imm ) ;
EMIT_ZERO ( dst_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU64 | BPF_AND | BPF_K : /* dst = dst & imm */
/* ng %dst,<d(imm)>(%l) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0080 , dst_reg , REG_0 , REG_L ,
EMIT_CONST_U64 ( imm ) ) ;
2012-09-24 08:31:35 +02:00
break ;
2015-04-01 16:08:32 +02:00
/*
* BPF_OR
*/
case BPF_ALU | BPF_OR | BPF_X : /* dst = (u32) dst | (u32) src */
/* or %dst,%src */
EMIT2 ( 0x1600 , dst_reg , src_reg ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_OR | BPF_X : /* dst = dst | src */
/* ogr %dst,%src */
EMIT4 ( 0xb9810000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU | BPF_OR | BPF_K : /* dst = (u32) dst | (u32) imm */
/* oilf %dst,imm */
EMIT6_IMM ( 0xc00d0000 , dst_reg , imm ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_OR | BPF_K : /* dst = dst | imm */
/* og %dst,<d(imm)>(%l) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0081 , dst_reg , REG_0 , REG_L ,
EMIT_CONST_U64 ( imm ) ) ;
break ;
/*
* BPF_XOR
*/
case BPF_ALU | BPF_XOR | BPF_X : /* dst = (u32) dst ^ (u32) src */
/* xr %dst,%src */
EMIT2 ( 0x1700 , dst_reg , src_reg ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_XOR | BPF_X : /* dst = dst ^ src */
/* xgr %dst,%src */
EMIT4 ( 0xb9820000 , dst_reg , src_reg ) ;
break ;
case BPF_ALU | BPF_XOR | BPF_K : /* dst = (u32) dst ^ (u32) imm */
if ( ! imm )
2012-12-01 12:42:32 +01:00
break ;
2015-04-01 16:08:32 +02:00
/* xilf %dst,imm */
EMIT6_IMM ( 0xc0070000 , dst_reg , imm ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_XOR | BPF_K : /* dst = dst ^ imm */
/* xg %dst,<d(imm)>(%l) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0082 , dst_reg , REG_0 , REG_L ,
EMIT_CONST_U64 ( imm ) ) ;
break ;
/*
* BPF_LSH
*/
case BPF_ALU | BPF_LSH | BPF_X : /* dst = (u32) dst << (u32) src */
/* sll %dst,0(%src) */
EMIT4_DISP ( 0x89000000 , dst_reg , src_reg , 0 ) ;
EMIT_ZERO ( dst_reg ) ;
2012-12-01 12:42:32 +01:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU64 | BPF_LSH | BPF_X : /* dst = dst << src */
/* sllg %dst,%dst,0(%src) */
EMIT6_DISP_LH ( 0xeb000000 , 0x000d , dst_reg , dst_reg , src_reg , 0 ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU | BPF_LSH | BPF_K : /* dst = (u32) dst << (u32) imm */
if ( imm = = 0 )
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
/* sll %dst,imm(%r0) */
EMIT4_DISP ( 0x89000000 , dst_reg , REG_0 , imm ) ;
EMIT_ZERO ( dst_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU64 | BPF_LSH | BPF_K : /* dst = dst << imm */
if ( imm = = 0 )
break ;
/* sllg %dst,%dst,imm(%r0) */
EMIT6_DISP_LH ( 0xeb000000 , 0x000d , dst_reg , dst_reg , REG_0 , imm ) ;
break ;
/*
* BPF_RSH
*/
case BPF_ALU | BPF_RSH | BPF_X : /* dst = (u32) dst >> (u32) src */
/* srl %dst,0(%src) */
EMIT4_DISP ( 0x88000000 , dst_reg , src_reg , 0 ) ;
EMIT_ZERO ( dst_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU64 | BPF_RSH | BPF_X : /* dst = dst >> src */
/* srlg %dst,%dst,0(%src) */
EMIT6_DISP_LH ( 0xeb000000 , 0x000c , dst_reg , dst_reg , src_reg , 0 ) ;
break ;
case BPF_ALU | BPF_RSH | BPF_K : /* dst = (u32) dst >> (u32) imm */
if ( imm = = 0 )
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
/* srl %dst,imm(%r0) */
EMIT4_DISP ( 0x88000000 , dst_reg , REG_0 , imm ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_RSH | BPF_K : /* dst = dst >> imm */
if ( imm = = 0 )
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
/* srlg %dst,%dst,imm(%r0) */
EMIT6_DISP_LH ( 0xeb000000 , 0x000c , dst_reg , dst_reg , REG_0 , imm ) ;
2012-07-31 16:23:59 +02:00
break ;
2015-04-01 16:08:32 +02:00
/*
* BPF_ARSH
*/
case BPF_ALU64 | BPF_ARSH | BPF_X : /* ((s64) dst) >>= src */
/* srag %dst,%dst,0(%src) */
EMIT6_DISP_LH ( 0xeb000000 , 0x000a , dst_reg , dst_reg , src_reg , 0 ) ;
break ;
case BPF_ALU64 | BPF_ARSH | BPF_K : /* ((s64) dst) >>= imm */
if ( imm = = 0 )
break ;
/* srag %dst,%dst,imm(%r0) */
EMIT6_DISP_LH ( 0xeb000000 , 0x000a , dst_reg , dst_reg , REG_0 , imm ) ;
break ;
/*
* BPF_NEG
*/
case BPF_ALU | BPF_NEG : /* dst = (u32) -dst */
/* lcr %dst,%dst */
EMIT2 ( 0x1300 , dst_reg , dst_reg ) ;
EMIT_ZERO ( dst_reg ) ;
break ;
case BPF_ALU64 | BPF_NEG : /* dst = -dst */
/* lcgr %dst,%dst */
EMIT4 ( 0xb9130000 , dst_reg , dst_reg ) ;
break ;
/*
* BPF_FROM_BE / LE
*/
case BPF_ALU | BPF_END | BPF_FROM_BE :
/* s390 is big endian, therefore only clear high order bytes */
switch ( imm ) {
case 16 : /* dst = (u16) cpu_to_be16(dst) */
/* llghr %dst,%dst */
EMIT4 ( 0xb9850000 , dst_reg , dst_reg ) ;
break ;
case 32 : /* dst = (u32) cpu_to_be32(dst) */
/* llgfr %dst,%dst */
EMIT4 ( 0xb9160000 , dst_reg , dst_reg ) ;
break ;
case 64 : /* dst = (u64) cpu_to_be64(dst) */
break ;
2012-07-31 16:23:59 +02:00
}
break ;
2015-04-01 16:08:32 +02:00
case BPF_ALU | BPF_END | BPF_FROM_LE :
switch ( imm ) {
case 16 : /* dst = (u16) cpu_to_le16(dst) */
/* lrvr %dst,%dst */
EMIT4 ( 0xb91f0000 , dst_reg , dst_reg ) ;
/* srl %dst,16(%r0) */
EMIT4_DISP ( 0x88000000 , dst_reg , REG_0 , 16 ) ;
/* llghr %dst,%dst */
EMIT4 ( 0xb9850000 , dst_reg , dst_reg ) ;
break ;
case 32 : /* dst = (u32) cpu_to_le32(dst) */
/* lrvr %dst,%dst */
EMIT4 ( 0xb91f0000 , dst_reg , dst_reg ) ;
/* llgfr %dst,%dst */
EMIT4 ( 0xb9160000 , dst_reg , dst_reg ) ;
break ;
case 64 : /* dst = (u64) cpu_to_le64(dst) */
/* lrvgr %dst,%dst */
EMIT4 ( 0xb90f0000 , dst_reg , dst_reg ) ;
2012-07-31 16:23:59 +02:00
break ;
}
break ;
2015-04-01 16:08:32 +02:00
/*
* BPF_ST ( X )
*/
case BPF_STX | BPF_MEM | BPF_B : /* *(u8 *)(dst + off) = src_reg */
/* stcy %src,off(%dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0072 , src_reg , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_STX | BPF_MEM | BPF_H : /* (u16 *)(dst + off) = src */
/* sthy %src,off(%dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0070 , src_reg , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_STX | BPF_MEM | BPF_W : /* *(u32 *)(dst + off) = src */
/* sty %src,off(%dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0050 , src_reg , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_STX | BPF_MEM | BPF_DW : /* (u64 *)(dst + off) = src */
/* stg %src,off(%dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0024 , src_reg , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_ST | BPF_MEM | BPF_B : /* *(u8 *)(dst + off) = imm */
/* lhi %w0,imm */
EMIT4_IMM ( 0xa7080000 , REG_W0 , ( u8 ) imm ) ;
/* stcy %w0,off(dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0072 , REG_W0 , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_ST | BPF_MEM | BPF_H : /* (u16 *)(dst + off) = imm */
/* lhi %w0,imm */
EMIT4_IMM ( 0xa7080000 , REG_W0 , ( u16 ) imm ) ;
/* sthy %w0,off(dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0070 , REG_W0 , dst_reg , REG_0 , off ) ;
2012-07-31 16:23:59 +02:00
jit - > seen | = SEEN_MEM ;
break ;
2015-04-01 16:08:32 +02:00
case BPF_ST | BPF_MEM | BPF_W : /* *(u32 *)(dst + off) = imm */
/* llilf %w0,imm */
EMIT6_IMM ( 0xc00f0000 , REG_W0 , ( u32 ) imm ) ;
/* sty %w0,off(%dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0050 , REG_W0 , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_ST | BPF_MEM | BPF_DW : /* *(u64 *)(dst + off) = imm */
/* lgfi %w0,imm */
EMIT6_IMM ( 0xc0010000 , REG_W0 , imm ) ;
/* stg %w0,off(%dst) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0024 , REG_W0 , dst_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
/*
* BPF_STX XADD ( atomic_add )
*/
case BPF_STX | BPF_XADD | BPF_W : /* *(u32 *)(dst + off) += src */
/* laal %w0,%src,off(%dst) */
EMIT6_DISP_LH ( 0xeb000000 , 0x00fa , REG_W0 , src_reg ,
dst_reg , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_STX | BPF_XADD | BPF_DW : /* *(u64 *)(dst + off) += src */
/* laalg %w0,%src,off(%dst) */
EMIT6_DISP_LH ( 0xeb000000 , 0x00ea , REG_W0 , src_reg ,
dst_reg , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
/*
* BPF_LDX
*/
case BPF_LDX | BPF_MEM | BPF_B : /* dst = *(u8 *)(ul) (src + off) */
/* llgc %dst,0(off,%src) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0090 , dst_reg , src_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_LDX | BPF_MEM | BPF_H : /* dst = *(u16 *)(ul) (src + off) */
/* llgh %dst,0(off,%src) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0091 , dst_reg , src_reg , REG_0 , off ) ;
jit - > seen | = SEEN_MEM ;
break ;
case BPF_LDX | BPF_MEM | BPF_W : /* dst = *(u32 *)(ul) (src + off) */
/* llgf %dst,off(%src) */
jit - > seen | = SEEN_MEM ;
EMIT6_DISP_LH ( 0xe3000000 , 0x0016 , dst_reg , src_reg , REG_0 , off ) ;
break ;
case BPF_LDX | BPF_MEM | BPF_DW : /* dst = *(u64 *)(ul) (src + off) */
/* lg %dst,0(off,%src) */
jit - > seen | = SEEN_MEM ;
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , dst_reg , src_reg , REG_0 , off ) ;
break ;
/*
* BPF_JMP / CALL
*/
case BPF_JMP | BPF_CALL :
{
/*
* b0 = ( __bpf_call_base + imm ) ( b1 , b2 , b3 , b4 , b5 )
*/
const u64 func = ( u64 ) __bpf_call_base + imm ;
REG_SET_SEEN ( BPF_REG_5 ) ;
jit - > seen | = SEEN_FUNC ;
/* lg %w1,<d(imm)>(%l) */
2015-07-29 21:15:16 +02:00
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , REG_W1 , REG_0 , REG_L ,
EMIT_CONST_U64 ( func ) ) ;
2015-04-01 16:08:32 +02:00
/* basr %r14,%w1 */
EMIT2 ( 0x0d00 , REG_14 , REG_W1 ) ;
/* lgr %b0,%r2: load return value into %b0 */
EMIT4 ( 0xb9040000 , BPF_REG_0 , REG_2 ) ;
2016-12-07 15:53:11 -08:00
if ( bpf_helper_changes_pkt_data ( ( void * ) func ) ) {
2015-07-29 21:15:18 +02:00
jit - > seen | = SEEN_SKB_CHANGE ;
/* lg %b1,ST_OFF_SKBP(%r15) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , BPF_REG_1 , REG_0 ,
REG_15 , STK_OFF_SKBP ) ;
emit_load_skb_data_hlen ( jit ) ;
}
2015-04-01 16:08:32 +02:00
break ;
}
2017-05-30 13:31:27 -07:00
case BPF_JMP | BPF_TAIL_CALL :
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
/*
* Implicit input :
* B1 : pointer to ctx
* B2 : pointer to bpf_array
* B3 : index in bpf_array
*/
jit - > seen | = SEEN_TAIL_CALL ;
/*
* if ( index > = array - > map . max_entries )
* goto out ;
*/
/* llgf %w1,map.max_entries(%b2) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0016 , REG_W1 , REG_0 , BPF_REG_2 ,
offsetof ( struct bpf_array , map . max_entries ) ) ;
/* clgrj %b3,%w1,0xa,label0: if %b3 >= %w1 goto out */
EMIT6_PCREL_LABEL ( 0xec000000 , 0x0065 , BPF_REG_3 ,
REG_W1 , 0 , 0xa ) ;
/*
* if ( tail_call_cnt + + > MAX_TAIL_CALL_CNT )
* goto out ;
*/
if ( jit - > seen & SEEN_STACK )
off = STK_OFF_TCCNT + STK_OFF ;
else
off = STK_OFF_TCCNT ;
/* lhi %w0,1 */
EMIT4_IMM ( 0xa7080000 , REG_W0 , 1 ) ;
/* laal %w1,%w0,off(%r15) */
EMIT6_DISP_LH ( 0xeb000000 , 0x00fa , REG_W1 , REG_W0 , REG_15 , off ) ;
/* clij %w1,MAX_TAIL_CALL_CNT,0x2,label0 */
EMIT6_PCREL_IMM_LABEL ( 0xec000000 , 0x007f , REG_W1 ,
MAX_TAIL_CALL_CNT , 0 , 0x2 ) ;
/*
2015-08-11 08:56:51 +00:00
* prog = array - > ptrs [ index ] ;
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
* if ( prog = = NULL )
* goto out ;
*/
/* sllg %r1,%b3,3: %r1 = index * 8 */
EMIT6_DISP_LH ( 0xeb000000 , 0x000d , REG_1 , BPF_REG_3 , REG_0 , 3 ) ;
/* lg %r1,prog(%b2,%r1) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , REG_1 , BPF_REG_2 ,
2015-08-11 08:56:51 +00:00
REG_1 , offsetof ( struct bpf_array , ptrs ) ) ;
s390/bpf: implement bpf_tail_call() helper
bpf_tail_call() arguments:
- ctx......: Context pointer
- jmp_table: One of BPF_MAP_TYPE_PROG_ARRAY maps used as the jump table
- index....: Index in the jump table
In this implementation s390x JIT does stack unwinding and jumps into the
callee program prologue. Caller and callee use the same stack.
With this patch a tail call generates the following code on s390x:
if (index >= array->map.max_entries)
goto out
000003ff8001c7e4: e31030100016 llgf %r1,16(%r3)
000003ff8001c7ea: ec41001fa065 clgrj %r4,%r1,10,3ff8001c828
if (tail_call_cnt++ > MAX_TAIL_CALL_CNT)
goto out;
000003ff8001c7f0: a7080001 lhi %r0,1
000003ff8001c7f4: eb10f25000fa laal %r1,%r0,592(%r15)
000003ff8001c7fa: ec120017207f clij %r1,32,2,3ff8001c828
prog = array->prog[index];
if (prog == NULL)
goto out;
000003ff8001c800: eb140003000d sllg %r1,%r4,3
000003ff8001c806: e31310800004 lg %r1,128(%r3,%r1)
000003ff8001c80c: ec18000e007d clgij %r1,0,8,3ff8001c828
Restore registers before calling function
000003ff8001c812: eb68f2980004 lmg %r6,%r8,664(%r15)
000003ff8001c818: ebbff2c00004 lmg %r11,%r15,704(%r15)
goto *(prog->bpf_func + tail_call_start);
000003ff8001c81e: e31100200004 lg %r1,32(%r1,%r0)
000003ff8001c824: 47f01006 bc 15,6(%r1)
Reviewed-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
Signed-off-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Acked-by: Heiko Carstens <heiko.carstens@de.ibm.com>
Signed-off-by: Alexei Starovoitov <ast@plumgrid.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-06-08 21:51:06 -07:00
/* clgij %r1,0,0x8,label0 */
EMIT6_PCREL_IMM_LABEL ( 0xec000000 , 0x007d , REG_1 , 0 , 0 , 0x8 ) ;
/*
* Restore registers before calling function
*/
save_restore_regs ( jit , REGS_RESTORE ) ;
/*
* goto * ( prog - > bpf_func + tail_call_start ) ;
*/
/* lg %r1,bpf_func(%r1) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , REG_1 , REG_1 , REG_0 ,
offsetof ( struct bpf_prog , bpf_func ) ) ;
/* bc 0xf,tail_call_start(%r1) */
_EMIT4 ( 0x47f01000 + jit - > tail_call_start ) ;
/* out: */
jit - > labels [ 0 ] = jit - > prg ;
break ;
2015-04-01 16:08:32 +02:00
case BPF_JMP | BPF_EXIT : /* return b0 */
last = ( i = = fp - > len - 1 ) ? 1 : 0 ;
if ( last & & ! ( jit - > seen & SEEN_RET0 ) )
break ;
2012-07-31 16:23:59 +02:00
/* j <exit> */
EMIT4_PCREL ( 0xa7f40000 , jit - > exit_ip - jit - > prg ) ;
break ;
2015-04-01 16:08:32 +02:00
/*
* Branch relative ( number of skipped instructions ) to offset on
* condition .
*
* Condition code to mask mapping :
*
* CC | Description | Mask
* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
* 0 | Operands equal | 8
* 1 | First operand low | 4
* 2 | First operand high | 2
* 3 | Unused | 1
*
* For s390x relative branches : ip = ip + off_bytes
* For BPF relative branches : insn = insn + off_insns + 1
*
* For example for s390x with offset 0 we jump to the branch
* instruction itself ( loop ) and for BPF with offset 0 we
* branch to the instruction behind the branch .
*/
case BPF_JMP | BPF_JA : /* if (true) */
mask = 0xf000 ; /* j */
goto branch_oc ;
case BPF_JMP | BPF_JSGT | BPF_K : /* ((s64) dst > (s64) imm) */
mask = 0x2000 ; /* jh */
goto branch_ks ;
case BPF_JMP | BPF_JSGE | BPF_K : /* ((s64) dst >= (s64) imm) */
mask = 0xa000 ; /* jhe */
goto branch_ks ;
case BPF_JMP | BPF_JGT | BPF_K : /* (dst_reg > imm) */
mask = 0x2000 ; /* jh */
goto branch_ku ;
case BPF_JMP | BPF_JGE | BPF_K : /* (dst_reg >= imm) */
mask = 0xa000 ; /* jhe */
goto branch_ku ;
case BPF_JMP | BPF_JNE | BPF_K : /* (dst_reg != imm) */
mask = 0x7000 ; /* jne */
goto branch_ku ;
case BPF_JMP | BPF_JEQ | BPF_K : /* (dst_reg == imm) */
mask = 0x8000 ; /* je */
goto branch_ku ;
case BPF_JMP | BPF_JSET | BPF_K : /* (dst_reg & imm) */
mask = 0x7000 ; /* jnz */
/* lgfi %w1,imm (load sign extend imm) */
EMIT6_IMM ( 0xc0010000 , REG_W1 , imm ) ;
/* ngr %w1,%dst */
EMIT4 ( 0xb9800000 , REG_W1 , dst_reg ) ;
goto branch_oc ;
case BPF_JMP | BPF_JSGT | BPF_X : /* ((s64) dst > (s64) src) */
mask = 0x2000 ; /* jh */
goto branch_xs ;
case BPF_JMP | BPF_JSGE | BPF_X : /* ((s64) dst >= (s64) src) */
mask = 0xa000 ; /* jhe */
goto branch_xs ;
case BPF_JMP | BPF_JGT | BPF_X : /* (dst > src) */
mask = 0x2000 ; /* jh */
goto branch_xu ;
case BPF_JMP | BPF_JGE | BPF_X : /* (dst >= src) */
mask = 0xa000 ; /* jhe */
goto branch_xu ;
case BPF_JMP | BPF_JNE | BPF_X : /* (dst != src) */
mask = 0x7000 ; /* jne */
goto branch_xu ;
case BPF_JMP | BPF_JEQ | BPF_X : /* (dst == src) */
mask = 0x8000 ; /* je */
goto branch_xu ;
case BPF_JMP | BPF_JSET | BPF_X : /* (dst & src) */
mask = 0x7000 ; /* jnz */
/* ngrk %w1,%dst,%src */
EMIT4_RRF ( 0xb9e40000 , REG_W1 , dst_reg , src_reg ) ;
goto branch_oc ;
branch_ks :
/* lgfi %w1,imm (load sign extend imm) */
EMIT6_IMM ( 0xc0010000 , REG_W1 , imm ) ;
/* cgrj %dst,%w1,mask,off */
EMIT6_PCREL ( 0xec000000 , 0x0064 , dst_reg , REG_W1 , i , off , mask ) ;
break ;
branch_ku :
/* lgfi %w1,imm (load sign extend imm) */
EMIT6_IMM ( 0xc0010000 , REG_W1 , imm ) ;
/* clgrj %dst,%w1,mask,off */
EMIT6_PCREL ( 0xec000000 , 0x0065 , dst_reg , REG_W1 , i , off , mask ) ;
break ;
branch_xs :
/* cgrj %dst,%src,mask,off */
EMIT6_PCREL ( 0xec000000 , 0x0064 , dst_reg , src_reg , i , off , mask ) ;
break ;
branch_xu :
/* clgrj %dst,%src,mask,off */
EMIT6_PCREL ( 0xec000000 , 0x0065 , dst_reg , src_reg , i , off , mask ) ;
break ;
branch_oc :
/* brc mask,jmp_off (branch instruction needs 4 bytes) */
jmp_off = addrs [ i + off + 1 ] - ( addrs [ i + 1 ] - 4 ) ;
EMIT4_PCREL ( 0xa7040000 | mask < < 8 , jmp_off ) ;
2013-02-09 14:07:50 +01:00
break ;
2015-04-01 16:08:32 +02:00
/*
* BPF_LD
*/
case BPF_LD | BPF_ABS | BPF_B : /* b0 = *(u8 *) (skb->data+imm) */
case BPF_LD | BPF_IND | BPF_B : /* b0 = *(u8 *) (skb->data+imm+src) */
if ( ( BPF_MODE ( insn - > code ) = = BPF_ABS ) & & ( imm > = 0 ) )
func_addr = __pa ( sk_load_byte_pos ) ;
else
func_addr = __pa ( sk_load_byte ) ;
goto call_fn ;
case BPF_LD | BPF_ABS | BPF_H : /* b0 = *(u16 *) (skb->data+imm) */
case BPF_LD | BPF_IND | BPF_H : /* b0 = *(u16 *) (skb->data+imm+src) */
if ( ( BPF_MODE ( insn - > code ) = = BPF_ABS ) & & ( imm > = 0 ) )
func_addr = __pa ( sk_load_half_pos ) ;
else
func_addr = __pa ( sk_load_half ) ;
goto call_fn ;
case BPF_LD | BPF_ABS | BPF_W : /* b0 = *(u32 *) (skb->data+imm) */
case BPF_LD | BPF_IND | BPF_W : /* b0 = *(u32 *) (skb->data+imm+src) */
if ( ( BPF_MODE ( insn - > code ) = = BPF_ABS ) & & ( imm > = 0 ) )
func_addr = __pa ( sk_load_word_pos ) ;
else
func_addr = __pa ( sk_load_word ) ;
goto call_fn ;
call_fn :
jit - > seen | = SEEN_SKB | SEEN_RET0 | SEEN_FUNC ;
REG_SET_SEEN ( REG_14 ) ; /* Return address of possible func call */
/*
* Implicit input :
* BPF_REG_6 ( R7 ) : skb pointer
2016-05-13 19:08:35 +02:00
* REG_SKB_DATA ( R12 ) : skb data pointer ( if no BPF_REG_AX )
2015-04-01 16:08:32 +02:00
*
* Calculated input :
* BPF_REG_2 ( R3 ) : offset of byte ( s ) to fetch in skb
* BPF_REG_5 ( R6 ) : return address
*
* Output :
* BPF_REG_0 ( R14 ) : data read from skb
*
* Scratch registers ( BPF_REG_1 - 5 )
*/
/* Call function: llilf %w1,func_addr */
EMIT6_IMM ( 0xc00f0000 , REG_W1 , func_addr ) ;
/* Offset: lgfi %b2,imm */
EMIT6_IMM ( 0xc0010000 , BPF_REG_2 , imm ) ;
if ( BPF_MODE ( insn - > code ) = = BPF_IND )
/* agfr %b2,%src (%src is s32 here) */
EMIT4 ( 0xb9180000 , BPF_REG_2 , src_reg ) ;
2016-05-13 19:08:35 +02:00
/* Reload REG_SKB_DATA if BPF_REG_AX is used */
if ( jit - > seen & SEEN_REG_AX )
/* lg %skb_data,data_off(%b6) */
EMIT6_DISP_LH ( 0xe3000000 , 0x0004 , REG_SKB_DATA , REG_0 ,
BPF_REG_6 , offsetof ( struct sk_buff , data ) ) ;
2015-04-01 16:08:32 +02:00
/* basr %b5,%w1 (%b5 is call saved) */
EMIT2 ( 0x0d00 , BPF_REG_5 , REG_W1 ) ;
/*
* Note : For fast access we jump directly after the
* jnz instruction from bpf_jit . S
*/
/* jnz <ret0> */
EMIT4_PCREL ( 0xa7740000 , jit - > ret0_ip - jit - > prg ) ;
2012-07-31 16:23:59 +02:00
break ;
default : /* too complex, give up */
2015-04-01 16:08:32 +02:00
pr_err ( " Unknown opcode %02x \n " , insn - > code ) ;
return - 1 ;
}
return insn_count ;
}
/*
* Compile eBPF program into s390x code
*/
static int bpf_jit_prog ( struct bpf_jit * jit , struct bpf_prog * fp )
{
int i , insn_count ;
jit - > lit = jit - > lit_start ;
jit - > prg = 0 ;
bpf: move clearing of A/X into classic to eBPF migration prologue
Back in the days where eBPF (or back then "internal BPF" ;->) was not
exposed to user space, and only the classic BPF programs internally
translated into eBPF programs, we missed the fact that for classic BPF
A and X needed to be cleared. It was fixed back then via 83d5b7ef99c9
("net: filter: initialize A and X registers"), and thus classic BPF
specifics were added to the eBPF interpreter core to work around it.
This added some confusion for JIT developers later on that take the
eBPF interpreter code as an example for deriving their JIT. F.e. in
f75298f5c3fe ("s390/bpf: clear correct BPF accumulator register"), at
least X could leak stack memory. Furthermore, since this is only needed
for classic BPF translations and not for eBPF (verifier takes care
that read access to regs cannot be done uninitialized), more complexity
is added to JITs as they need to determine whether they deal with
migrations or native eBPF where they can just omit clearing A/X in
their prologue and thus reduce image size a bit, see f.e. cde66c2d88da
("s390/bpf: Only clear A and X for converted BPF programs"). In other
cases (x86, arm64), A and X is being cleared in the prologue also for
eBPF case, which is unnecessary.
Lets move this into the BPF migration in bpf_convert_filter() where it
actually belongs as long as the number of eBPF JITs are still few. It
can thus be done generically; allowing us to remove the quirk from
__bpf_prog_run() and to slightly reduce JIT image size in case of eBPF,
while reducing code duplication on this matter in current(/future) eBPF
JITs.
Signed-off-by: Daniel Borkmann <daniel@iogearbox.net>
Acked-by: Alexei Starovoitov <ast@kernel.org>
Reviewed-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Tested-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Cc: Zi Shen Lim <zlim.lnx@gmail.com>
Cc: Yang Shi <yang.shi@linaro.org>
Acked-by: Yang Shi <yang.shi@linaro.org>
Acked-by: Zi Shen Lim <zlim.lnx@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2015-12-17 23:51:54 +01:00
bpf_jit_prologue ( jit ) ;
2015-04-01 16:08:32 +02:00
for ( i = 0 ; i < fp - > len ; i + = insn_count ) {
insn_count = bpf_jit_insn ( jit , fp , i ) ;
if ( insn_count < 0 )
return - 1 ;
bpf, s390: fix jit branch offset related to ldimm64
While testing some other work that required JIT modifications, I
run into test_bpf causing a hang when JIT enabled on s390. The
problematic test case was the one from ddc665a4bb4b (bpf, arm64:
fix jit branch offset related to ldimm64), and turns out that we
do have a similar issue on s390 as well. In bpf_jit_prog() we
update next instruction address after returning from bpf_jit_insn()
with an insn_count. bpf_jit_insn() returns either -1 in case of
error (e.g. unsupported insn), 1 or 2. The latter is only the
case for ldimm64 due to spanning 2 insns, however, next address
is only set to i + 1 not taking actual insn_count into account,
thus fix is to use insn_count instead of 1. bpf_jit_enable in
mode 2 provides also disasm on s390:
Before fix:
000003ff800349b6: a7f40003 brc 15,3ff800349bc ; target
000003ff800349ba: 0000 unknown
000003ff800349bc: e3b0f0700024 stg %r11,112(%r15)
000003ff800349c2: e3e0f0880024 stg %r14,136(%r15)
000003ff800349c8: 0db0 basr %r11,%r0
000003ff800349ca: c0ef00000000 llilf %r14,0
000003ff800349d0: e320b0360004 lg %r2,54(%r11)
000003ff800349d6: e330b03e0004 lg %r3,62(%r11)
000003ff800349dc: ec23ffeda065 clgrj %r2,%r3,10,3ff800349b6 ; jmp
000003ff800349e2: e3e0b0460004 lg %r14,70(%r11)
000003ff800349e8: e3e0b04e0004 lg %r14,78(%r11)
000003ff800349ee: b904002e lgr %r2,%r14
000003ff800349f2: e3b0f0700004 lg %r11,112(%r15)
000003ff800349f8: e3e0f0880004 lg %r14,136(%r15)
000003ff800349fe: 07fe bcr 15,%r14
After fix:
000003ff80ef3db4: a7f40003 brc 15,3ff80ef3dba
000003ff80ef3db8: 0000 unknown
000003ff80ef3dba: e3b0f0700024 stg %r11,112(%r15)
000003ff80ef3dc0: e3e0f0880024 stg %r14,136(%r15)
000003ff80ef3dc6: 0db0 basr %r11,%r0
000003ff80ef3dc8: c0ef00000000 llilf %r14,0
000003ff80ef3dce: e320b0360004 lg %r2,54(%r11)
000003ff80ef3dd4: e330b03e0004 lg %r3,62(%r11)
000003ff80ef3dda: ec230006a065 clgrj %r2,%r3,10,3ff80ef3de6 ; jmp
000003ff80ef3de0: e3e0b0460004 lg %r14,70(%r11)
000003ff80ef3de6: e3e0b04e0004 lg %r14,78(%r11) ; target
000003ff80ef3dec: b904002e lgr %r2,%r14
000003ff80ef3df0: e3b0f0700004 lg %r11,112(%r15)
000003ff80ef3df6: e3e0f0880004 lg %r14,136(%r15)
000003ff80ef3dfc: 07fe bcr 15,%r14
test_bpf.ko suite runs fine after the fix.
Fixes: 054623105728 ("s390/bpf: Add s390x eBPF JIT compiler backend")
Signed-off-by: Daniel Borkmann <daniel@iogearbox.net>
Tested-by: Michael Holzheu <holzheu@linux.vnet.ibm.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2017-08-04 14:20:54 +02:00
/* Next instruction address */
jit - > addrs [ i + insn_count ] = jit - > prg ;
2012-07-31 16:23:59 +02:00
}
2015-04-01 16:08:32 +02:00
bpf_jit_epilogue ( jit ) ;
jit - > lit_start = jit - > prg ;
jit - > size = jit - > lit ;
jit - > size_prg = jit - > prg ;
2012-07-31 16:23:59 +02:00
return 0 ;
}
2015-04-01 16:08:32 +02:00
/*
* Compile eBPF program " fp "
*/
2016-05-13 19:08:31 +02:00
struct bpf_prog * bpf_int_jit_compile ( struct bpf_prog * fp )
2015-04-01 16:08:32 +02:00
{
2016-05-13 19:08:35 +02:00
struct bpf_prog * tmp , * orig_fp = fp ;
2015-04-01 16:08:32 +02:00
struct bpf_binary_header * header ;
2016-05-13 19:08:35 +02:00
bool tmp_blinded = false ;
2015-04-01 16:08:32 +02:00
struct bpf_jit jit ;
int pass ;
2012-07-31 16:23:59 +02:00
if ( ! bpf_jit_enable )
2016-05-13 19:08:35 +02:00
return orig_fp ;
tmp = bpf_jit_blind_constants ( fp ) ;
/*
* If blinding was requested and we failed during blinding ,
* we must fall back to the interpreter .
*/
if ( IS_ERR ( tmp ) )
return orig_fp ;
if ( tmp ! = fp ) {
tmp_blinded = true ;
fp = tmp ;
}
2016-05-13 19:08:31 +02:00
2015-04-01 16:08:32 +02:00
memset ( & jit , 0 , sizeof ( jit ) ) ;
jit . addrs = kcalloc ( fp - > len + 1 , sizeof ( * jit . addrs ) , GFP_KERNEL ) ;
2016-05-13 19:08:35 +02:00
if ( jit . addrs = = NULL ) {
fp = orig_fp ;
goto out ;
}
2015-04-01 16:08:32 +02:00
/*
* Three initial passes :
* - 1 / 2 : Determine clobbered registers
* - 3 : Calculate program size and addrs arrray
*/
for ( pass = 1 ; pass < = 3 ; pass + + ) {
2016-05-13 19:08:35 +02:00
if ( bpf_jit_prog ( & jit , fp ) ) {
fp = orig_fp ;
2015-04-01 16:08:32 +02:00
goto free_addrs ;
2016-05-13 19:08:35 +02:00
}
2012-07-31 16:23:59 +02:00
}
2015-04-01 16:08:32 +02:00
/*
* Final pass : Allocate and generate program
*/
2016-05-13 19:08:35 +02:00
if ( jit . size > = BPF_SIZE_MAX ) {
fp = orig_fp ;
2015-04-01 16:08:32 +02:00
goto free_addrs ;
2016-05-13 19:08:35 +02:00
}
2015-04-01 16:08:32 +02:00
header = bpf_jit_binary_alloc ( jit . size , & jit . prg_buf , 2 , jit_fill_hole ) ;
2016-05-13 19:08:35 +02:00
if ( ! header ) {
fp = orig_fp ;
2015-04-01 16:08:32 +02:00
goto free_addrs ;
2016-05-13 19:08:35 +02:00
}
if ( bpf_jit_prog ( & jit , fp ) ) {
fp = orig_fp ;
2015-04-01 16:08:32 +02:00
goto free_addrs ;
2016-05-13 19:08:35 +02:00
}
2012-07-31 16:23:59 +02:00
if ( bpf_jit_enable > 1 ) {
2015-04-01 16:08:32 +02:00
bpf_jit_dump ( fp - > len , jit . size , pass , jit . prg_buf ) ;
2017-01-14 01:48:24 +01:00
print_fn_code ( jit . prg_buf , jit . size_prg ) ;
2013-07-16 13:25:49 +02:00
}
2017-02-22 10:20:04 -08:00
bpf_jit_binary_lock_ro ( header ) ;
2017-01-14 01:48:24 +01:00
fp - > bpf_func = ( void * ) jit . prg_buf ;
fp - > jited = 1 ;
2017-06-05 12:15:51 -07:00
fp - > jited_len = jit . size ;
2015-04-01 16:08:32 +02:00
free_addrs :
kfree ( jit . addrs ) ;
2016-05-13 19:08:35 +02:00
out :
if ( tmp_blinded )
bpf_jit_prog_release_other ( fp , fp = = orig_fp ?
tmp : orig_fp ) ;
2016-05-13 19:08:31 +02:00
return fp ;
2012-07-31 16:23:59 +02:00
}