diff mbox series

[bpf-next,v2,6/8] bpftool: Add LLVM as default library for disassembling JIT-ed programs

Message ID 20220911201451.12368-7-quentin@isovalent.com (mailing list archive)
State Changes Requested
Delegated to: BPF
Headers show
Series bpftool: Add LLVM as default library for disassembling JIT-ed programs | expand

Checks

Context Check Description
netdev/tree_selection success Clearly marked for bpf-next
netdev/fixes_present success Fixes tag not required for -next series
netdev/subject_prefix success Link
netdev/cover_letter success Series has a cover letter
netdev/patch_count success Link
netdev/header_inline success No static functions without inline keyword in header files
netdev/build_32bit success Errors and warnings before: 0 this patch: 0
netdev/cc_maintainers warning 6 maintainers not CCed: nathan@kernel.org song@kernel.org llvm@lists.linux.dev trix@redhat.com ndesaulniers@google.com martin.lau@linux.dev
netdev/build_clang success Errors and warnings before: 0 this patch: 0
netdev/module_param success Was 0 now: 0
netdev/verify_signedoff success Signed-off-by tag matches author and committer
netdev/check_selftest success No net selftest shell script
netdev/verify_fixes success No Fixes tag
netdev/build_allmodconfig_warn success Errors and warnings before: 0 this patch: 0
netdev/checkpatch warning WARNING: do not add new typedefs
netdev/kdoc success Errors and warnings before: 0 this patch: 0
netdev/source_inline success Was 0 now: 0
bpf/vmtest-bpf-next-VM_Test-7 success Logs for test_maps on x86_64 with gcc
bpf/vmtest-bpf-next-VM_Test-8 success Logs for test_maps on x86_64 with llvm-16
bpf/vmtest-bpf-next-VM_Test-9 success Logs for test_progs on s390x with gcc
bpf/vmtest-bpf-next-VM_Test-10 success Logs for test_progs on x86_64 with gcc
bpf/vmtest-bpf-next-VM_Test-11 success Logs for test_progs on x86_64 with llvm-16
bpf/vmtest-bpf-next-VM_Test-12 success Logs for test_progs_no_alu32 on s390x with gcc
bpf/vmtest-bpf-next-VM_Test-13 success Logs for test_progs_no_alu32 on x86_64 with gcc
bpf/vmtest-bpf-next-VM_Test-14 success Logs for test_progs_no_alu32 on x86_64 with llvm-16
bpf/vmtest-bpf-next-VM_Test-15 success Logs for test_verifier on s390x with gcc
bpf/vmtest-bpf-next-PR fail PR summary
bpf/vmtest-bpf-next-VM_Test-6 success Logs for set-matrix
bpf/vmtest-bpf-next-VM_Test-2 success Logs for build for x86_64 with gcc
bpf/vmtest-bpf-next-VM_Test-3 success Logs for build for x86_64 with llvm-16
bpf/vmtest-bpf-next-VM_Test-1 success Logs for build for s390x with gcc
bpf/vmtest-bpf-next-VM_Test-16 success Logs for test_verifier on x86_64 with gcc
bpf/vmtest-bpf-next-VM_Test-17 success Logs for test_verifier on x86_64 with llvm-16
bpf/vmtest-bpf-next-VM_Test-4 success Logs for llvm-toolchain
bpf/vmtest-bpf-next-VM_Test-5 success Logs for set-matrix

Commit Message

Quentin Monnet Sept. 11, 2022, 8:14 p.m. UTC
To disassemble instructions for JIT-ed programs, bpftool has relied on
the libbfd library. This has been problematic in the past: libbfd's
interface is not meant to be stable and has changed several times. For
building bpftool, we have to detect how the libbfd version on the system
behaves, which is why we have to handle features disassembler-four-args
and disassembler-init-styled in the Makefile. When it comes to shipping
bpftool, this has also caused issues with several distribution
maintainers unwilling to support the feature (see for example Debian's
page for binutils-dev, which ships libbfd: "Note that building Debian
packages which depend on the shared libbfd is Not Allowed." [0]).

For these reasons, we add support for LLVM as an alternative to libbfd
for disassembling instructions of JIT-ed programs. Thanks to the
preparation work in the previous commits, it's easy to add the library
by passing the relevant compilation options in the Makefile, and by
adding the functions for setting up the LLVM disassembler in file
jit_disasm.c.

Naturally, the display of disassembled instructions comes with a few
minor differences. Here is a sample output with libbfd (already
supported before this patch):

    # bpftool prog dump jited id 56
    bpf_prog_6deef7357e7b4530:
       0:   nopl   0x0(%rax,%rax,1)
       5:   xchg   %ax,%ax
       7:   push   %rbp
       8:   mov    %rsp,%rbp
       b:   push   %rbx
       c:   push   %r13
       e:   push   %r14
      10:   mov    %rdi,%rbx
      13:   movzwq 0xb4(%rbx),%r13
      1b:   xor    %r14d,%r14d
      1e:   or     $0x2,%r14d
      22:   mov    $0x1,%eax
      27:   cmp    $0x2,%r14
      2b:   jne    0x000000000000002f
      2d:   xor    %eax,%eax
      2f:   pop    %r14
      31:   pop    %r13
      33:   pop    %rbx
      34:   leave
      35:   ret

LLVM supports several variants that we could set when initialising the
disassembler, for example with:

    LLVMSetDisasmOptions(*ctx,
                         LLVMDisassembler_Option_AsmPrinterVariant);

but the default printer is used for now. Here is the output with LLVM:

    # bpftool prog dump jited id 56
    bpf_prog_6deef7357e7b4530:
       0:   nopl    (%rax,%rax)
       5:   nop
       7:   pushq   %rbp
       8:   movq    %rsp, %rbp
       b:   pushq   %rbx
       c:   pushq   %r13
       e:   pushq   %r14
      10:   movq    %rdi, %rbx
      13:   movzwq  180(%rbx), %r13
      1b:   xorl    %r14d, %r14d
      1e:   orl     $2, %r14d
      22:   movl    $1, %eax
      27:   cmpq    $2, %r14
      2b:   jne     0x2f
      2d:   xorl    %eax, %eax
      2f:   popq    %r14
      31:   popq    %r13
      33:   popq    %rbx
      34:   leave
      35:   retq

The LLVM disassembler comes as the default choice, with libbfd as a
fall-back.

Of course, we could replace libbfd entirely and avoid supporting two
different libraries. One reason for keeping libbfd is that, right now,
it works well, we have all we need in terms of features detection in the
Makefile, so it provides a fallback for disassembling JIT-ed programs if
libbfd is installed but LLVM is not. The other motivation is that libbfd
supports nfp instruction for Netronome's SmartNICs and can be used to
disassemble offloaded programs, something that LLVM cannot do. If
libbfd's interface breaks again in the future, we might reconsider
keeping support for it.

[0] https://packages.debian.org/buster/binutils-dev

Signed-off-by: Quentin Monnet <quentin@isovalent.com>
Tested-by: Niklas Söderlund <niklas.soderlund@corigine.com>
---
 tools/bpf/bpftool/Makefile     |  46 +++++++++-----
 tools/bpf/bpftool/jit_disasm.c | 112 ++++++++++++++++++++++++++++++++-
 tools/bpf/bpftool/main.h       |   4 +-
 3 files changed, 140 insertions(+), 22 deletions(-)

Comments

Daniel Borkmann Sept. 16, 2022, 9:09 p.m. UTC | #1
On 9/11/22 10:14 PM, Quentin Monnet wrote:
> To disassemble instructions for JIT-ed programs, bpftool has relied on
> the libbfd library. This has been problematic in the past: libbfd's
> interface is not meant to be stable and has changed several times. For
> building bpftool, we have to detect how the libbfd version on the system
> behaves, which is why we have to handle features disassembler-four-args
> and disassembler-init-styled in the Makefile. When it comes to shipping
> bpftool, this has also caused issues with several distribution
> maintainers unwilling to support the feature (see for example Debian's
> page for binutils-dev, which ships libbfd: "Note that building Debian
> packages which depend on the shared libbfd is Not Allowed." [0]).
> 
> For these reasons, we add support for LLVM as an alternative to libbfd
> for disassembling instructions of JIT-ed programs. Thanks to the
> preparation work in the previous commits, it's easy to add the library
> by passing the relevant compilation options in the Makefile, and by
> adding the functions for setting up the LLVM disassembler in file
> jit_disasm.c.

Could you add more context around the LLVM lib? The motivation is that libbfd's
interface is not meant to be stable and has changed several times. How does this
look on the LLVM's library side? Also, for the 2nd part, what is Debian's stance
related to the LLVM lib? Would be good if both is explained in the commit message.
Right now it mainly reads 'that libbfd has all these issues, so we're moving to
something else', so would be good to provide more context to the ready why the
'something else' is better than current one.

> Naturally, the display of disassembled instructions comes with a few
> minor differences. Here is a sample output with libbfd (already
> supported before this patch):
> 
>      # bpftool prog dump jited id 56
>      bpf_prog_6deef7357e7b4530:
>         0:   nopl   0x0(%rax,%rax,1)
>         5:   xchg   %ax,%ax
>         7:   push   %rbp
>         8:   mov    %rsp,%rbp
>         b:   push   %rbx
>         c:   push   %r13
>         e:   push   %r14
>        10:   mov    %rdi,%rbx
>        13:   movzwq 0xb4(%rbx),%r13
>        1b:   xor    %r14d,%r14d
>        1e:   or     $0x2,%r14d
>        22:   mov    $0x1,%eax
>        27:   cmp    $0x2,%r14
>        2b:   jne    0x000000000000002f
>        2d:   xor    %eax,%eax
>        2f:   pop    %r14
>        31:   pop    %r13
>        33:   pop    %rbx
>        34:   leave
>        35:   ret
> 
> LLVM supports several variants that we could set when initialising the
> disassembler, for example with:
> 
>      LLVMSetDisasmOptions(*ctx,
>                           LLVMDisassembler_Option_AsmPrinterVariant);
> 
> but the default printer is used for now. Here is the output with LLVM:
> 
>      # bpftool prog dump jited id 56
>      bpf_prog_6deef7357e7b4530:
>         0:   nopl    (%rax,%rax)
>         5:   nop
>         7:   pushq   %rbp
>         8:   movq    %rsp, %rbp
>         b:   pushq   %rbx
>         c:   pushq   %r13
>         e:   pushq   %r14
>        10:   movq    %rdi, %rbx
>        13:   movzwq  180(%rbx), %r13
>        1b:   xorl    %r14d, %r14d
>        1e:   orl     $2, %r14d
>        22:   movl    $1, %eax
>        27:   cmpq    $2, %r14
>        2b:   jne     0x2f
>        2d:   xorl    %eax, %eax
>        2f:   popq    %r14
>        31:   popq    %r13
>        33:   popq    %rbx
>        34:   leave
>        35:   retq
> 
> The LLVM disassembler comes as the default choice, with libbfd as a
> fall-back.
> 
> Of course, we could replace libbfd entirely and avoid supporting two
> different libraries. One reason for keeping libbfd is that, right now,
> it works well, we have all we need in terms of features detection in the
> Makefile, so it provides a fallback for disassembling JIT-ed programs if
> libbfd is installed but LLVM is not. The other motivation is that libbfd
> supports nfp instruction for Netronome's SmartNICs and can be used to
> disassemble offloaded programs, something that LLVM cannot do. If
> libbfd's interface breaks again in the future, we might reconsider
> keeping support for it.
> 
> [0] https://packages.debian.org/buster/binutils-dev
> 
> Signed-off-by: Quentin Monnet <quentin@isovalent.com>
> Tested-by: Niklas Söderlund <niklas.soderlund@corigine.com>

Thanks,
Daniel
Yonghong Song Sept. 19, 2022, 11:58 p.m. UTC | #2
On 9/11/22 1:14 PM, Quentin Monnet wrote:
> To disassemble instructions for JIT-ed programs, bpftool has relied on
> the libbfd library. This has been problematic in the past: libbfd's
> interface is not meant to be stable and has changed several times. For
> building bpftool, we have to detect how the libbfd version on the system
> behaves, which is why we have to handle features disassembler-four-args
> and disassembler-init-styled in the Makefile. When it comes to shipping
> bpftool, this has also caused issues with several distribution
> maintainers unwilling to support the feature (see for example Debian's
> page for binutils-dev, which ships libbfd: "Note that building Debian
> packages which depend on the shared libbfd is Not Allowed." [0]).
> 
> For these reasons, we add support for LLVM as an alternative to libbfd
> for disassembling instructions of JIT-ed programs. Thanks to the
> preparation work in the previous commits, it's easy to add the library
> by passing the relevant compilation options in the Makefile, and by
> adding the functions for setting up the LLVM disassembler in file
> jit_disasm.c.
> 
> Naturally, the display of disassembled instructions comes with a few
> minor differences. Here is a sample output with libbfd (already
> supported before this patch):
> 
>      # bpftool prog dump jited id 56
>      bpf_prog_6deef7357e7b4530:
>         0:   nopl   0x0(%rax,%rax,1)
>         5:   xchg   %ax,%ax
>         7:   push   %rbp
>         8:   mov    %rsp,%rbp
>         b:   push   %rbx
>         c:   push   %r13
>         e:   push   %r14
>        10:   mov    %rdi,%rbx
>        13:   movzwq 0xb4(%rbx),%r13
>        1b:   xor    %r14d,%r14d
>        1e:   or     $0x2,%r14d
>        22:   mov    $0x1,%eax
>        27:   cmp    $0x2,%r14
>        2b:   jne    0x000000000000002f
>        2d:   xor    %eax,%eax
>        2f:   pop    %r14
>        31:   pop    %r13
>        33:   pop    %rbx
>        34:   leave
>        35:   ret
> 
> LLVM supports several variants that we could set when initialising the
> disassembler, for example with:
> 
>      LLVMSetDisasmOptions(*ctx,
>                           LLVMDisassembler_Option_AsmPrinterVariant);
> 
> but the default printer is used for now. Here is the output with LLVM:
> 
>      # bpftool prog dump jited id 56
>      bpf_prog_6deef7357e7b4530:
>         0:   nopl    (%rax,%rax)
>         5:   nop
>         7:   pushq   %rbp
>         8:   movq    %rsp, %rbp
>         b:   pushq   %rbx
>         c:   pushq   %r13
>         e:   pushq   %r14
>        10:   movq    %rdi, %rbx
>        13:   movzwq  180(%rbx), %r13
>        1b:   xorl    %r14d, %r14d
>        1e:   orl     $2, %r14d
>        22:   movl    $1, %eax
>        27:   cmpq    $2, %r14
>        2b:   jne     0x2f
>        2d:   xorl    %eax, %eax
>        2f:   popq    %r14
>        31:   popq    %r13
>        33:   popq    %rbx
>        34:   leave
>        35:   retq
> 
> The LLVM disassembler comes as the default choice, with libbfd as a
> fall-back.
> 
> Of course, we could replace libbfd entirely and avoid supporting two
> different libraries. One reason for keeping libbfd is that, right now,
> it works well, we have all we need in terms of features detection in the
> Makefile, so it provides a fallback for disassembling JIT-ed programs if
> libbfd is installed but LLVM is not. The other motivation is that libbfd
> supports nfp instruction for Netronome's SmartNICs and can be used to
> disassemble offloaded programs, something that LLVM cannot do. If
> libbfd's interface breaks again in the future, we might reconsider
> keeping support for it.
> 
> [0] https://packages.debian.org/buster/binutils-dev
> 
> Signed-off-by: Quentin Monnet <quentin@isovalent.com>
> Tested-by: Niklas Söderlund <niklas.soderlund@corigine.com>

Acked-by: Yonghong Song <yhs@fb.com>
Yonghong Song Sept. 20, 2022, 4:08 a.m. UTC | #3
On 9/16/22 2:09 PM, Daniel Borkmann wrote:
> On 9/11/22 10:14 PM, Quentin Monnet wrote:
>> To disassemble instructions for JIT-ed programs, bpftool has relied on
>> the libbfd library. This has been problematic in the past: libbfd's
>> interface is not meant to be stable and has changed several times. For
>> building bpftool, we have to detect how the libbfd version on the system
>> behaves, which is why we have to handle features disassembler-four-args
>> and disassembler-init-styled in the Makefile. When it comes to shipping
>> bpftool, this has also caused issues with several distribution
>> maintainers unwilling to support the feature (see for example Debian's
>> page for binutils-dev, which ships libbfd: "Note that building Debian
>> packages which depend on the shared libbfd is Not Allowed." [0]).
>>
>> For these reasons, we add support for LLVM as an alternative to libbfd
>> for disassembling instructions of JIT-ed programs. Thanks to the
>> preparation work in the previous commits, it's easy to add the library
>> by passing the relevant compilation options in the Makefile, and by
>> adding the functions for setting up the LLVM disassembler in file
>> jit_disasm.c.
> 
> Could you add more context around the LLVM lib? The motivation is that 
> libbfd's
> interface is not meant to be stable and has changed several times. How 
> does this
> look on the LLVM's library side? Also, for the 2nd part, what is 
> Debian's stance
> related to the LLVM lib? Would be good if both is explained in the 
> commit message.
> Right now it mainly reads 'that libbfd has all these issues, so we're 
> moving to
> something else', so would be good to provide more context to the ready 
> why the
> 'something else' is better than current one.

It will be good to mention that e.g., llvm development package
(e.g., llvm-devel for fedora) is needed for bpftool build with llvm.

> 
>> Naturally, the display of disassembled instructions comes with a few
>> minor differences. Here is a sample output with libbfd (already
>> supported before this patch):
>>
>>      # bpftool prog dump jited id 56
>>      bpf_prog_6deef7357e7b4530:
>>         0:   nopl   0x0(%rax,%rax,1)
>>         5:   xchg   %ax,%ax
>>         7:   push   %rbp
>>         8:   mov    %rsp,%rbp
>>         b:   push   %rbx
>>         c:   push   %r13
>>         e:   push   %r14
>>        10:   mov    %rdi,%rbx
>>        13:   movzwq 0xb4(%rbx),%r13
>>        1b:   xor    %r14d,%r14d
>>        1e:   or     $0x2,%r14d
>>        22:   mov    $0x1,%eax
>>        27:   cmp    $0x2,%r14
>>        2b:   jne    0x000000000000002f
>>        2d:   xor    %eax,%eax
>>        2f:   pop    %r14
>>        31:   pop    %r13
>>        33:   pop    %rbx
>>        34:   leave
>>        35:   ret
>>
>> LLVM supports several variants that we could set when initialising the
>> disassembler, for example with:
>>
>>      LLVMSetDisasmOptions(*ctx,
>>                           LLVMDisassembler_Option_AsmPrinterVariant);
>>
>> but the default printer is used for now. Here is the output with LLVM:
>>
>>      # bpftool prog dump jited id 56
>>      bpf_prog_6deef7357e7b4530:
>>         0:   nopl    (%rax,%rax)
>>         5:   nop
>>         7:   pushq   %rbp
>>         8:   movq    %rsp, %rbp
>>         b:   pushq   %rbx
>>         c:   pushq   %r13
>>         e:   pushq   %r14
>>        10:   movq    %rdi, %rbx
>>        13:   movzwq  180(%rbx), %r13
>>        1b:   xorl    %r14d, %r14d
>>        1e:   orl     $2, %r14d
>>        22:   movl    $1, %eax
>>        27:   cmpq    $2, %r14
>>        2b:   jne     0x2f
>>        2d:   xorl    %eax, %eax
>>        2f:   popq    %r14
>>        31:   popq    %r13
>>        33:   popq    %rbx
>>        34:   leave
>>        35:   retq
>>
>> The LLVM disassembler comes as the default choice, with libbfd as a
>> fall-back.
>>
>> Of course, we could replace libbfd entirely and avoid supporting two
>> different libraries. One reason for keeping libbfd is that, right now,
>> it works well, we have all we need in terms of features detection in the
>> Makefile, so it provides a fallback for disassembling JIT-ed programs if
>> libbfd is installed but LLVM is not. The other motivation is that libbfd
>> supports nfp instruction for Netronome's SmartNICs and can be used to
>> disassemble offloaded programs, something that LLVM cannot do. If
>> libbfd's interface breaks again in the future, we might reconsider
>> keeping support for it.
>>
>> [0] 
>> https://packages.debian.org/buster/binutils-dev
>> Signed-off-by: Quentin Monnet <quentin@isovalent.com>
>> Tested-by: Niklas Söderlund <niklas.soderlund@corigine.com>
> 
> Thanks,
> Daniel
Quentin Monnet Sept. 23, 2022, 11:23 a.m. UTC | #4
Hi Yonghong,

Tue Sep 20 2022 05:08:04 GMT+0100 (British Summer Time) ~ Yonghong Song
<yhs@fb.com>
> 
> 
> On 9/16/22 2:09 PM, Daniel Borkmann wrote:
>> On 9/11/22 10:14 PM, Quentin Monnet wrote:
>>> To disassemble instructions for JIT-ed programs, bpftool has relied on
>>> the libbfd library. This has been problematic in the past: libbfd's
>>> interface is not meant to be stable and has changed several times. For
>>> building bpftool, we have to detect how the libbfd version on the system
>>> behaves, which is why we have to handle features disassembler-four-args
>>> and disassembler-init-styled in the Makefile. When it comes to shipping
>>> bpftool, this has also caused issues with several distribution
>>> maintainers unwilling to support the feature (see for example Debian's
>>> page for binutils-dev, which ships libbfd: "Note that building Debian
>>> packages which depend on the shared libbfd is Not Allowed." [0]).
>>>
>>> For these reasons, we add support for LLVM as an alternative to libbfd
>>> for disassembling instructions of JIT-ed programs. Thanks to the
>>> preparation work in the previous commits, it's easy to add the library
>>> by passing the relevant compilation options in the Makefile, and by
>>> adding the functions for setting up the LLVM disassembler in file
>>> jit_disasm.c.
>>
>> Could you add more context around the LLVM lib? The motivation is that
>> libbfd's
>> interface is not meant to be stable and has changed several times. How
>> does this
>> look on the LLVM's library side? Also, for the 2nd part, what is
>> Debian's stance
>> related to the LLVM lib? Would be good if both is explained in the
>> commit message.
>> Right now it mainly reads 'that libbfd has all these issues, so we're
>> moving to
>> something else', so would be good to provide more context to the ready
>> why the
>> 'something else' is better than current one.
> 
> It will be good to mention that e.g., llvm development package
> (e.g., llvm-devel for fedora) is needed for bpftool build with llvm.

Right. I didn't mention it because I noticed that on my distro, llvm-dev
came as a dependency for llvm (so simply having llvm installed is enough
to ensure the development package is present too). But this may not be
the case everywhere (do you know for Fedora?), so I'll add it to the
commit log for the next version.

Thanks for the review!
Quentin
Quentin Monnet Sept. 23, 2022, 11:23 a.m. UTC | #5
Fri Sep 16 2022 22:09:54 GMT+0100 (British Summer Time) ~ Daniel
Borkmann <daniel@iogearbox.net>
> On 9/11/22 10:14 PM, Quentin Monnet wrote:
>> To disassemble instructions for JIT-ed programs, bpftool has relied on
>> the libbfd library. This has been problematic in the past: libbfd's
>> interface is not meant to be stable and has changed several times. For
>> building bpftool, we have to detect how the libbfd version on the system
>> behaves, which is why we have to handle features disassembler-four-args
>> and disassembler-init-styled in the Makefile. When it comes to shipping
>> bpftool, this has also caused issues with several distribution
>> maintainers unwilling to support the feature (see for example Debian's
>> page for binutils-dev, which ships libbfd: "Note that building Debian
>> packages which depend on the shared libbfd is Not Allowed." [0]).
>>
>> For these reasons, we add support for LLVM as an alternative to libbfd
>> for disassembling instructions of JIT-ed programs. Thanks to the
>> preparation work in the previous commits, it's easy to add the library
>> by passing the relevant compilation options in the Makefile, and by
>> adding the functions for setting up the LLVM disassembler in file
>> jit_disasm.c.
> 
> Could you add more context around the LLVM lib? The motivation is that
> libbfd's
> interface is not meant to be stable and has changed several times. How
> does this
> look on the LLVM's library side? Also, for the 2nd part, what is
> Debian's stance
> related to the LLVM lib? Would be good if both is explained in the
> commit message.
> Right now it mainly reads 'that libbfd has all these issues, so we're
> moving to
> something else', so would be good to provide more context to the ready
> why the
> 'something else' is better than current one.
Hi Daniel,

This was based on two things. First, there is a note in LLVM's Developer
Policy [0] stating that the stability for the C API is “best effort” and
not guaranteed, but at least there is some effort to keep compatibility
when possible (which hasn't really been the case for libbfd so far). I
am under the impression that there is little intent for libbfd to be
used outside of gdb/binutils. Second: the relevant .deb page does not
caution against linking to the lib, as binutils-dev page does.

I can add this info to the commit log for the next version.

[0] https://llvm.org/docs/DeveloperPolicy.html#c-api-changes
diff mbox series

Patch

diff --git a/tools/bpf/bpftool/Makefile b/tools/bpf/bpftool/Makefile
index 1c81f4d514bb..787b857d3fb5 100644
--- a/tools/bpf/bpftool/Makefile
+++ b/tools/bpf/bpftool/Makefile
@@ -95,6 +95,7 @@  RM ?= rm -f
 FEATURE_USER = .bpftool
 
 FEATURE_TESTS := clang-bpf-co-re
+FEATURE_TESTS += llvm
 FEATURE_TESTS += libcap
 FEATURE_TESTS += libbfd
 FEATURE_TESTS += libbfd-liberty
@@ -103,6 +104,7 @@  FEATURE_TESTS += disassembler-four-args
 FEATURE_TESTS += disassembler-init-styled
 
 FEATURE_DISPLAY := clang-bpf-co-re
+FEATURE_DISPLAY += llvm
 FEATURE_DISPLAY += libcap
 FEATURE_DISPLAY += libbfd
 FEATURE_DISPLAY += libbfd-liberty
@@ -137,27 +139,37 @@  all: $(OUTPUT)bpftool
 
 SRCS := $(wildcard *.c)
 
-ifeq ($(feature-libbfd),1)
-  LIBS += -lbfd -ldl -lopcodes
-else ifeq ($(feature-libbfd-liberty),1)
-  LIBS += -lbfd -ldl -lopcodes -liberty
-else ifeq ($(feature-libbfd-liberty-z),1)
-  LIBS += -lbfd -ldl -lopcodes -liberty -lz
-endif
+ifeq ($(feature-llvm),1)
+  # If LLVM is available, use it for JIT disassembly
+  CFLAGS  += -DHAVE_LLVM_SUPPORT
+  LLVM_CONFIG_LIB_COMPONENTS := mcdisassembler all-targets
+  CFLAGS  += $(shell $(LLVM_CONFIG) --cflags --libs $(LLVM_CONFIG_LIB_COMPONENTS))
+  LIBS    += $(shell $(LLVM_CONFIG) --libs $(LLVM_CONFIG_LIB_COMPONENTS))
+  LDFLAGS += $(shell $(LLVM_CONFIG) --ldflags)
+else
+  # Fall back on libbfd
+  ifeq ($(feature-libbfd),1)
+    LIBS += -lbfd -ldl -lopcodes
+  else ifeq ($(feature-libbfd-liberty),1)
+    LIBS += -lbfd -ldl -lopcodes -liberty
+  else ifeq ($(feature-libbfd-liberty-z),1)
+    LIBS += -lbfd -ldl -lopcodes -liberty -lz
+  endif
 
-# If one of the above feature combinations is set, we support libbfd
-ifneq ($(filter -lbfd,$(LIBS)),)
-  CFLAGS += -DHAVE_LIBBFD_SUPPORT
+  # If one of the above feature combinations is set, we support libbfd
+  ifneq ($(filter -lbfd,$(LIBS)),)
+    CFLAGS += -DHAVE_LIBBFD_SUPPORT
 
-  # Libbfd interface changed over time, figure out what we need
-  ifeq ($(feature-disassembler-four-args), 1)
-    CFLAGS += -DDISASM_FOUR_ARGS_SIGNATURE
-  endif
-  ifeq ($(feature-disassembler-init-styled), 1)
-    CFLAGS += -DDISASM_INIT_STYLED
+    # Libbfd interface changed over time, figure out what we need
+    ifeq ($(feature-disassembler-four-args), 1)
+      CFLAGS += -DDISASM_FOUR_ARGS_SIGNATURE
+    endif
+    ifeq ($(feature-disassembler-init-styled), 1)
+      CFLAGS += -DDISASM_INIT_STYLED
+    endif
   endif
 endif
-ifeq ($(filter -DHAVE_LIBBFD_SUPPORT,$(CFLAGS)),)
+ifeq ($(filter -DHAVE_LLVM_SUPPORT -DHAVE_LIBBFD_SUPPORT,$(CFLAGS)),)
   # No support for JIT disassembly
   SRCS := $(filter-out jit_disasm.c,$(SRCS))
 endif
diff --git a/tools/bpf/bpftool/jit_disasm.c b/tools/bpf/bpftool/jit_disasm.c
index e31ad3950fd6..c28b21f90cb9 100644
--- a/tools/bpf/bpftool/jit_disasm.c
+++ b/tools/bpf/bpftool/jit_disasm.c
@@ -20,18 +20,123 @@ 
 #include <stdlib.h>
 #include <unistd.h>
 #include <string.h>
-#include <bfd.h>
-#include <dis-asm.h>
 #include <sys/stat.h>
 #include <limits.h>
 #include <bpf/libbpf.h>
+
+#ifdef HAVE_LLVM_SUPPORT
+#include <llvm-c/Core.h>
+#include <llvm-c/Disassembler.h>
+#include <llvm-c/Target.h>
+#include <llvm-c/TargetMachine.h>
+#endif
+
+#ifdef HAVE_LIBBFD_SUPPORT
+#include <bfd.h>
+#include <dis-asm.h>
 #include <tools/dis-asm-compat.h>
+#endif
 
 #include "json_writer.h"
 #include "main.h"
 
 static int oper_count;
 
+#ifdef HAVE_LLVM_SUPPORT
+#define DISASM_SPACER
+
+typedef LLVMDisasmContextRef disasm_ctx_t;
+
+static int printf_json(char *s)
+{
+	s = strtok(s, " \t");
+	jsonw_string_field(json_wtr, "operation", s);
+
+	jsonw_name(json_wtr, "operands");
+	jsonw_start_array(json_wtr);
+	oper_count = 1;
+
+	while ((s = strtok(NULL, " \t,()")) != 0) {
+		jsonw_string(json_wtr, s);
+		oper_count++;
+	}
+	return 0;
+}
+
+/* This callback to set the ref_type is necessary to have the LLVM disassembler
+ * print PC-relative addresses instead of byte offsets for branch instruction
+ * targets.
+ */
+static const char *
+symbol_lookup_callback(__maybe_unused void *disasm_info,
+		       __maybe_unused uint64_t ref_value,
+		       uint64_t *ref_type, __maybe_unused uint64_t ref_PC,
+		       __maybe_unused const char **ref_name)
+{
+	*ref_type = LLVMDisassembler_ReferenceType_InOut_None;
+	return NULL;
+}
+
+static int
+init_context(disasm_ctx_t *ctx, const char *arch,
+	     __maybe_unused const char *disassembler_options,
+	     __maybe_unused unsigned char *image, __maybe_unused ssize_t len)
+{
+	char *triple;
+
+	if (arch) {
+		p_err("Architecture %s not supported", arch);
+		return -1;
+	}
+
+	triple = LLVMGetDefaultTargetTriple();
+	if (!triple) {
+		p_err("Failed to retrieve triple");
+		return -1;
+	}
+	*ctx = LLVMCreateDisasm(triple, NULL, 0, NULL, symbol_lookup_callback);
+	LLVMDisposeMessage(triple);
+
+	if (!*ctx) {
+		p_err("Failed to create disassembler");
+		return -1;
+	}
+
+	return 0;
+}
+
+static void destroy_context(disasm_ctx_t *ctx)
+{
+	LLVMDisposeMessage(*ctx);
+}
+
+static int
+disassemble_insn(disasm_ctx_t *ctx, unsigned char *image, ssize_t len, int pc)
+{
+	char buf[256];
+	int count;
+
+	count = LLVMDisasmInstruction(*ctx, image + pc, len - pc, pc,
+				      buf, sizeof(buf));
+	if (json_output)
+		printf_json(buf);
+	else
+		printf("%s", buf);
+
+	return count;
+}
+
+int disasm_init(void)
+{
+	LLVMInitializeNativeTarget();
+	LLVMInitializeNativeDisassembler();
+	return 0;
+}
+#endif /* HAVE_LLVM_SUPPORT */
+
+#ifdef HAVE_LIBBFD_SUPPORT
+#define DISASM_SPACER "\t"
+
 typedef struct {
 	struct disassemble_info *info;
 	disassembler_ftype disassemble;
@@ -210,6 +315,7 @@  int disasm_init(void)
 	bfd_init();
 	return 0;
 }
+#endif /* HAVE_LIBBPFD_SUPPORT */
 
 int disasm_print_insn(unsigned char *image, ssize_t len, int opcodes,
 		      const char *arch, const char *disassembler_options,
@@ -252,7 +358,7 @@  int disasm_print_insn(unsigned char *image, ssize_t len, int opcodes,
 			if (linfo)
 				btf_dump_linfo_plain(btf, linfo, "; ",
 						     linum);
-			printf("%4x:\t", pc);
+			printf("%4x:" DISASM_SPACER, pc);
 		}
 
 		count = disassemble_insn(&ctx, image, len, pc);
diff --git a/tools/bpf/bpftool/main.h b/tools/bpf/bpftool/main.h
index c9e171082cf6..9a149c67aa5d 100644
--- a/tools/bpf/bpftool/main.h
+++ b/tools/bpf/bpftool/main.h
@@ -172,7 +172,7 @@  int map_parse_fds(int *argc, char ***argv, int **fds);
 int map_parse_fd_and_info(int *argc, char ***argv, void *info, __u32 *info_len);
 
 struct bpf_prog_linfo;
-#ifdef HAVE_LIBBFD_SUPPORT
+#if defined(HAVE_LLVM_SUPPORT) || defined(HAVE_LIBBFD_SUPPORT)
 int disasm_print_insn(unsigned char *image, ssize_t len, int opcodes,
 		      const char *arch, const char *disassembler_options,
 		      const struct btf *btf,
@@ -193,7 +193,7 @@  int disasm_print_insn(unsigned char *image, ssize_t len, int opcodes,
 }
 static inline int disasm_init(void)
 {
-	p_err("No libbfd support");
+	p_err("No JIT disassembly support");
 	return -1;
 }
 #endif