mirror of
https://sourceware.org/git/binutils-gdb.git
synced 2025-01-24 12:35:55 +08:00
496 lines
20 KiB
C
496 lines
20 KiB
C
/* Interface between the opcode library and its callers.
|
||
|
||
Copyright (C) 1999-2023 Free Software Foundation, Inc.
|
||
|
||
This program is free software; you can redistribute it and/or modify
|
||
it under the terms of the GNU General Public License as published by
|
||
the Free Software Foundation; either version 3, or (at your option)
|
||
any later version.
|
||
|
||
This program is distributed in the hope that it will be useful,
|
||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
GNU General Public License for more details.
|
||
|
||
You should have received a copy of the GNU General Public License
|
||
along with this program; if not, write to the Free Software
|
||
Foundation, Inc., 51 Franklin Street - Fifth Floor,
|
||
Boston, MA 02110-1301, USA.
|
||
|
||
Written by Cygnus Support, 1993.
|
||
|
||
The opcode library (libopcodes.a) provides instruction decoders for
|
||
a large variety of instruction sets, callable with an identical
|
||
interface, for making instruction-processing programs more independent
|
||
of the instruction set being processed. */
|
||
|
||
#ifndef DIS_ASM_H
|
||
#define DIS_ASM_H
|
||
|
||
#ifdef __cplusplus
|
||
extern "C" {
|
||
#endif
|
||
|
||
#include <stdio.h>
|
||
#include <string.h>
|
||
#include "bfd.h"
|
||
|
||
enum dis_insn_type
|
||
{
|
||
dis_noninsn, /* Not a valid instruction. */
|
||
dis_nonbranch, /* Not a branch instruction. */
|
||
dis_branch, /* Unconditional branch. */
|
||
dis_condbranch, /* Conditional branch. */
|
||
dis_jsr, /* Jump to subroutine. */
|
||
dis_condjsr, /* Conditional jump to subroutine. */
|
||
dis_dref, /* Data reference instruction. */
|
||
dis_dref2 /* Two data references in instruction. */
|
||
};
|
||
|
||
/* When printing styled disassembler output, this describes what style
|
||
should be used. */
|
||
|
||
enum disassembler_style
|
||
{
|
||
/* This is the default style, use this for any additional syntax
|
||
(e.g. commas between operands, brackets, etc), or just as a default if
|
||
no other style seems appropriate. */
|
||
dis_style_text,
|
||
|
||
/* Use this for all instruction mnemonics, or aliases for mnemonics.
|
||
These should be things that correspond to real machine
|
||
instructions. */
|
||
dis_style_mnemonic,
|
||
|
||
/* Some architectures include additional mnemonic like fields within the
|
||
instruction operands, e.g. on aarch64 'add w16, w7, w1, lsl #2' where
|
||
the 'lsl' is an additional piece of text that describes how the
|
||
instruction should behave. This sub-mnemonic style can be used for
|
||
these pieces of text. */
|
||
dis_style_sub_mnemonic,
|
||
|
||
/* For things that aren't real machine instructions, but rather
|
||
assembler directives, e.g. .byte, etc. */
|
||
dis_style_assembler_directive,
|
||
|
||
/* Use this for any register names. This may or may-not include any
|
||
register prefix, e.g. '$', '%', at the discretion of the target,
|
||
though within each target the choice to include prefixes for not
|
||
should be kept consistent. If the prefix is not printed with this
|
||
style, then dis_style_text should be used. */
|
||
dis_style_register,
|
||
|
||
/* Use this for any constant values used within instructions or
|
||
directives, unless the value is an absolute address, or an offset
|
||
that will be added to an address (no matter where the address comes
|
||
from) before use. This style may, or may-not be used for any
|
||
prefix to the immediate value, e.g. '$', at the discretion of the
|
||
target, though within each target the choice to include these
|
||
prefixes should be kept consistent. */
|
||
dis_style_immediate,
|
||
|
||
/* The style for the numerical representation of an absolute address.
|
||
Anything that is an address offset should use the immediate style.
|
||
This style may, or may-not be used for any prefix to the immediate
|
||
value, e.g. '$', at the discretion of the target, though within
|
||
each target the choice to include these prefixes should be kept
|
||
consistent. */
|
||
dis_style_address,
|
||
|
||
/* The style for any constant value within an instruction or directive
|
||
that represents an offset that will be added to an address before
|
||
use. This style may, or may-not be used for any prefix to the
|
||
immediate value, e.g. '$', at the discretion of the target, though
|
||
within each target the choice to include these prefixes should be
|
||
kept consistent. */
|
||
dis_style_address_offset,
|
||
|
||
/* The style for a symbol's name. The numerical address of a symbol
|
||
should use the address style above, this style is reserved for the
|
||
name. */
|
||
dis_style_symbol,
|
||
|
||
/* The start of a comment that runs to the end of the line. Anything
|
||
printed after a comment start might be styled differently,
|
||
e.g. everything might be styled as a comment, regardless of the
|
||
actual style used. The disassembler itself should not try to adjust
|
||
the style emitted for comment content, e.g. an address emitted within
|
||
a comment should still be given dis_style_address, in this way it is
|
||
up to the user of the disassembler to decide how comments should be
|
||
styled. */
|
||
dis_style_comment_start
|
||
};
|
||
|
||
typedef int (*fprintf_ftype) (void *, const char*, ...) ATTRIBUTE_FPTR_PRINTF_2;
|
||
typedef int (*fprintf_styled_ftype) (void *, enum disassembler_style, const char*, ...) ATTRIBUTE_FPTR_PRINTF_3;
|
||
|
||
/* This struct is passed into the instruction decoding routine,
|
||
and is passed back out into each callback. The various fields are used
|
||
for conveying information from your main routine into your callbacks,
|
||
for passing information into the instruction decoders (such as the
|
||
addresses of the callback functions), or for passing information
|
||
back from the instruction decoders to their callers.
|
||
|
||
It must be initialized before it is first passed; this can be done
|
||
by hand, or using one of the initialization macros below. */
|
||
|
||
typedef struct disassemble_info
|
||
{
|
||
fprintf_ftype fprintf_func;
|
||
fprintf_styled_ftype fprintf_styled_func;
|
||
void *stream;
|
||
void *application_data;
|
||
|
||
/* Target description. We could replace this with a pointer to the bfd,
|
||
but that would require one. There currently isn't any such requirement
|
||
so to avoid introducing one we record these explicitly. */
|
||
/* The bfd_flavour. This can be bfd_target_unknown_flavour. */
|
||
enum bfd_flavour flavour;
|
||
/* The bfd_arch value. */
|
||
enum bfd_architecture arch;
|
||
/* The bfd_mach value. */
|
||
unsigned long mach;
|
||
/* Endianness (for bi-endian cpus). Mono-endian cpus can ignore this. */
|
||
enum bfd_endian endian;
|
||
/* Endianness of code, for mixed-endian situations such as ARM BE8. */
|
||
enum bfd_endian endian_code;
|
||
|
||
/* Some targets need information about the current section to accurately
|
||
display insns. If this is NULL, the target disassembler function
|
||
will have to make its best guess. */
|
||
asection *section;
|
||
|
||
/* An array of pointers to symbols either at the location being disassembled
|
||
or at the start of the function being disassembled. The array is sorted
|
||
so that the first symbol is intended to be the one used. The others are
|
||
present for any misc. purposes. This is not set reliably, but if it is
|
||
not NULL, it is correct. */
|
||
asymbol **symbols;
|
||
/* Number of symbols in array. */
|
||
int num_symbols;
|
||
|
||
/* Symbol table provided for targets that want to look at it. This is
|
||
used on Arm to find mapping symbols and determine Arm/Thumb code. */
|
||
asymbol **symtab;
|
||
int symtab_pos;
|
||
int symtab_size;
|
||
|
||
/* For use by the disassembler.
|
||
The top 16 bits are reserved for public use (and are documented here).
|
||
The bottom 16 bits are for the internal use of the disassembler. */
|
||
unsigned long flags;
|
||
/* Set if the disassembler has determined that there are one or more
|
||
relocations associated with the instruction being disassembled. */
|
||
#define INSN_HAS_RELOC (1u << 31)
|
||
/* Set if the user has requested the disassembly of data as well as code. */
|
||
#define DISASSEMBLE_DATA (1u << 30)
|
||
/* Set if the user has specifically set the machine type encoded in the
|
||
mach field of this structure. */
|
||
#define USER_SPECIFIED_MACHINE_TYPE (1u << 29)
|
||
/* Set if the user has requested wide output. */
|
||
#define WIDE_OUTPUT (1u << 28)
|
||
|
||
/* Dynamic relocations, if they have been loaded. */
|
||
arelent **dynrelbuf;
|
||
long dynrelcount;
|
||
|
||
/* Use internally by the target specific disassembly code. */
|
||
void *private_data;
|
||
|
||
/* Function used to get bytes to disassemble. MEMADDR is the
|
||
address of the stuff to be disassembled, MYADDR is the address to
|
||
put the bytes in, and LENGTH is the number of bytes to read.
|
||
INFO is a pointer to this struct.
|
||
Returns an errno value or 0 for success. */
|
||
int (*read_memory_func)
|
||
(bfd_vma memaddr, bfd_byte *myaddr, unsigned int length,
|
||
struct disassemble_info *dinfo);
|
||
|
||
/* Function which should be called if we get an error that we can't
|
||
recover from. STATUS is the errno value from read_memory_func and
|
||
MEMADDR is the address that we were trying to read. INFO is a
|
||
pointer to this struct. */
|
||
void (*memory_error_func)
|
||
(int status, bfd_vma memaddr, struct disassemble_info *dinfo);
|
||
|
||
/* Function called to print ADDR. */
|
||
void (*print_address_func)
|
||
(bfd_vma addr, struct disassemble_info *dinfo);
|
||
|
||
/* Function called to determine if there is a symbol at the given ADDR.
|
||
If there is, the function returns 1, otherwise it returns 0.
|
||
This is used by ports which support an overlay manager where
|
||
the overlay number is held in the top part of an address. In
|
||
some circumstances we want to include the overlay number in the
|
||
address, (normally because there is a symbol associated with
|
||
that address), but sometimes we want to mask out the overlay bits. */
|
||
asymbol * (*symbol_at_address_func)
|
||
(bfd_vma addr, struct disassemble_info *dinfo);
|
||
|
||
/* Function called to check if a SYMBOL is can be displayed to the user.
|
||
This is used by some ports that want to hide special symbols when
|
||
displaying debugging outout. */
|
||
bool (*symbol_is_valid)
|
||
(asymbol *, struct disassemble_info *dinfo);
|
||
|
||
/* These are for buffer_read_memory. */
|
||
bfd_byte *buffer;
|
||
bfd_vma buffer_vma;
|
||
size_t buffer_length;
|
||
|
||
/* This variable may be set by the instruction decoder. It suggests
|
||
the number of bytes objdump should display on a single line. If
|
||
the instruction decoder sets this, it should always set it to
|
||
the same value in order to get reasonable looking output. */
|
||
int bytes_per_line;
|
||
|
||
/* The next two variables control the way objdump displays the raw data. */
|
||
/* For example, if bytes_per_line is 8 and bytes_per_chunk is 4, the */
|
||
/* output will look like this:
|
||
00: 00000000 00000000
|
||
with the chunks displayed according to "display_endian". */
|
||
int bytes_per_chunk;
|
||
enum bfd_endian display_endian;
|
||
|
||
/* Number of octets per incremented target address
|
||
Normally one, but some DSPs have byte sizes of 16 or 32 bits. */
|
||
unsigned int octets_per_byte;
|
||
|
||
/* The number of zeroes we want to see at the end of a section before we
|
||
start skipping them. */
|
||
unsigned int skip_zeroes;
|
||
|
||
/* The number of zeroes to skip at the end of a section. If the number
|
||
of zeroes at the end is between SKIP_ZEROES_AT_END and SKIP_ZEROES,
|
||
they will be disassembled. If there are fewer than
|
||
SKIP_ZEROES_AT_END, they will be skipped. This is a heuristic
|
||
attempt to avoid disassembling zeroes inserted by section
|
||
alignment. */
|
||
unsigned int skip_zeroes_at_end;
|
||
|
||
/* Whether the disassembler always needs the relocations. */
|
||
bool disassembler_needs_relocs;
|
||
|
||
/* Results from instruction decoders. Not all decoders yet support
|
||
this information. This info is set each time an instruction is
|
||
decoded, and is only valid for the last such instruction.
|
||
|
||
To determine whether this decoder supports this information, set
|
||
insn_info_valid to 0, decode an instruction, then check it. */
|
||
|
||
char insn_info_valid; /* Branch info has been set. */
|
||
char branch_delay_insns; /* How many sequential insn's will run before
|
||
a branch takes effect. (0 = normal) */
|
||
char data_size; /* Size of data reference in insn, in bytes */
|
||
enum dis_insn_type insn_type; /* Type of instruction */
|
||
bfd_vma target; /* Target address of branch or dref, if known;
|
||
zero if unknown. */
|
||
bfd_vma target2; /* Second target address for dref2 */
|
||
|
||
/* Command line options specific to the target disassembler. */
|
||
const char *disassembler_options;
|
||
|
||
/* If non-zero then try not disassemble beyond this address, even if
|
||
there are values left in the buffer. This address is the address
|
||
of the nearest symbol forwards from the start of the disassembly,
|
||
and it is assumed that it lies on the boundary between instructions.
|
||
If an instruction spans this address then this is an error in the
|
||
file being disassembled. */
|
||
bfd_vma stop_vma;
|
||
|
||
/* The end range of the current range being disassembled. This is required
|
||
in order to notify the disassembler when it's currently handling a
|
||
different range than it was before. This prevent unsafe optimizations when
|
||
disassembling such as the way mapping symbols are found on AArch64. */
|
||
bfd_vma stop_offset;
|
||
|
||
/* Set to true if the disassembler applied styling to the output,
|
||
otherwise, set to false. */
|
||
bool created_styled_output;
|
||
} disassemble_info;
|
||
|
||
/* This struct is used to pass information about valid disassembler
|
||
option arguments from the target to the generic GDB functions
|
||
that set and display them. */
|
||
|
||
typedef struct
|
||
{
|
||
/* Option argument name to use in descriptions. */
|
||
const char *name;
|
||
|
||
/* Vector of acceptable option argument values, NULL-terminated.
|
||
NULL if any values are accepted. */
|
||
const char **values;
|
||
} disasm_option_arg_t;
|
||
|
||
/* This struct is used to pass information about valid disassembler
|
||
options, their descriptions and arguments from the target to the
|
||
generic GDB functions that set and display them. Options are
|
||
defined by tuples of vector entries at each index. */
|
||
|
||
typedef struct
|
||
{
|
||
/* Vector of option names, NULL-terminated. */
|
||
const char **name;
|
||
|
||
/* Vector of option descriptions or NULL if none to be shown. */
|
||
const char **description;
|
||
|
||
/* Vector of option argument information pointers or NULL if no
|
||
option accepts an argument. NULL entries denote individual
|
||
options that accept no argument. */
|
||
const disasm_option_arg_t **arg;
|
||
} disasm_options_t;
|
||
|
||
/* This struct is used to pass information about valid disassembler
|
||
options and arguments from the target to the generic GDB functions
|
||
that set and display them. */
|
||
|
||
typedef struct
|
||
{
|
||
/* Valid disassembler options. Individual options that support
|
||
an argument will refer to entries in the ARGS vector. */
|
||
disasm_options_t options;
|
||
|
||
/* Vector of acceptable option arguments, NULL-terminated. This
|
||
collects all possible option argument choices, some of which
|
||
may be shared by different options from the OPTIONS member. */
|
||
disasm_option_arg_t *args;
|
||
} disasm_options_and_args_t;
|
||
|
||
/* Standard disassemblers. Disassemble one instruction at the given
|
||
target address. Return number of octets processed. */
|
||
typedef int (*disassembler_ftype) (bfd_vma, disassemble_info *);
|
||
|
||
/* Disassemblers used out side of opcodes library. */
|
||
extern int print_insn_m32c (bfd_vma, disassemble_info *);
|
||
extern int print_insn_mep (bfd_vma, disassemble_info *);
|
||
extern int print_insn_s12z (bfd_vma, disassemble_info *);
|
||
extern int print_insn_sh (bfd_vma, disassemble_info *);
|
||
extern int print_insn_sparc (bfd_vma, disassemble_info *);
|
||
extern int print_insn_rx (bfd_vma, disassemble_info *);
|
||
extern int print_insn_rl78 (bfd_vma, disassemble_info *);
|
||
extern int print_insn_rl78_g10 (bfd_vma, disassemble_info *);
|
||
extern int print_insn_rl78_g13 (bfd_vma, disassemble_info *);
|
||
extern int print_insn_rl78_g14 (bfd_vma, disassemble_info *);
|
||
|
||
extern disassembler_ftype arc_get_disassembler (bfd *);
|
||
extern disassembler_ftype cris_get_disassembler (bfd *);
|
||
|
||
extern void print_aarch64_disassembler_options (FILE *);
|
||
extern void print_i386_disassembler_options (FILE *);
|
||
extern void print_mips_disassembler_options (FILE *);
|
||
extern void print_nfp_disassembler_options (FILE *);
|
||
extern void print_ppc_disassembler_options (FILE *);
|
||
extern void print_riscv_disassembler_options (FILE *);
|
||
extern void print_arm_disassembler_options (FILE *);
|
||
extern void print_arc_disassembler_options (FILE *);
|
||
extern void print_kvx_disassembler_options(FILE *);
|
||
extern void print_s390_disassembler_options (FILE *);
|
||
extern void print_wasm32_disassembler_options (FILE *);
|
||
extern void print_loongarch_disassembler_options (FILE *);
|
||
extern void print_bpf_disassembler_options (FILE *);
|
||
extern bool aarch64_symbol_is_valid (asymbol *, struct disassemble_info *);
|
||
extern bool arm_symbol_is_valid (asymbol *, struct disassemble_info *);
|
||
extern bool csky_symbol_is_valid (asymbol *, struct disassemble_info *);
|
||
extern bool riscv_symbol_is_valid (asymbol *, struct disassemble_info *);
|
||
extern void disassemble_init_powerpc (struct disassemble_info *);
|
||
extern void disassemble_init_s390 (struct disassemble_info *);
|
||
extern void disassemble_init_wasm32 (struct disassemble_info *);
|
||
extern void disassemble_init_nds32 (struct disassemble_info *);
|
||
extern const disasm_options_and_args_t *disassembler_options_arc (void);
|
||
extern const disasm_options_and_args_t *disassembler_options_arm (void);
|
||
extern const disasm_options_and_args_t *disassembler_options_mips (void);
|
||
extern const disasm_options_and_args_t *disassembler_options_powerpc (void);
|
||
extern const disasm_options_and_args_t *disassembler_options_riscv (void);
|
||
extern const disasm_options_and_args_t *disassembler_options_s390 (void);
|
||
|
||
/* Fetch the disassembler for a given architecture ARC, endianess (big
|
||
endian if BIG is true), bfd_mach value MACH, and ABFD, if that support
|
||
is available. ABFD may be NULL. */
|
||
extern disassembler_ftype disassembler (enum bfd_architecture arc,
|
||
bool big, unsigned long mach,
|
||
bfd *abfd);
|
||
|
||
/* Amend the disassemble_info structure as necessary for the target architecture.
|
||
Should only be called after initialising the info->arch field. */
|
||
extern void disassemble_init_for_target (struct disassemble_info *);
|
||
|
||
/* Tidy any memory allocated by targets, such as info->private_data. */
|
||
extern void disassemble_free_target (struct disassemble_info *);
|
||
|
||
/* Set the basic disassembler print functions. */
|
||
extern void disassemble_set_printf (struct disassemble_info *, void *,
|
||
fprintf_ftype, fprintf_styled_ftype);
|
||
|
||
/* Document any target specific options available from the disassembler. */
|
||
extern void disassembler_usage (FILE *);
|
||
|
||
/* Remove whitespace and consecutive commas. */
|
||
extern char *remove_whitespace_and_extra_commas (char *);
|
||
|
||
/* Like STRCMP, but treat ',' the same as '\0' so that we match
|
||
strings like "foobar" against "foobar,xxyyzz,...". */
|
||
extern int disassembler_options_cmp (const char *, const char *);
|
||
|
||
/* A helper function for FOR_EACH_DISASSEMBLER_OPTION. */
|
||
static inline const char *
|
||
next_disassembler_option (const char *options)
|
||
{
|
||
const char *opt = strchr (options, ',');
|
||
if (opt != NULL)
|
||
opt++;
|
||
return opt;
|
||
}
|
||
|
||
/* A macro for iterating over each comma separated option in OPTIONS. */
|
||
#define FOR_EACH_DISASSEMBLER_OPTION(OPT, OPTIONS) \
|
||
for ((OPT) = (OPTIONS); \
|
||
(OPT) != NULL; \
|
||
(OPT) = next_disassembler_option (OPT))
|
||
|
||
|
||
/* This block of definitions is for particular callers who read instructions
|
||
into a buffer before calling the instruction decoder. */
|
||
|
||
/* Here is a function which callers may wish to use for read_memory_func.
|
||
It gets bytes from a buffer. */
|
||
extern int buffer_read_memory
|
||
(bfd_vma, bfd_byte *, unsigned int, struct disassemble_info *);
|
||
|
||
/* This function goes with buffer_read_memory.
|
||
It prints a message using info->fprintf_func and info->stream. */
|
||
extern void perror_memory (int, bfd_vma, struct disassemble_info *);
|
||
|
||
|
||
/* Just print the address in hex. This is included for completeness even
|
||
though both GDB and objdump provide their own (to print symbolic
|
||
addresses). */
|
||
extern void generic_print_address
|
||
(bfd_vma, struct disassemble_info *);
|
||
|
||
/* Always NULL. */
|
||
extern asymbol *generic_symbol_at_address
|
||
(bfd_vma, struct disassemble_info *);
|
||
|
||
/* Always true. */
|
||
extern bool generic_symbol_is_valid
|
||
(asymbol *, struct disassemble_info *);
|
||
|
||
/* Method to initialize a disassemble_info struct. This should be
|
||
called by all applications creating such a struct. */
|
||
extern void init_disassemble_info (struct disassemble_info *dinfo, void *stream,
|
||
fprintf_ftype fprintf_func,
|
||
fprintf_styled_ftype fprintf_styled_func);
|
||
|
||
/* For compatibility with existing code. */
|
||
#define INIT_DISASSEMBLE_INFO(INFO, STREAM, FPRINTF_FUNC, FPRINTF_STYLED_FUNC) \
|
||
init_disassemble_info (&(INFO), (STREAM), (fprintf_ftype) (FPRINTF_FUNC), \
|
||
(fprintf_styled_ftype) (FPRINTF_STYLED_FUNC))
|
||
|
||
#ifdef __cplusplus
|
||
}
|
||
#endif
|
||
|
||
#endif /* ! defined (DIS_ASM_H) */
|