Commit | Line | Data |
---|---|---|
252b5132 | 1 | /* Interface between the opcode library and its callers. |
4f1d9bd8 | 2 | |
82704155 | 3 | Copyright (C) 1999-2019 Free Software Foundation, Inc. |
d70c5fc7 | 4 | |
4f1d9bd8 NC |
5 | This program is free software; you can redistribute it and/or modify |
6 | it under the terms of the GNU General Public License as published by | |
e4e42b45 | 7 | the Free Software Foundation; either version 3, or (at your option) |
4f1d9bd8 NC |
8 | any later version. |
9 | ||
10 | This program is distributed in the hope that it will be useful, | |
11 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
13 | GNU General Public License for more details. | |
14 | ||
15 | You should have received a copy of the GNU General Public License | |
16 | along with this program; if not, write to the Free Software | |
e172dbf8 NC |
17 | Foundation, Inc., 51 Franklin Street - Fifth Floor, |
18 | Boston, MA 02110-1301, USA. | |
d70c5fc7 | 19 | |
252b5132 RH |
20 | Written by Cygnus Support, 1993. |
21 | ||
22 | The opcode library (libopcodes.a) provides instruction decoders for | |
23 | a large variety of instruction sets, callable with an identical | |
24 | interface, for making instruction-processing programs more independent | |
25 | of the instruction set being processed. */ | |
26 | ||
27 | #ifndef DIS_ASM_H | |
28 | #define DIS_ASM_H | |
29 | ||
7d7a6736 ILT |
30 | #ifdef __cplusplus |
31 | extern "C" { | |
32 | #endif | |
33 | ||
252b5132 | 34 | #include <stdio.h> |
8f0a2148 | 35 | #include <string.h> |
252b5132 RH |
36 | #include "bfd.h" |
37 | ||
d908c8af | 38 | typedef int (*fprintf_ftype) (void *, const char*, ...) ATTRIBUTE_FPTR_PRINTF_2; |
252b5132 | 39 | |
1c0d3aa6 NC |
40 | enum dis_insn_type |
41 | { | |
1316c8b3 NC |
42 | dis_noninsn, /* Not a valid instruction. */ |
43 | dis_nonbranch, /* Not a branch instruction. */ | |
44 | dis_branch, /* Unconditional branch. */ | |
45 | dis_condbranch, /* Conditional branch. */ | |
46 | dis_jsr, /* Jump to subroutine. */ | |
47 | dis_condjsr, /* Conditional jump to subroutine. */ | |
48 | dis_dref, /* Data reference instruction. */ | |
49 | dis_dref2 /* Two data references in instruction. */ | |
252b5132 RH |
50 | }; |
51 | ||
d70c5fc7 | 52 | /* This struct is passed into the instruction decoding routine, |
252b5132 RH |
53 | and is passed back out into each callback. The various fields are used |
54 | for conveying information from your main routine into your callbacks, | |
55 | for passing information into the instruction decoders (such as the | |
56 | addresses of the callback functions), or for passing information | |
57 | back from the instruction decoders to their callers. | |
58 | ||
59 | It must be initialized before it is first passed; this can be done | |
60 | by hand, or using one of the initialization macros below. */ | |
61 | ||
1c0d3aa6 NC |
62 | typedef struct disassemble_info |
63 | { | |
252b5132 | 64 | fprintf_ftype fprintf_func; |
8cf3f354 AM |
65 | void *stream; |
66 | void *application_data; | |
252b5132 RH |
67 | |
68 | /* Target description. We could replace this with a pointer to the bfd, | |
69 | but that would require one. There currently isn't any such requirement | |
70 | so to avoid introducing one we record these explicitly. */ | |
71 | /* The bfd_flavour. This can be bfd_target_unknown_flavour. */ | |
72 | enum bfd_flavour flavour; | |
73 | /* The bfd_arch value. */ | |
74 | enum bfd_architecture arch; | |
75 | /* The bfd_mach value. */ | |
76 | unsigned long mach; | |
77 | /* Endianness (for bi-endian cpus). Mono-endian cpus can ignore this. */ | |
78 | enum bfd_endian endian; | |
6a4fe770 SS |
79 | /* Endianness of code, for mixed-endian situations such as ARM BE8. */ |
80 | enum bfd_endian endian_code; | |
cadaa522 FCE |
81 | /* An arch/mach-specific bitmask of selected instruction subsets, mainly |
82 | for processors with run-time-switchable instruction sets. The default, | |
83 | zero, means that there is no constraint. CGEN-based opcodes ports | |
84 | may use ISA_foo masks. */ | |
16175d96 | 85 | void *insn_sets; |
252b5132 | 86 | |
ca6d9fb3 HPN |
87 | /* Some targets need information about the current section to accurately |
88 | display insns. If this is NULL, the target disassembler function | |
89 | will have to make its best guess. */ | |
90 | asection *section; | |
91 | ||
252b5132 RH |
92 | /* An array of pointers to symbols either at the location being disassembled |
93 | or at the start of the function being disassembled. The array is sorted | |
94 | so that the first symbol is intended to be the one used. The others are | |
95 | present for any misc. purposes. This is not set reliably, but if it is | |
96 | not NULL, it is correct. */ | |
97 | asymbol **symbols; | |
98 | /* Number of symbols in array. */ | |
99 | int num_symbols; | |
100 | ||
2087ad84 PB |
101 | /* Symbol table provided for targets that want to look at it. This is |
102 | used on Arm to find mapping symbols and determine Arm/Thumb code. */ | |
103 | asymbol **symtab; | |
104 | int symtab_pos; | |
105 | int symtab_size; | |
106 | ||
252b5132 RH |
107 | /* For use by the disassembler. |
108 | The top 16 bits are reserved for public use (and are documented here). | |
109 | The bottom 16 bits are for the internal use of the disassembler. */ | |
110 | unsigned long flags; | |
1316c8b3 NC |
/* Set if the disassembler has determined that there are one or more
   relocations associated with the instruction being disassembled.
   The constant is unsigned: shifting a signed 1 into bit 31 overflows
   a 32-bit int, and a negative result would sign-extend when combined
   with an unsigned long that is wider than 32 bits.  */
#define INSN_HAS_RELOC (1u << 31)
/* Set if the user has requested the disassembly of data as well as code.  */
#define DISASSEMBLE_DATA (1 << 30)
/* Set if the user has specifically set the machine type encoded in the
   mach field of this structure.  */
#define USER_SPECIFIED_MACHINE_TYPE (1 << 29)
/* Set if the user has requested wide output.  */
#define WIDE_OUTPUT (1 << 28)
1316c8b3 NC |
121 | |
122 | /* Used internally by the target-specific disassembly code. */ |
8cf3f354 | 123 | void *private_data; |
252b5132 RH |
124 | |
125 | /* Function used to get bytes to disassemble. MEMADDR is the | |
126 | address of the stuff to be disassembled, MYADDR is the address to | |
127 | put the bytes in, and LENGTH is the number of bytes to read. | |
128 | DINFO is a pointer to this struct. |
129 | Returns an errno value or 0 for success. */ | |
130 | int (*read_memory_func) | |
8cf3f354 | 131 | (bfd_vma memaddr, bfd_byte *myaddr, unsigned int length, |
e7f8eadb | 132 | struct disassemble_info *dinfo); |
252b5132 RH |
133 | |
134 | /* Function which should be called if we get an error that we can't | |
135 | recover from. STATUS is the errno value from read_memory_func and | |
136 | MEMADDR is the address that we were trying to read. DINFO is a |
137 | pointer to this struct. */ | |
138 | void (*memory_error_func) | |
e7f8eadb | 139 | (int status, bfd_vma memaddr, struct disassemble_info *dinfo); |
252b5132 RH |
140 | |
141 | /* Function called to print ADDR. */ | |
142 | void (*print_address_func) | |
e7f8eadb | 143 | (bfd_vma addr, struct disassemble_info *dinfo); |
252b5132 RH |
144 | |
145 | /* Function called to determine if there is a symbol at the given ADDR. | |
146 | If there is, the function returns 1, otherwise it returns 0. | |
147 | This is used by ports which support an overlay manager where | |
148 | the overlay number is held in the top part of an address. In | |
149 | some circumstances we want to include the overlay number in the | |
150 | address, (normally because there is a symbol associated with | |
151 | that address), but sometimes we want to mask out the overlay bits. */ | |
152 | int (* symbol_at_address_func) | |
e7f8eadb | 153 | (bfd_vma addr, struct disassemble_info *dinfo); |
252b5132 | 154 | |
22a398e1 NC |
155 | /* Function called to check if a SYMBOL can be displayed to the user. |
156 | This is used by some ports that want to hide special symbols when |
157 | displaying debugging output. */ |
158 | bfd_boolean (* symbol_is_valid) | |
e7f8eadb | 159 | (asymbol *, struct disassemble_info *dinfo); |
d70c5fc7 | 160 | |
252b5132 RH |
161 | /* These are for buffer_read_memory. */ |
162 | bfd_byte *buffer; | |
163 | bfd_vma buffer_vma; | |
0f6329bd | 164 | size_t buffer_length; |
252b5132 RH |
165 | |
166 | /* This variable may be set by the instruction decoder. It suggests | |
167 | the number of bytes objdump should display on a single line. If | |
168 | the instruction decoder sets this, it should always set it to | |
169 | the same value in order to get reasonable looking output. */ | |
170 | int bytes_per_line; | |
171 | ||
22a398e1 | 172 | /* The next two variables control the way objdump displays the raw data. */ |
252b5132 RH |
173 | /* For example, if bytes_per_line is 8 and bytes_per_chunk is 4, the */ |
174 | /* output will look like this: | |
175 | 00: 00000000 00000000 | |
176 | with the chunks displayed according to "display_endian". */ | |
177 | int bytes_per_chunk; | |
178 | enum bfd_endian display_endian; | |
179 | ||
d70c5fc7 | 180 | /* Number of octets per incremented target address.
3c3bdf30 | 181 | Normally one, but some DSPs have byte sizes of 16 or 32 bits. */ |
f6af82bd | 182 | unsigned int octets_per_byte; |
940b2b78 | 183 | |
0bcb06d2 AS |
184 | /* The number of zeroes we want to see at the end of a section before we |
185 | start skipping them. */ | |
186 | unsigned int skip_zeroes; | |
187 | ||
188 | /* The number of zeroes to skip at the end of a section. If the number | |
189 | of zeroes at the end is between SKIP_ZEROES_AT_END and SKIP_ZEROES, | |
190 | they will be disassembled. If there are fewer than | |
191 | SKIP_ZEROES_AT_END, they will be skipped. This is a heuristic | |
192 | attempt to avoid disassembling zeroes inserted by section | |
193 | alignment. */ | |
194 | unsigned int skip_zeroes_at_end; | |
195 | ||
d99b6465 AS |
196 | /* Whether the disassembler always needs the relocations. */ |
197 | bfd_boolean disassembler_needs_relocs; | |
198 | ||
252b5132 RH |
199 | /* Results from instruction decoders. Not all decoders yet support |
200 | this information. This info is set each time an instruction is | |
201 | decoded, and is only valid for the last such instruction. | |
202 | ||
203 | To determine whether this decoder supports this information, set | |
204 | insn_info_valid to 0, decode an instruction, then check it. */ | |
205 | ||
206 | char insn_info_valid; /* Branch info has been set. */ | |
207 | char branch_delay_insns; /* How many sequential insn's will run before | |
208 | a branch takes effect. (0 = normal) */ | |
209 | char data_size; /* Size of data reference in insn, in bytes */ | |
210 | enum dis_insn_type insn_type; /* Type of instruction */ | |
211 | bfd_vma target; /* Target address of branch or dref, if known; | |
212 | zero if unknown. */ | |
213 | bfd_vma target2; /* Second target address for dref2 */ | |
214 | ||
dd92f639 | 215 | /* Command line options specific to the target disassembler. */ |
f995bbe8 | 216 | const char *disassembler_options; |
dd92f639 | 217 | |
bdc4de1b NC |
218 | /* If non-zero then try not to disassemble beyond this address, even if |
219 | there are values left in the buffer. This address is the address | |
220 | of the nearest symbol forwards from the start of the disassembly, | |
221 | and it is assumed that it lies on the boundary between instructions. | |
222 | If an instruction spans this address then this is an error in the | |
223 | file being disassembled. */ | |
224 | bfd_vma stop_vma; | |
225 | ||
53b2f36b TC |
226 | /* The end range of the current range being disassembled. This is required |
227 | in order to notify the disassembler when it's currently handling a | |
228 | different range than it was before. This prevents unsafe optimizations when |
229 | disassembling such as the way mapping symbols are found on AArch64. */ | |
230 | bfd_vma stop_offset; | |
231 | ||
252b5132 RH |
232 | } disassemble_info; |
233 | ||
471b9d15 MR |
234 | /* This struct is used to pass information about valid disassembler |
235 | option arguments from the target to the generic GDB functions | |
236 | that set and display them. */ | |
65b48a81 PB |
237 | |
238 | typedef struct | |
239 | { | |
471b9d15 MR |
240 | /* Option argument name to use in descriptions. */ |
241 | const char *name; | |
242 | ||
243 | /* Vector of acceptable option argument values, NULL-terminated. */ | |
244 | const char **values; | |
245 | } disasm_option_arg_t; | |
246 | ||
247 | /* This struct is used to pass information about valid disassembler | |
248 | options, their descriptions and arguments from the target to the | |
249 | generic GDB functions that set and display them. Options are | |
250 | defined by tuples of vector entries at each index. */ | |
251 | ||
252 | typedef struct | |
253 | { | |
254 | /* Vector of option names, NULL-terminated. */ | |
65b48a81 | 255 | const char **name; |
471b9d15 MR |
256 | |
257 | /* Vector of option descriptions or NULL if none to be shown. */ | |
65b48a81 | 258 | const char **description; |
471b9d15 MR |
259 | |
260 | /* Vector of option argument information pointers or NULL if no | |
261 | option accepts an argument. NULL entries denote individual | |
262 | options that accept no argument. */ | |
263 | const disasm_option_arg_t **arg; | |
65b48a81 PB |
264 | } disasm_options_t; |
265 | ||
471b9d15 MR |
266 | /* This struct is used to pass information about valid disassembler |
267 | options and arguments from the target to the generic GDB functions | |
268 | that set and display them. */ | |
269 | ||
270 | typedef struct | |
271 | { | |
272 | /* Valid disassembler options. Individual options that support | |
273 | an argument will refer to entries in the ARGS vector. */ | |
274 | disasm_options_t options; | |
275 | ||
276 | /* Vector of acceptable option arguments, NULL-terminated. This | |
277 | collects all possible option argument choices, some of which | |
278 | may be shared by different options from the OPTIONS member. */ | |
279 | disasm_option_arg_t *args; | |
280 | } disasm_options_and_args_t; | |
252b5132 RH |
281 | \f |
282 | /* Standard disassemblers. Disassemble one instruction at the given | |
19222dc0 | 283 | target address. Return number of octets processed. */ |
8cf3f354 AM |
284 | typedef int (*disassembler_ftype) (bfd_vma, disassemble_info *); |
285 | ||
88c1242d | 286 | /* Disassemblers used outside of the opcodes library. */ |
88c1242d | 287 | extern int print_insn_m32c (bfd_vma, disassemble_info *); |
d6eafc3e | 288 | extern int print_insn_mep (bfd_vma, disassemble_info *); |
007d2fe4 | 289 | extern int print_insn_s12z (bfd_vma, disassemble_info *); |
8cf3f354 | 290 | extern int print_insn_sh (bfd_vma, disassemble_info *); |
1c0d3aa6 | 291 | extern int print_insn_sparc (bfd_vma, disassemble_info *); |
c7927a3c | 292 | extern int print_insn_rx (bfd_vma, disassemble_info *); |
99c513f6 | 293 | extern int print_insn_rl78 (bfd_vma, disassemble_info *); |
0952813b DD |
294 | extern int print_insn_rl78_g10 (bfd_vma, disassemble_info *); |
295 | extern int print_insn_rl78_g13 (bfd_vma, disassemble_info *); | |
296 | extern int print_insn_rl78_g14 (bfd_vma, disassemble_info *); | |
8cf3f354 | 297 | |
886a2506 | 298 | extern disassembler_ftype arc_get_disassembler (bfd *); |
8cf3f354 AM |
299 | extern disassembler_ftype cris_get_disassembler (bfd *); |
300 | ||
a06ea964 | 301 | extern void print_aarch64_disassembler_options (FILE *); |
f59a29b9 | 302 | extern void print_i386_disassembler_options (FILE *); |
8cf3f354 | 303 | extern void print_mips_disassembler_options (FILE *); |
fe944acf | 304 | extern void print_nfp_disassembler_options (FILE *); |
8cf3f354 | 305 | extern void print_ppc_disassembler_options (FILE *); |
e23eba97 | 306 | extern void print_riscv_disassembler_options (FILE *); |
8cf3f354 | 307 | extern void print_arm_disassembler_options (FILE *); |
37fd5ef3 | 308 | extern void print_arc_disassembler_options (FILE *); |
112b7c50 | 309 | extern void print_s390_disassembler_options (FILE *); |
62ecb94c | 310 | extern void print_wasm32_disassembler_options (FILE *); |
a06ea964 | 311 | extern bfd_boolean aarch64_symbol_is_valid (asymbol *, struct disassemble_info *); |
22a398e1 | 312 | extern bfd_boolean arm_symbol_is_valid (asymbol *, struct disassemble_info *); |
b8891f8d | 313 | extern bfd_boolean csky_symbol_is_valid (asymbol *, struct disassemble_info *); |
884b49e3 | 314 | extern bfd_boolean riscv_symbol_is_valid (asymbol *, struct disassemble_info *); |
b240011a | 315 | extern void disassemble_init_powerpc (struct disassemble_info *); |
65b48a81 | 316 | extern void disassemble_init_s390 (struct disassemble_info *); |
62ecb94c | 317 | extern void disassemble_init_wasm32 (struct disassemble_info *); |
fbaf61ad | 318 | extern void disassemble_init_nds32 (struct disassemble_info *); |
471b9d15 MR |
319 | extern const disasm_options_and_args_t *disassembler_options_arm (void); |
320 | extern const disasm_options_and_args_t *disassembler_options_mips (void); | |
321 | extern const disasm_options_and_args_t *disassembler_options_powerpc (void); | |
322 | extern const disasm_options_and_args_t *disassembler_options_s390 (void); | |
dd92f639 | 323 | |
003ca0fd YQ |
324 | /* Fetch the disassembler for a given architecture ARC, endianness (big |
325 | endian if BIG is true), bfd_mach value MACH, and ABFD, if that support | |
326 | is available. ABFD may be NULL. */ | |
327 | extern disassembler_ftype disassembler (enum bfd_architecture arc, | |
328 | bfd_boolean big, unsigned long mach, | |
329 | bfd *abfd); | |
252b5132 | 330 | |
22a398e1 NC |
331 | /* Amend the disassemble_info structure as necessary for the target architecture. |
332 | Should only be called after initialising the info->arch field. */ | |
e7f8eadb | 333 | extern void disassemble_init_for_target (struct disassemble_info * dinfo); |
22a398e1 | 334 | |
94470b23 | 335 | /* Document any target specific options available from the disassembler. */ |
8cf3f354 | 336 | extern void disassembler_usage (FILE *); |
94470b23 | 337 | |
65b48a81 PB |
338 | /* Remove whitespace and consecutive commas. */ |
339 | extern char *remove_whitespace_and_extra_commas (char *); | |
340 | ||
341 | /* Like STRCMP, but treat ',' the same as '\0' so that we match | |
342 | strings like "foobar" against "foobar,xxyyzz,...". */ | |
343 | extern int disassembler_options_cmp (const char *, const char *); | |
344 | ||
/* A helper function for FOR_EACH_DISASSEMBLER_OPTION.

   OPTIONS is a comma separated option string.  Return a pointer to the
   character following the first ',' in OPTIONS, or NULL if OPTIONS is
   NULL or contains no ','.  */
static inline const char *
next_disassembler_option (const char *options)
{
  const char *opt;

  /* strchr must not be handed a null pointer.  */
  if (options == NULL)
    return NULL;

  opt = strchr (options, ',');
  if (opt != NULL)
    opt++;
  return opt;
}
354 | ||
355 | /* A macro for iterating over each comma separated option in OPTIONS. */ | |
356 | #define FOR_EACH_DISASSEMBLER_OPTION(OPT, OPTIONS) \ | |
357 | for ((OPT) = (OPTIONS); \ | |
358 | (OPT) != NULL; \ | |
359 | (OPT) = next_disassembler_option (OPT)) | |
360 | ||
252b5132 RH |
361 | \f |
362 | /* This block of definitions is for particular callers who read instructions | |
363 | into a buffer before calling the instruction decoder. */ | |
364 | ||
365 | /* Here is a function which callers may wish to use for read_memory_func. | |
366 | It gets bytes from a buffer. */ | |
367 | extern int buffer_read_memory | |
8cf3f354 | 368 | (bfd_vma, bfd_byte *, unsigned int, struct disassemble_info *); |
252b5132 RH |
369 | |
370 | /* This function goes with buffer_read_memory. | |
371 | It prints a message using info->fprintf_func and info->stream. */ | |
8cf3f354 | 372 | extern void perror_memory (int, bfd_vma, struct disassemble_info *); |
252b5132 RH |
373 | |
374 | ||
375 | /* Just print the address in hex. This is included for completeness even | |
376 | though both GDB and objdump provide their own (to print symbolic | |
377 | addresses). */ | |
378 | extern void generic_print_address | |
8cf3f354 | 379 | (bfd_vma, struct disassemble_info *); |
252b5132 RH |
380 | |
381 | /* Always true. */ | |
382 | extern int generic_symbol_at_address | |
8cf3f354 | 383 | (bfd_vma, struct disassemble_info *); |
252b5132 | 384 | |
d70c5fc7 | 385 | /* Also always true. */ |
22a398e1 NC |
386 | extern bfd_boolean generic_symbol_is_valid |
387 | (asymbol *, struct disassemble_info *); | |
d70c5fc7 | 388 | |
92c2346c AC |
389 | /* Method to initialize a disassemble_info struct. This should be |
390 | called by all applications creating such a struct. */ | |
e7f8eadb | 391 | extern void init_disassemble_info (struct disassemble_info *dinfo, void *stream, |
92c2346c | 392 | fprintf_ftype fprintf_func); |
252b5132 | 393 | |
92c2346c AC |
394 | /* For compatibility with existing code. */ |
395 | #define INIT_DISASSEMBLE_INFO(INFO, STREAM, FPRINTF_FUNC) \ | |
396 | init_disassemble_info (&(INFO), (STREAM), (fprintf_ftype) (FPRINTF_FUNC)) | |
252b5132 | 397 | #define INIT_DISASSEMBLE_INFO_NO_ARCH(INFO, STREAM, FPRINTF_FUNC) \ |
92c2346c AC |
398 | init_disassemble_info (&(INFO), (STREAM), (fprintf_ftype) (FPRINTF_FUNC)) |
399 | ||
252b5132 | 400 | |
7d7a6736 | 401 | #ifdef __cplusplus |
8418f5ff | 402 | } |
7d7a6736 ILT |
403 | #endif |
404 | ||
252b5132 | 405 | #endif /* ! defined (DIS_ASM_H) */ |