db22231044
commit 3ae729d5a4
Author: H.J. Lu <hjl.tools@gmail.com>
Date: Wed Mar 7 04:18:45 2018 -0800
x86: Rewrite NOP generation for fill and alignment
increased MAX_MEM_FOR_RS_ALIGN_CODE to 4095 which resulted in increase
of assembler time and memory usage by 5 times for inputs with many
.p2align directives, which is typical for LTO output. This patch passes
max_bytes to TC_FRAG_INIT so that MAX_MEM_FOR_RS_ALIGN_CODE can be set
as needed and tracked by the backend itself, so that HANDLE_ALIGN can check the
maximum alignment for each rs_align_code frag. Wall time to assemble
the same cc1plus.s:
before:
423.78user 0.89system 7:05.71elapsed 99%CPU
after:
102.35user 0.27system 1:42.89elapsed 99%CPU
PR gas/24165
* frags.c (frag_var_init): Pass max_chars to TC_FRAG_INIT as
max_bytes.
* config/tc-aarch64.h (TC_FRAG_INIT): Add and pass max_bytes to
aarch64_init_frag.
* config/tc-arm.h (TC_FRAG_INIT): Add and pass max_bytes to
arm_init_frag.
* config/tc-avr.h (TC_FRAG_INIT): Add and ignore max_bytes.
* config/tc-ia64.h (TC_FRAG_INIT): Likewise.
* config/tc-mmix.h (TC_FRAG_INIT): Likewise.
* config/tc-nds32.h (TC_FRAG_INIT): Likewise.
* config/tc-ns32k.h (TC_FRAG_INIT): Likewise.
* config/tc-rl78.h (TC_FRAG_INIT): Likewise.
* config/tc-rx.h (TC_FRAG_INIT): Likewise.
* config/tc-score.h (TC_FRAG_INIT): Likewise.
* config/tc-tic54x.h (TC_FRAG_INIT): Likewise.
* config/tc-tic6x.h (TC_FRAG_INIT): Likewise.
* config/tc-xtensa.h (TC_FRAG_INIT): Likewise.
* config/tc-i386.h (MAX_MEM_FOR_RS_ALIGN_CODE): Set to
(alignment ? ((1 << alignment) - 1) : 1)
(i386_tc_frag_data): Add max_bytes.
(TC_FRAG_INIT): Add and track max_bytes.
(HANDLE_ALIGN): Replace MAX_MEM_FOR_RS_ALIGN_CODE with
fragP->tc_frag_data.max_bytes.
* doc/internals.texi: Update TC_FRAG_TYPE with max_bytes.
248 lines
10 KiB
C
248 lines
10 KiB
C
/* This file is tc-avr.h
|
|
Copyright (C) 1999-2019 Free Software Foundation, Inc.
|
|
|
|
Contributed by Denis Chertykov <denisc@overta.ru>
|
|
|
|
This file is part of GAS, the GNU Assembler.
|
|
|
|
GAS is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 3, or (at your option)
|
|
any later version.
|
|
|
|
GAS is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GAS; see the file COPYING. If not, write to the Free
|
|
Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
|
|
02110-1301, USA. */
|
|
|
|
/* By convention, you should define this macro in the `.h' file.  For
   example, `tc-m68k.h' defines `TC_M68K'.  You might have to use this
   if it is necessary to add CPU specific code to the object format
   file.  */
#define TC_AVR

/* This macro is the BFD target name to use when creating the output
   file.  This will normally depend upon the `OBJ_FMT' macro.  */
#define TARGET_FORMAT "elf32-avr"

/* This macro is the BFD architecture to pass to `bfd_set_arch_mach'.  */
#define TARGET_ARCH bfd_arch_avr

/* This macro is the BFD machine number to pass to
   `bfd_set_arch_mach'.  If it is not defined, GAS will use 0.  */
#define TARGET_MACH 0

/* You should define this macro to be non-zero if the target is big
   endian, and zero if the target is little endian.  AVR sets it to
   zero.  */
#define TARGET_BYTES_BIG_ENDIAN 0

/* If you define this macro, GAS will warn about the use of
   nonstandard escape sequences in a string.  */
#define ONLY_STANDARD_ESCAPES

#define DIFF_EXPR_OK    /* .-foo gets turned into PC relative relocs */

/* GAS will call this function for any expression that can not be
   recognized.  When the function is called, `input_line_pointer'
   will point to the start of the expression.  The macro expands to
   nothing here, so no action is taken.  */
#define md_operand(x)
|
|
|
|
typedef struct
|
|
{
|
|
/* Name of the expression modifier allowed with .byte, .word, etc. */
|
|
const char *name;
|
|
|
|
/* Only allowed with n bytes of data. */
|
|
int nbytes;
|
|
|
|
/* Associated RELOC. */
|
|
bfd_reloc_code_real_type reloc;
|
|
|
|
/* Part of the error message. */
|
|
const char *error;
|
|
} exp_mod_data_t;
|
|
|
|
extern const exp_mod_data_t exp_mod_data[];
|
|
#define TC_PARSE_CONS_RETURN_TYPE const exp_mod_data_t *
|
|
#define TC_PARSE_CONS_RETURN_NONE exp_mod_data
|
|
|
|
/* You may define this macro to parse an expression used in a data
|
|
allocation pseudo-op such as `.word'. You can use this to
|
|
recognize relocation directives that may appear in such directives. */
|
|
#define TC_PARSE_CONS_EXPRESSION(EXPR,N) avr_parse_cons_expression (EXPR, N)
|
|
extern const exp_mod_data_t *avr_parse_cons_expression (expressionS *, int);
|
|
|
|
/* You may define this macro to generate a fixup for a data
|
|
allocation pseudo-op. */
|
|
#define TC_CONS_FIX_NEW avr_cons_fix_new
|
|
extern void avr_cons_fix_new (fragS *,int, int, expressionS *,
|
|
const exp_mod_data_t *);
|
|
|
|
/* This should just call either `number_to_chars_bigendian' or
   `number_to_chars_littleendian', whichever is appropriate.  On
   targets like the MIPS which support options to change the
   endianness, which function to call is a runtime decision.  On
   other targets, `md_number_to_chars' can be a simple macro.  */
#define md_number_to_chars number_to_chars_littleendian

/* `md_short_jump_size'
   `md_long_jump_size'
   `md_create_short_jump'
   `md_create_long_jump'
   If `WORKING_DOT_WORD' is defined, GAS will not do broken word
   processing (*note Broken words::.).  Otherwise, you should set
   `md_short_jump_size' to the size of a short jump (a jump that is
   just long enough to jump around a long jmp) and
   `md_long_jump_size' to the size of a long jump (a jump that can go
   anywhere in the function).  You should define
   `md_create_short_jump' to create a short jump around a long jump,
   and define `md_create_long_jump' to create a long jump.  */
#define WORKING_DOT_WORD

/* If you define this macro, it means that `tc_gen_reloc' may return
   multiple relocation entries for a single fixup.  In this case, the
   return value of `tc_gen_reloc' is a pointer to a null terminated
   array.  It is explicitly left undefined here.  */
#undef RELOC_EXPANSION_POSSIBLE

/* No shared lib support, so we don't need to ensure externally
   visible symbols can be overridden.  */
#define EXTERN_FORCE_RELOC 0

/* If defined, this macro allows control over whether fixups for a
   given section will be processed when the linkrelax variable is
   set.  Define it to zero and handle things in md_apply_fix instead.  */
#define TC_LINKRELAX_FIXUP(SEG) 0
|
|
|
|
/* If this macro returns non-zero, it guarantees that a relocation will be emitted
|
|
even when the value can be resolved locally. Do that if linkrelax is turned on */
|
|
#define TC_FORCE_RELOCATION(fix) avr_force_relocation (fix)
|
|
#define TC_FORCE_RELOCATION_SUB_SAME(fix, seg) \
|
|
(GENERIC_FORCE_RELOCATION_SUB_SAME (fix, seg) \
|
|
|| avr_force_relocation (fix))
|
|
extern int avr_force_relocation (struct fix *);
|
|
|
|
/* Values passed to md_apply_fix don't include the symbol value. */
|
|
#define MD_APPLY_SYM_VALUE(FIX) 0
|
|
|
|
/* If you define this macro, it should return the offset between the
|
|
address of a PC relative fixup and the position from which the PC
|
|
relative adjustment should be made. On many processors, the base
|
|
of a PC relative instruction is the next instruction, so this
|
|
macro would return the length of an instruction. */
|
|
#define MD_PCREL_FROM_SECTION(FIX, SEC) md_pcrel_from_section (FIX, SEC)
|
|
extern long md_pcrel_from_section (struct fix *, segT);
|
|
|
|
/* The number of bytes to put into a word in a listing.  This affects
   the way the bytes are clumped together in the listing.  For
   example, a value of 2 might print `1234 5678' where a value of 1
   would print `12 34 56 78'.  The default value is 4.  */
#define LISTING_WORD_SIZE 2

/* AVR port uses `$' as a logical line separator.  */
#define LEX_DOLLAR 0

/* An `.lcomm' directive with no explicit alignment parameter will
   use this macro to set P2VAR to the alignment that a request for
   SIZE bytes will have.  The alignment is expressed as a power of
   two.  If no alignment should take place, the macro definition
   should do nothing.  Some targets define a `.bss' directive that is
   also affected by this macro.  The default definition will set
   P2VAR to the truncated power of two of sizes up to eight bytes.

   Here SIZE is ignored and P2VAR is always set to 0.  The expansion
   is fully parenthesized so that it stays a single expression
   wherever it is used.  */
#define TC_IMPLICIT_LCOMM_ALIGNMENT(SIZE, P2VAR) ((P2VAR) = 0)
|
|
|
|
/* We don't want gas to fixup the following program memory related
   relocations.  We will need them in case that we want to do linker
   relaxation.  We could in principle keep these fixups in gas when
   not relaxing.  However, there is no serious performance penalty
   when making the linker make the fixup work.  Check also that
   fx_addsy is not NULL, in order to make sure that the fixup refers
   to some sort of label.

   FIXP is the fixup to examine, SEG is unused, and SKIP is the label
   jumped to when the fixup must be left alone.  When FIXP has one of
   the listed relocation types, a non-NULL fx_addsy and a NULL
   fx_subsy, its symbol is marked as used in a relocation and control
   transfers to SKIP; otherwise execution falls through.

   The body is wrapped in do { } while (0) so that the macro followed
   by a semicolon forms exactly one statement (safe in an unbraced
   if/else), and FIXP is parenthesized so that any pointer expression
   may be passed.  */
#define TC_VALIDATE_FIX(FIXP, SEG, SKIP)                                \
  do                                                                    \
    {                                                                   \
      if (((FIXP)->fx_r_type == BFD_RELOC_AVR_7_PCREL                   \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_13_PCREL               \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_LO8_LDI_PM             \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_LO8_LDI_GS             \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_HI8_LDI_PM             \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_HI8_LDI_GS             \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_HH8_LDI_PM             \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_LO8_LDI_PM_NEG         \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_HI8_LDI_PM_NEG         \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_HH8_LDI_PM_NEG         \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_8_LO                   \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_8_HI                   \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_8_HLO                  \
           || (FIXP)->fx_r_type == BFD_RELOC_AVR_16_PM)                 \
          && (FIXP)->fx_addsy != NULL                                   \
          && (FIXP)->fx_subsy == NULL)                                  \
        {                                                               \
          symbol_mark_used_in_reloc ((FIXP)->fx_addsy);                 \
          goto SKIP;                                                    \
        }                                                               \
    }                                                                   \
  while (0)
|
|
|
|
/* This macro is evaluated for any fixup with a fx_subsy that
   fixup_segment cannot reduce to a number.  If the macro returns
   false an error will be reported.  The SEG argument is not passed
   on to avr_validate_fix_sub.  */
#define TC_VALIDATE_FIX_SUB(fix, seg) avr_validate_fix_sub (fix)
extern int avr_validate_fix_sub (struct fix *);

/* This target is buggy, and sets fix size too large.  */
#define TC_FX_SIZE_SLACK(FIX) 2
|
|
|
|
/* AVR instructions are 2 or 4 bytes long.  */
#define DWARF2_LINE_MIN_INSN_LENGTH 2

/* 32 bits pseudo-addresses are used on AVR.  */
#define DWARF2_ADDR_SIZE(bfd) 4

/* Enable cfi directives.  */
#define TARGET_USE_CFIPOP 1

/* The stack grows down, and is only byte aligned.  The negative
   value is parenthesized so that it stays one operand in any
   expression the macro is pasted into.  */
#define DWARF2_CIE_DATA_ALIGNMENT (-1)

/* Define the column that represents the PC.  */
#define DWARF2_DEFAULT_RETURN_COLUMN 36

/* Define a hook to setup initial CFI state.  The macro expands to
   the function's own name, so preprocessor tests for the hook
   succeed.  */
extern void tc_cfi_frame_initial_instructions (void);
#define tc_cfi_frame_initial_instructions tc_cfi_frame_initial_instructions
|
|
|
|
/* The difference between same-section symbols may be affected by linker
|
|
relaxation, so do not resolve such expressions in the assembler. */
|
|
#define md_allow_local_subtract(l,r,s) avr_allow_local_subtract (l, r, s)
|
|
extern bfd_boolean avr_allow_local_subtract (expressionS *, expressionS *, segT);
|
|
|
|
#define elf_tc_final_processing avr_elf_final_processing
|
|
extern void avr_elf_final_processing (void);
|
|
|
|
#define md_pre_output_hook avr_pre_output_hook ()
|
|
extern void avr_pre_output_hook (void);
|
|
|
|
#define md_undefined_symbol avr_undefined_symbol
|
|
extern symbolS* avr_undefined_symbol (char*);
|
|
|
|
#define md_post_relax_hook avr_post_relax_hook ()
|
|
extern void avr_post_relax_hook (void);
|
|
|
|
#define HANDLE_ALIGN(fragP) avr_handle_align (fragP)
|
|
extern void avr_handle_align (fragS *);
|
|
|
|
struct avr_frag_data
|
|
{
|
|
unsigned is_org : 1;
|
|
unsigned is_align : 1;
|
|
unsigned has_fill : 1;
|
|
|
|
char fill;
|
|
offsetT alignment;
|
|
unsigned int prev_opcode;
|
|
};
|
|
#define TC_FRAG_TYPE struct avr_frag_data
|
|
#define TC_FRAG_INIT(frag, max_bytes) avr_frag_init (frag)
|
|
extern void avr_frag_init (fragS *);
|