リビジョン | 43025f01a0c99c939e20e90a6e695741c14a925a (tree) |
---|---|
日時 | 2022-10-25 10:20:23 |
作者 | Patrick O'Neill <patrick@rivo...> |
コミッター | Nelson Chu |
RISC-V: Improve link time complexity.
The riscv port does deletion and symbol table update for each relocation
while relaxing, so we are moving section bytes and scanning symbol table once
for each relocation. Compared to microblaze port, they record the relaxation
changes into a table, then do the deletion and symbol table update once per
section, rather than per relocation. Therefore, they should have better link
time complexity than us.
To improve the link time complexity, this patch try to make the deletion in
linear time. Compared to record the relaxation changes into a table, we
replace the unused relocation with R_RISCV_DELETE for the deleted bytes, and
then resolve them at the end of the section. Assuming the number of
R_RISCV_DELETE is m, and the number of symbols is n, the total link complexity
should be O(m) for moving section bytes, and O(m*n2) for symbol table update.
If we record the relaxation changes into the table, and then sort the symbol
table by values, then probably can reduce the time complexity to O(m*n*log(n))
for updating symbol table, but it doesn't seem worth it for now.
bfd/
@@ -4043,27 +4043,32 @@ riscv_update_pcgp_relocs (riscv_pcgp_relocs *p, asection *deleted_sec, | ||
4043 | 4043 | } |
4044 | 4044 | } |
4045 | 4045 | |
4046 | -/* Delete some bytes from a section while relaxing. */ | |
4046 | +/* Delete some bytes, adjust relcocations and symbol table from a section. */ | |
4047 | 4047 | |
4048 | 4048 | static bool |
4049 | -riscv_relax_delete_bytes (bfd *abfd, | |
4050 | - asection *sec, | |
4051 | - bfd_vma addr, | |
4052 | - size_t count, | |
4053 | - struct bfd_link_info *link_info, | |
4054 | - riscv_pcgp_relocs *p) | |
4049 | +_riscv_relax_delete_bytes (bfd *abfd, | |
4050 | + asection *sec, | |
4051 | + bfd_vma addr, | |
4052 | + size_t count, | |
4053 | + struct bfd_link_info *link_info, | |
4054 | + riscv_pcgp_relocs *p, | |
4055 | + bfd_vma delete_total, | |
4056 | + bfd_vma toaddr) | |
4055 | 4057 | { |
4056 | 4058 | unsigned int i, symcount; |
4057 | - bfd_vma toaddr = sec->size; | |
4058 | 4059 | struct elf_link_hash_entry **sym_hashes = elf_sym_hashes (abfd); |
4059 | 4060 | Elf_Internal_Shdr *symtab_hdr = &elf_tdata (abfd)->symtab_hdr; |
4060 | 4061 | unsigned int sec_shndx = _bfd_elf_section_from_bfd_section (abfd, sec); |
4061 | 4062 | struct bfd_elf_section_data *data = elf_section_data (sec); |
4062 | 4063 | bfd_byte *contents = data->this_hdr.contents; |
4064 | + size_t bytes_to_move = toaddr - addr - count; | |
4063 | 4065 | |
4064 | 4066 | /* Actually delete the bytes. */ |
4065 | 4067 | sec->size -= count; |
4066 | - memmove (contents + addr, contents + addr + count, toaddr - addr - count); | |
4068 | + memmove (contents + addr, contents + addr + count + delete_total, bytes_to_move); | |
4069 | + | |
4070 | + /* Still adjust relocations and symbols in non-linear times. */ | |
4071 | + toaddr = sec->size + count; | |
4067 | 4072 | |
4068 | 4073 | /* Adjust the location of all of the relocs. Note that we need not |
4069 | 4074 | adjust the addends, since all PC-relative references must be against |
@@ -4161,6 +4166,99 @@ riscv_relax_delete_bytes (bfd *abfd, | ||
4161 | 4166 | return true; |
4162 | 4167 | } |
4163 | 4168 | |
4169 | +typedef bool (*relax_delete_t) (bfd *, asection *, | |
4170 | + bfd_vma, size_t, | |
4171 | + struct bfd_link_info *, | |
4172 | + riscv_pcgp_relocs *, | |
4173 | + Elf_Internal_Rela *); | |
4174 | + | |
4175 | +static relax_delete_t riscv_relax_delete_bytes; | |
4176 | + | |
4177 | +/* Do not delete some bytes from a section while relaxing. | |
4178 | + Just mark the deleted bytes as R_RISCV_DELETE. */ | |
4179 | + | |
4180 | +static bool | |
4181 | +_riscv_relax_delete_piecewise (bfd *abfd ATTRIBUTE_UNUSED, | |
4182 | + asection *sec ATTRIBUTE_UNUSED, | |
4183 | + bfd_vma addr, | |
4184 | + size_t count, | |
4185 | + struct bfd_link_info *link_info ATTRIBUTE_UNUSED, | |
4186 | + riscv_pcgp_relocs *p ATTRIBUTE_UNUSED, | |
4187 | + Elf_Internal_Rela *rel) | |
4188 | +{ | |
4189 | + if (rel == NULL) | |
4190 | + return false; | |
4191 | + rel->r_info = ELFNN_R_INFO (0, R_RISCV_DELETE); | |
4192 | + rel->r_offset = addr; | |
4193 | + rel->r_addend = count; | |
4194 | + return true; | |
4195 | +} | |
4196 | + | |
4197 | +/* Delete some bytes from a section while relaxing. */ | |
4198 | + | |
4199 | +static bool | |
4200 | +_riscv_relax_delete_immediate (bfd *abfd, | |
4201 | + asection *sec, | |
4202 | + bfd_vma addr, | |
4203 | + size_t count, | |
4204 | + struct bfd_link_info *link_info, | |
4205 | + riscv_pcgp_relocs *p, | |
4206 | + Elf_Internal_Rela *rel) | |
4207 | +{ | |
4208 | + if (rel != NULL) | |
4209 | + rel->r_info = ELFNN_R_INFO (0, R_RISCV_NONE); | |
4210 | + return _riscv_relax_delete_bytes (abfd, sec, addr, count, | |
4211 | + link_info, p, 0, sec->size); | |
4212 | +} | |
4213 | + | |
4214 | +/* Delete the bytes for R_RISCV_DELETE relocs. */ | |
4215 | + | |
4216 | +static bool | |
4217 | +riscv_relax_resolve_delete_relocs (bfd *abfd, | |
4218 | + asection *sec, | |
4219 | + struct bfd_link_info *link_info, | |
4220 | + Elf_Internal_Rela *relocs) | |
4221 | +{ | |
4222 | + bfd_vma delete_total = 0; | |
4223 | + unsigned int i; | |
4224 | + | |
4225 | + for (i = 0; i < sec->reloc_count; i++) | |
4226 | + { | |
4227 | + Elf_Internal_Rela *rel = relocs + i; | |
4228 | + if (ELFNN_R_TYPE (rel->r_info) != R_RISCV_DELETE) | |
4229 | + continue; | |
4230 | + | |
4231 | + /* Find the next R_RISCV_DELETE reloc if possible. */ | |
4232 | + Elf_Internal_Rela *rel_next = NULL; | |
4233 | + unsigned int start = rel - relocs; | |
4234 | + for (i = start; i < sec->reloc_count; i++) | |
4235 | + { | |
4236 | + /* Since we only replace existing relocs and don't add new relocs, the | |
4237 | + relocs are in sequential order. We can skip the relocs prior to this | |
4238 | + one, making this search linear time. */ | |
4239 | + rel_next = relocs + i; | |
4240 | + if (ELFNN_R_TYPE ((rel_next)->r_info) == R_RISCV_DELETE | |
4241 | + && (rel_next)->r_offset > rel->r_offset) | |
4242 | + break; | |
4243 | + else | |
4244 | + rel_next = NULL; | |
4245 | + } | |
4246 | + | |
4247 | + bfd_vma toaddr = rel_next == NULL ? sec->size : rel_next->r_offset; | |
4248 | + if (!_riscv_relax_delete_bytes (abfd, sec, rel->r_offset, rel->r_addend, | |
4249 | + link_info, NULL, delete_total, toaddr)) | |
4250 | + return false; | |
4251 | + | |
4252 | + delete_total += rel->r_addend; | |
4253 | + rel->r_info = ELFNN_R_INFO (0, R_RISCV_NONE); | |
4254 | + | |
4255 | + /* Skip ahead to the next delete reloc. */ | |
4256 | + i = rel_next != NULL ? rel_next - relocs - 1 : sec->reloc_count; | |
4257 | + } | |
4258 | + | |
4259 | + return true; | |
4260 | +} | |
4261 | + | |
4164 | 4262 | typedef bool (*relax_func_t) (bfd *, asection *, asection *, |
4165 | 4263 | struct bfd_link_info *, |
4166 | 4264 | Elf_Internal_Rela *, |
@@ -4239,10 +4337,10 @@ _bfd_riscv_relax_call (bfd *abfd, asection *sec, asection *sym_sec, | ||
4239 | 4337 | /* Replace the AUIPC. */ |
4240 | 4338 | riscv_put_insn (8 * len, auipc, contents + rel->r_offset); |
4241 | 4339 | |
4242 | - /* Delete unnecessary JALR. */ | |
4340 | + /* Delete unnecessary JALR and reuse the R_RISCV_RELAX reloc. */ | |
4243 | 4341 | *again = true; |
4244 | 4342 | return riscv_relax_delete_bytes (abfd, sec, rel->r_offset + len, 8 - len, |
4245 | - link_info, pcgp_relocs); | |
4343 | + link_info, pcgp_relocs, rel + 1); | |
4246 | 4344 | } |
4247 | 4345 | |
4248 | 4346 | /* Traverse all output sections and return the max alignment. */ |
@@ -4332,11 +4430,10 @@ _bfd_riscv_relax_lui (bfd *abfd, | ||
4332 | 4430 | return true; |
4333 | 4431 | |
4334 | 4432 | case R_RISCV_HI20: |
4335 | - /* We can delete the unnecessary LUI and reloc. */ | |
4336 | - rel->r_info = ELFNN_R_INFO (0, R_RISCV_NONE); | |
4433 | + /* Delete unnecessary LUI and reuse the reloc. */ | |
4337 | 4434 | *again = true; |
4338 | 4435 | return riscv_relax_delete_bytes (abfd, sec, rel->r_offset, 4, |
4339 | - link_info, pcgp_relocs); | |
4436 | + link_info, pcgp_relocs, rel); | |
4340 | 4437 | |
4341 | 4438 | default: |
4342 | 4439 | abort (); |
@@ -4367,9 +4464,10 @@ _bfd_riscv_relax_lui (bfd *abfd, | ||
4367 | 4464 | /* Replace the R_RISCV_HI20 reloc. */ |
4368 | 4465 | rel->r_info = ELFNN_R_INFO (ELFNN_R_SYM (rel->r_info), R_RISCV_RVC_LUI); |
4369 | 4466 | |
4467 | + /* Delete extra bytes and reuse the R_RISCV_RELAX reloc. */ | |
4370 | 4468 | *again = true; |
4371 | 4469 | return riscv_relax_delete_bytes (abfd, sec, rel->r_offset + 2, 2, |
4372 | - link_info, pcgp_relocs); | |
4470 | + link_info, pcgp_relocs, rel + 1); | |
4373 | 4471 | } |
4374 | 4472 | |
4375 | 4473 | return true; |
@@ -4407,11 +4505,10 @@ _bfd_riscv_relax_tls_le (bfd *abfd, | ||
4407 | 4505 | |
4408 | 4506 | case R_RISCV_TPREL_HI20: |
4409 | 4507 | case R_RISCV_TPREL_ADD: |
4410 | - /* We can delete the unnecessary instruction and reloc. */ | |
4411 | - rel->r_info = ELFNN_R_INFO (0, R_RISCV_NONE); | |
4508 | + /* Delete unnecessary instruction and reuse the reloc. */ | |
4412 | 4509 | *again = true; |
4413 | 4510 | return riscv_relax_delete_bytes (abfd, sec, rel->r_offset, 4, link_info, |
4414 | - pcgp_relocs); | |
4511 | + pcgp_relocs, rel); | |
4415 | 4512 | |
4416 | 4513 | default: |
4417 | 4514 | abort (); |
@@ -4472,10 +4569,10 @@ _bfd_riscv_relax_align (bfd *abfd, asection *sec, | ||
4472 | 4569 | if (nop_bytes % 4 != 0) |
4473 | 4570 | bfd_putl16 (RVC_NOP, contents + rel->r_offset + pos); |
4474 | 4571 | |
4475 | - /* Delete the excess bytes. */ | |
4572 | + /* Delete excess bytes. */ | |
4476 | 4573 | return riscv_relax_delete_bytes (abfd, sec, rel->r_offset + nop_bytes, |
4477 | 4574 | rel->r_addend - nop_bytes, link_info, |
4478 | - NULL); | |
4575 | + NULL, NULL); | |
4479 | 4576 | } |
4480 | 4577 | |
4481 | 4578 | /* Relax PC-relative references to GP-relative references. */ |
@@ -4617,9 +4714,9 @@ _bfd_riscv_relax_pc (bfd *abfd ATTRIBUTE_UNUSED, | ||
4617 | 4714 | ELFNN_R_SYM(rel->r_info), |
4618 | 4715 | sym_sec, |
4619 | 4716 | undefined_weak); |
4620 | - /* We can delete the unnecessary AUIPC and reloc. */ | |
4621 | - rel->r_info = ELFNN_R_INFO (0, R_RISCV_DELETE); | |
4622 | - rel->r_addend = 4; | |
4717 | + /* Delete unnecessary AUIPC and reuse the reloc. */ | |
4718 | + riscv_relax_delete_bytes (abfd, sec, rel->r_offset, 4, link_info, | |
4719 | + pcgp_relocs, rel); | |
4623 | 4720 | return true; |
4624 | 4721 | |
4625 | 4722 | default: |
@@ -4630,28 +4727,6 @@ _bfd_riscv_relax_pc (bfd *abfd ATTRIBUTE_UNUSED, | ||
4630 | 4727 | return true; |
4631 | 4728 | } |
4632 | 4729 | |
4633 | -/* Delete the bytes for R_RISCV_DELETE. */ | |
4634 | - | |
4635 | -static bool | |
4636 | -_bfd_riscv_relax_delete (bfd *abfd, | |
4637 | - asection *sec, | |
4638 | - asection *sym_sec ATTRIBUTE_UNUSED, | |
4639 | - struct bfd_link_info *link_info, | |
4640 | - Elf_Internal_Rela *rel, | |
4641 | - bfd_vma symval ATTRIBUTE_UNUSED, | |
4642 | - bfd_vma max_alignment ATTRIBUTE_UNUSED, | |
4643 | - bfd_vma reserve_size ATTRIBUTE_UNUSED, | |
4644 | - bool *again ATTRIBUTE_UNUSED, | |
4645 | - riscv_pcgp_relocs *pcgp_relocs ATTRIBUTE_UNUSED, | |
4646 | - bool undefined_weak ATTRIBUTE_UNUSED) | |
4647 | -{ | |
4648 | - if (!riscv_relax_delete_bytes (abfd, sec, rel->r_offset, rel->r_addend, | |
4649 | - link_info, NULL)) | |
4650 | - return false; | |
4651 | - rel->r_info = ELFNN_R_INFO (0, R_RISCV_NONE); | |
4652 | - return true; | |
4653 | -} | |
4654 | - | |
4655 | 4730 | /* Called by after_allocation to set the information of data segment |
4656 | 4731 | before relaxing. */ |
4657 | 4732 |
@@ -4729,6 +4804,7 @@ _bfd_riscv_relax_section (bfd *abfd, asection *sec, | ||
4729 | 4804 | bool undefined_weak = false; |
4730 | 4805 | |
4731 | 4806 | relax_func = NULL; |
4807 | + riscv_relax_delete_bytes = NULL; | |
4732 | 4808 | if (info->relax_pass == 0) |
4733 | 4809 | { |
4734 | 4810 | if (type == R_RISCV_CALL |
@@ -4750,6 +4826,7 @@ _bfd_riscv_relax_section (bfd *abfd, asection *sec, | ||
4750 | 4826 | relax_func = _bfd_riscv_relax_pc; |
4751 | 4827 | else |
4752 | 4828 | continue; |
4829 | + riscv_relax_delete_bytes = _riscv_relax_delete_piecewise; | |
4753 | 4830 | |
4754 | 4831 | /* Only relax this reloc if it is paired with R_RISCV_RELAX. */ |
4755 | 4832 | if (i == sec->reloc_count - 1 |
@@ -4760,10 +4837,11 @@ _bfd_riscv_relax_section (bfd *abfd, asection *sec, | ||
4760 | 4837 | /* Skip over the R_RISCV_RELAX. */ |
4761 | 4838 | i++; |
4762 | 4839 | } |
4763 | - else if (info->relax_pass == 1 && type == R_RISCV_DELETE) | |
4764 | - relax_func = _bfd_riscv_relax_delete; | |
4765 | - else if (info->relax_pass == 2 && type == R_RISCV_ALIGN) | |
4766 | - relax_func = _bfd_riscv_relax_align; | |
4840 | + else if (info->relax_pass == 1 && type == R_RISCV_ALIGN) | |
4841 | + { | |
4842 | + relax_func = _bfd_riscv_relax_align; | |
4843 | + riscv_relax_delete_bytes = _riscv_relax_delete_immediate; | |
4844 | + } | |
4767 | 4845 | else |
4768 | 4846 | continue; |
4769 | 4847 |
@@ -4921,6 +4999,10 @@ _bfd_riscv_relax_section (bfd *abfd, asection *sec, | ||
4921 | 4999 | goto fail; |
4922 | 5000 | } |
4923 | 5001 | |
5002 | + /* Resolve R_RISCV_DELETE relocations. */ | |
5003 | + if (!riscv_relax_resolve_delete_relocs (abfd, sec, info, relocs)) | |
5004 | + goto fail; | |
5005 | + | |
4924 | 5006 | ret = true; |
4925 | 5007 | |
4926 | 5008 | fail: |