1*fae548d3Szrj // merge.cc -- handle section merging for gold
2*fae548d3Szrj 
3*fae548d3Szrj // Copyright (C) 2006-2020 Free Software Foundation, Inc.
4*fae548d3Szrj // Written by Ian Lance Taylor <iant@google.com>.
5*fae548d3Szrj 
6*fae548d3Szrj // This file is part of gold.
7*fae548d3Szrj 
8*fae548d3Szrj // This program is free software; you can redistribute it and/or modify
9*fae548d3Szrj // it under the terms of the GNU General Public License as published by
10*fae548d3Szrj // the Free Software Foundation; either version 3 of the License, or
11*fae548d3Szrj // (at your option) any later version.
12*fae548d3Szrj 
13*fae548d3Szrj // This program is distributed in the hope that it will be useful,
14*fae548d3Szrj // but WITHOUT ANY WARRANTY; without even the implied warranty of
15*fae548d3Szrj // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16*fae548d3Szrj // GNU General Public License for more details.
17*fae548d3Szrj 
18*fae548d3Szrj // You should have received a copy of the GNU General Public License
19*fae548d3Szrj // along with this program; if not, write to the Free Software
20*fae548d3Szrj // Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
21*fae548d3Szrj // MA 02110-1301, USA.
22*fae548d3Szrj 
23*fae548d3Szrj #include "gold.h"
24*fae548d3Szrj 
25*fae548d3Szrj #include <cstdlib>
26*fae548d3Szrj #include <algorithm>
27*fae548d3Szrj 
28*fae548d3Szrj #include "merge.h"
29*fae548d3Szrj #include "compressed_output.h"
30*fae548d3Szrj 
31*fae548d3Szrj namespace gold
32*fae548d3Szrj {
33*fae548d3Szrj 
34*fae548d3Szrj // Class Object_merge_map.
35*fae548d3Szrj 
36*fae548d3Szrj // Destructor.
37*fae548d3Szrj 
~Object_merge_map()38*fae548d3Szrj Object_merge_map::~Object_merge_map()
39*fae548d3Szrj {
40*fae548d3Szrj   for (Section_merge_maps::iterator p = this->section_merge_maps_.begin();
41*fae548d3Szrj        p != this->section_merge_maps_.end();
42*fae548d3Szrj        ++p)
43*fae548d3Szrj     delete p->second;
44*fae548d3Szrj }
45*fae548d3Szrj 
46*fae548d3Szrj // Get the Input_merge_map to use for an input section, or NULL.
47*fae548d3Szrj 
48*fae548d3Szrj const Object_merge_map::Input_merge_map*
get_input_merge_map(unsigned int shndx) const49*fae548d3Szrj Object_merge_map::get_input_merge_map(unsigned int shndx) const
50*fae548d3Szrj {
51*fae548d3Szrj   gold_assert(shndx != -1U);
52*fae548d3Szrj   const Section_merge_maps &maps = this->section_merge_maps_;
53*fae548d3Szrj   for (Section_merge_maps::const_iterator i = maps.begin(), e = maps.end();
54*fae548d3Szrj        i != e; ++i)
55*fae548d3Szrj     {
56*fae548d3Szrj       if (i->first == shndx)
57*fae548d3Szrj 	return i->second;
58*fae548d3Szrj     }
59*fae548d3Szrj   return NULL;
60*fae548d3Szrj }
61*fae548d3Szrj 
62*fae548d3Szrj // Get or create the Input_merge_map to use for an input section.
63*fae548d3Szrj 
64*fae548d3Szrj Object_merge_map::Input_merge_map*
get_or_make_input_merge_map(const Output_section_data * output_data,unsigned int shndx)65*fae548d3Szrj Object_merge_map::get_or_make_input_merge_map(
66*fae548d3Szrj     const Output_section_data* output_data, unsigned int shndx) {
67*fae548d3Szrj   Input_merge_map* map = this->get_input_merge_map(shndx);
68*fae548d3Szrj   if (map != NULL)
69*fae548d3Szrj     {
70*fae548d3Szrj       // For a given input section in a given object, every mapping
71*fae548d3Szrj       // must be done with the same Merge_map.
72*fae548d3Szrj       gold_assert(map->output_data == output_data);
73*fae548d3Szrj       return map;
74*fae548d3Szrj     }
75*fae548d3Szrj 
76*fae548d3Szrj   Input_merge_map* new_map = new Input_merge_map;
77*fae548d3Szrj   new_map->output_data = output_data;
78*fae548d3Szrj   Section_merge_maps &maps = this->section_merge_maps_;
79*fae548d3Szrj   maps.push_back(std::make_pair(shndx, new_map));
80*fae548d3Szrj   return new_map;
81*fae548d3Szrj }
82*fae548d3Szrj 
83*fae548d3Szrj // Add a mapping.
84*fae548d3Szrj 
85*fae548d3Szrj void
add_mapping(const Output_section_data * output_data,unsigned int shndx,section_offset_type input_offset,section_size_type length,section_offset_type output_offset)86*fae548d3Szrj Object_merge_map::add_mapping(const Output_section_data* output_data,
87*fae548d3Szrj 			      unsigned int shndx,
88*fae548d3Szrj 			      section_offset_type input_offset,
89*fae548d3Szrj 			      section_size_type length,
90*fae548d3Szrj 			      section_offset_type output_offset)
91*fae548d3Szrj {
92*fae548d3Szrj   Input_merge_map* map = this->get_or_make_input_merge_map(output_data, shndx);
93*fae548d3Szrj   map->add_mapping(input_offset, length, output_offset);
94*fae548d3Szrj }
95*fae548d3Szrj 
96*fae548d3Szrj void
add_mapping(section_offset_type input_offset,section_size_type length,section_offset_type output_offset)97*fae548d3Szrj Object_merge_map::Input_merge_map::add_mapping(
98*fae548d3Szrj     section_offset_type input_offset, section_size_type length,
99*fae548d3Szrj     section_offset_type output_offset) {
100*fae548d3Szrj   // Try to merge the new entry in the last one we saw.
101*fae548d3Szrj   if (!this->entries.empty())
102*fae548d3Szrj     {
103*fae548d3Szrj       Input_merge_entry& entry(this->entries.back());
104*fae548d3Szrj 
105*fae548d3Szrj       // Use section_size_type to avoid signed/unsigned warnings.
106*fae548d3Szrj       section_size_type input_offset_u = input_offset;
107*fae548d3Szrj       section_size_type output_offset_u = output_offset;
108*fae548d3Szrj 
109*fae548d3Szrj       // If this entry is not in order, we need to sort the vector
110*fae548d3Szrj       // before looking anything up.
111*fae548d3Szrj       if (input_offset_u < entry.input_offset + entry.length)
112*fae548d3Szrj 	{
113*fae548d3Szrj 	  gold_assert(input_offset < entry.input_offset);
114*fae548d3Szrj 	  gold_assert(input_offset_u + length
115*fae548d3Szrj 		      <= static_cast<section_size_type>(entry.input_offset));
116*fae548d3Szrj 	  this->sorted = false;
117*fae548d3Szrj 	}
118*fae548d3Szrj       else if (entry.input_offset + entry.length == input_offset_u
119*fae548d3Szrj 	       && (output_offset == -1
120*fae548d3Szrj 		   ? entry.output_offset == -1
121*fae548d3Szrj 		   : entry.output_offset + entry.length == output_offset_u))
122*fae548d3Szrj 	{
123*fae548d3Szrj 	  entry.length += length;
124*fae548d3Szrj 	  return;
125*fae548d3Szrj 	}
126*fae548d3Szrj     }
127*fae548d3Szrj 
128*fae548d3Szrj   Input_merge_entry entry;
129*fae548d3Szrj   entry.input_offset = input_offset;
130*fae548d3Szrj   entry.length = length;
131*fae548d3Szrj   entry.output_offset = output_offset;
132*fae548d3Szrj   this->entries.push_back(entry);
133*fae548d3Szrj }
134*fae548d3Szrj 
135*fae548d3Szrj // Get the output offset for an input address.
136*fae548d3Szrj 
137*fae548d3Szrj bool
get_output_offset(unsigned int shndx,section_offset_type input_offset,section_offset_type * output_offset)138*fae548d3Szrj Object_merge_map::get_output_offset(unsigned int shndx,
139*fae548d3Szrj 				    section_offset_type input_offset,
140*fae548d3Szrj 				    section_offset_type* output_offset)
141*fae548d3Szrj {
142*fae548d3Szrj   Input_merge_map* map = this->get_input_merge_map(shndx);
143*fae548d3Szrj   if (map == NULL)
144*fae548d3Szrj     return false;
145*fae548d3Szrj 
146*fae548d3Szrj   if (!map->sorted)
147*fae548d3Szrj     {
148*fae548d3Szrj       std::sort(map->entries.begin(), map->entries.end(),
149*fae548d3Szrj 		Input_merge_compare());
150*fae548d3Szrj       map->sorted = true;
151*fae548d3Szrj     }
152*fae548d3Szrj 
153*fae548d3Szrj   Input_merge_entry entry;
154*fae548d3Szrj   entry.input_offset = input_offset;
155*fae548d3Szrj   std::vector<Input_merge_entry>::const_iterator p =
156*fae548d3Szrj     std::upper_bound(map->entries.begin(), map->entries.end(),
157*fae548d3Szrj 		     entry, Input_merge_compare());
158*fae548d3Szrj   if (p == map->entries.begin())
159*fae548d3Szrj     return false;
160*fae548d3Szrj   --p;
161*fae548d3Szrj   gold_assert(p->input_offset <= input_offset);
162*fae548d3Szrj 
163*fae548d3Szrj   if (input_offset - p->input_offset
164*fae548d3Szrj       >= static_cast<section_offset_type>(p->length))
165*fae548d3Szrj     return false;
166*fae548d3Szrj 
167*fae548d3Szrj   *output_offset = p->output_offset;
168*fae548d3Szrj   if (*output_offset != -1)
169*fae548d3Szrj     *output_offset += (input_offset - p->input_offset);
170*fae548d3Szrj   return true;
171*fae548d3Szrj }
172*fae548d3Szrj 
173*fae548d3Szrj // Return whether this is the merge map for section SHNDX.
174*fae548d3Szrj 
175*fae548d3Szrj const Output_section_data*
find_merge_section(unsigned int shndx) const176*fae548d3Szrj Object_merge_map::find_merge_section(unsigned int shndx) const {
177*fae548d3Szrj   const Object_merge_map::Input_merge_map* map =
178*fae548d3Szrj     this->get_input_merge_map(shndx);
179*fae548d3Szrj   if (map == NULL)
180*fae548d3Szrj     return NULL;
181*fae548d3Szrj   return map->output_data;
182*fae548d3Szrj }
183*fae548d3Szrj 
184*fae548d3Szrj // Initialize a mapping from input offsets to output addresses.
185*fae548d3Szrj 
186*fae548d3Szrj template<int size>
187*fae548d3Szrj void
initialize_input_to_output_map(unsigned int shndx,typename elfcpp::Elf_types<size>::Elf_Addr starting_address,Unordered_map<section_offset_type,typename elfcpp::Elf_types<size>::Elf_Addr> * initialize_map)188*fae548d3Szrj Object_merge_map::initialize_input_to_output_map(
189*fae548d3Szrj     unsigned int shndx,
190*fae548d3Szrj     typename elfcpp::Elf_types<size>::Elf_Addr starting_address,
191*fae548d3Szrj     Unordered_map<section_offset_type,
192*fae548d3Szrj 		  typename elfcpp::Elf_types<size>::Elf_Addr>* initialize_map)
193*fae548d3Szrj {
194*fae548d3Szrj   Input_merge_map* map = this->get_input_merge_map(shndx);
195*fae548d3Szrj   gold_assert(map != NULL);
196*fae548d3Szrj 
197*fae548d3Szrj   gold_assert(initialize_map->empty());
198*fae548d3Szrj   // We know how many entries we are going to add.
199*fae548d3Szrj   // reserve_unordered_map takes an expected count of buckets, not a
200*fae548d3Szrj   // count of elements, so double it to try to reduce collisions.
201*fae548d3Szrj   reserve_unordered_map(initialize_map, map->entries.size() * 2);
202*fae548d3Szrj 
203*fae548d3Szrj   for (Input_merge_map::Entries::const_iterator p = map->entries.begin();
204*fae548d3Szrj        p != map->entries.end();
205*fae548d3Szrj        ++p)
206*fae548d3Szrj     {
207*fae548d3Szrj       section_offset_type output_offset = p->output_offset;
208*fae548d3Szrj       if (output_offset != -1)
209*fae548d3Szrj 	output_offset += starting_address;
210*fae548d3Szrj       else
211*fae548d3Szrj 	{
212*fae548d3Szrj 	  // If we see a relocation against an address we have chosen
213*fae548d3Szrj 	  // to discard, we relocate to zero.  FIXME: We could also
214*fae548d3Szrj 	  // issue a warning in this case; that would require
215*fae548d3Szrj 	  // reporting this somehow and checking it in the routines in
216*fae548d3Szrj 	  // reloc.h.
217*fae548d3Szrj 	  output_offset = 0;
218*fae548d3Szrj 	}
219*fae548d3Szrj       initialize_map->insert(std::make_pair(p->input_offset, output_offset));
220*fae548d3Szrj     }
221*fae548d3Szrj }
222*fae548d3Szrj 
223*fae548d3Szrj // Class Output_merge_base.
224*fae548d3Szrj 
225*fae548d3Szrj // Return the output offset for an input offset.  The input address is
226*fae548d3Szrj // at offset OFFSET in section SHNDX in OBJECT.  If we know the
227*fae548d3Szrj // offset, set *POUTPUT and return true.  Otherwise return false.
228*fae548d3Szrj 
229*fae548d3Szrj bool
do_output_offset(const Relobj * object,unsigned int shndx,section_offset_type offset,section_offset_type * poutput) const230*fae548d3Szrj Output_merge_base::do_output_offset(const Relobj* object,
231*fae548d3Szrj 				    unsigned int shndx,
232*fae548d3Szrj 				    section_offset_type offset,
233*fae548d3Szrj 				    section_offset_type* poutput) const
234*fae548d3Szrj {
235*fae548d3Szrj   return object->merge_output_offset(shndx, offset, poutput);
236*fae548d3Szrj }
237*fae548d3Szrj 
238*fae548d3Szrj // Record a merged input section for script processing.
239*fae548d3Szrj 
240*fae548d3Szrj void
record_input_section(Relobj * relobj,unsigned int shndx)241*fae548d3Szrj Output_merge_base::record_input_section(Relobj* relobj, unsigned int shndx)
242*fae548d3Szrj {
243*fae548d3Szrj   gold_assert(this->keeps_input_sections_ && relobj != NULL);
244*fae548d3Szrj   // If this is the first input section, record it.  We need do this because
245*fae548d3Szrj   // this->input_sections_ is unordered.
246*fae548d3Szrj   if (this->first_relobj_ == NULL)
247*fae548d3Szrj     {
248*fae548d3Szrj       this->first_relobj_ = relobj;
249*fae548d3Szrj       this->first_shndx_ = shndx;
250*fae548d3Szrj     }
251*fae548d3Szrj 
252*fae548d3Szrj   std::pair<Input_sections::iterator, bool> result =
253*fae548d3Szrj     this->input_sections_.insert(Section_id(relobj, shndx));
254*fae548d3Szrj   // We should insert a merge section once only.
255*fae548d3Szrj   gold_assert(result.second);
256*fae548d3Szrj }
257*fae548d3Szrj 
258*fae548d3Szrj // Class Output_merge_data.
259*fae548d3Szrj 
260*fae548d3Szrj // Compute the hash code for a fixed-size constant.
261*fae548d3Szrj 
262*fae548d3Szrj size_t
operator ()(Merge_data_key k) const263*fae548d3Szrj Output_merge_data::Merge_data_hash::operator()(Merge_data_key k) const
264*fae548d3Szrj {
265*fae548d3Szrj   const unsigned char* p = this->pomd_->constant(k);
266*fae548d3Szrj   section_size_type entsize =
267*fae548d3Szrj     convert_to_section_size_type(this->pomd_->entsize());
268*fae548d3Szrj 
269*fae548d3Szrj   // Fowler/Noll/Vo (FNV) hash (type FNV-1a).
270*fae548d3Szrj   if (sizeof(size_t) == 8)
271*fae548d3Szrj     {
272*fae548d3Szrj       size_t result = static_cast<size_t>(14695981039346656037ULL);
273*fae548d3Szrj       for (section_size_type i = 0; i < entsize; ++i)
274*fae548d3Szrj 	{
275*fae548d3Szrj 	  result &= (size_t) *p++;
276*fae548d3Szrj 	  result *= 1099511628211ULL;
277*fae548d3Szrj 	}
278*fae548d3Szrj       return result;
279*fae548d3Szrj     }
280*fae548d3Szrj   else
281*fae548d3Szrj     {
282*fae548d3Szrj       size_t result = 2166136261UL;
283*fae548d3Szrj       for (section_size_type i = 0; i < entsize; ++i)
284*fae548d3Szrj 	{
285*fae548d3Szrj 	  result ^= (size_t) *p++;
286*fae548d3Szrj 	  result *= 16777619UL;
287*fae548d3Szrj 	}
288*fae548d3Szrj       return result;
289*fae548d3Szrj     }
290*fae548d3Szrj }
291*fae548d3Szrj 
292*fae548d3Szrj // Return whether one hash table key equals another.
293*fae548d3Szrj 
294*fae548d3Szrj bool
operator ()(Merge_data_key k1,Merge_data_key k2) const295*fae548d3Szrj Output_merge_data::Merge_data_eq::operator()(Merge_data_key k1,
296*fae548d3Szrj 					     Merge_data_key k2) const
297*fae548d3Szrj {
298*fae548d3Szrj   const unsigned char* p1 = this->pomd_->constant(k1);
299*fae548d3Szrj   const unsigned char* p2 = this->pomd_->constant(k2);
300*fae548d3Szrj   return memcmp(p1, p2, this->pomd_->entsize()) == 0;
301*fae548d3Szrj }
302*fae548d3Szrj 
303*fae548d3Szrj // Add a constant to the end of the section contents.
304*fae548d3Szrj 
305*fae548d3Szrj void
add_constant(const unsigned char * p)306*fae548d3Szrj Output_merge_data::add_constant(const unsigned char* p)
307*fae548d3Szrj {
308*fae548d3Szrj   section_size_type entsize = convert_to_section_size_type(this->entsize());
309*fae548d3Szrj   section_size_type addralign =
310*fae548d3Szrj     convert_to_section_size_type(this->addralign());
311*fae548d3Szrj   section_size_type addsize = std::max(entsize, addralign);
312*fae548d3Szrj   if (this->len_ + addsize > this->alc_)
313*fae548d3Szrj     {
314*fae548d3Szrj       if (this->alc_ == 0)
315*fae548d3Szrj 	this->alc_ = 128 * addsize;
316*fae548d3Szrj       else
317*fae548d3Szrj 	this->alc_ *= 2;
318*fae548d3Szrj       this->p_ = static_cast<unsigned char*>(realloc(this->p_, this->alc_));
319*fae548d3Szrj       if (this->p_ == NULL)
320*fae548d3Szrj 	gold_nomem();
321*fae548d3Szrj     }
322*fae548d3Szrj 
323*fae548d3Szrj   memcpy(this->p_ + this->len_, p, entsize);
324*fae548d3Szrj   if (addsize > entsize)
325*fae548d3Szrj     memset(this->p_ + this->len_ + entsize, 0, addsize - entsize);
326*fae548d3Szrj   this->len_ += addsize;
327*fae548d3Szrj }
328*fae548d3Szrj 
329*fae548d3Szrj // Add the input section SHNDX in OBJECT to a merged output section
330*fae548d3Szrj // which holds fixed length constants.  Return whether we were able to
331*fae548d3Szrj // handle the section; if not, it will be linked as usual without
332*fae548d3Szrj // constant merging.
333*fae548d3Szrj 
334*fae548d3Szrj bool
do_add_input_section(Relobj * object,unsigned int shndx)335*fae548d3Szrj Output_merge_data::do_add_input_section(Relobj* object, unsigned int shndx)
336*fae548d3Szrj {
337*fae548d3Szrj   section_size_type len;
338*fae548d3Szrj   bool is_new;
339*fae548d3Szrj   const unsigned char* p = object->decompressed_section_contents(shndx, &len,
340*fae548d3Szrj 								 &is_new);
341*fae548d3Szrj 
342*fae548d3Szrj   section_size_type entsize = convert_to_section_size_type(this->entsize());
343*fae548d3Szrj 
344*fae548d3Szrj   if (len % entsize != 0)
345*fae548d3Szrj     {
346*fae548d3Szrj       if (is_new)
347*fae548d3Szrj 	delete[] p;
348*fae548d3Szrj       return false;
349*fae548d3Szrj     }
350*fae548d3Szrj 
351*fae548d3Szrj   this->input_count_ += len / entsize;
352*fae548d3Szrj 
353*fae548d3Szrj   Object_merge_map* merge_map = object->get_or_create_merge_map();
354*fae548d3Szrj   Object_merge_map::Input_merge_map* input_merge_map =
355*fae548d3Szrj     merge_map->get_or_make_input_merge_map(this, shndx);
356*fae548d3Szrj 
357*fae548d3Szrj   for (section_size_type i = 0; i < len; i += entsize, p += entsize)
358*fae548d3Szrj     {
359*fae548d3Szrj       // Add the constant to the section contents.  If we find that it
360*fae548d3Szrj       // is already in the hash table, we will remove it again.
361*fae548d3Szrj       Merge_data_key k = this->len_;
362*fae548d3Szrj       this->add_constant(p);
363*fae548d3Szrj 
364*fae548d3Szrj       std::pair<Merge_data_hashtable::iterator, bool> ins =
365*fae548d3Szrj 	this->hashtable_.insert(k);
366*fae548d3Szrj 
367*fae548d3Szrj       if (!ins.second)
368*fae548d3Szrj 	{
369*fae548d3Szrj 	  // Key was already present.  Remove the copy we just added.
370*fae548d3Szrj 	  this->len_ -= entsize;
371*fae548d3Szrj 	  k = *ins.first;
372*fae548d3Szrj 	}
373*fae548d3Szrj 
374*fae548d3Szrj       // Record the offset of this constant in the output section.
375*fae548d3Szrj       input_merge_map->add_mapping(i, entsize, k);
376*fae548d3Szrj     }
377*fae548d3Szrj 
378*fae548d3Szrj   // For script processing, we keep the input sections.
379*fae548d3Szrj   if (this->keeps_input_sections())
380*fae548d3Szrj     record_input_section(object, shndx);
381*fae548d3Szrj 
382*fae548d3Szrj   if (is_new)
383*fae548d3Szrj     delete[] p;
384*fae548d3Szrj 
385*fae548d3Szrj   return true;
386*fae548d3Szrj }
387*fae548d3Szrj 
388*fae548d3Szrj // Set the final data size in a merged output section with fixed size
389*fae548d3Szrj // constants.
390*fae548d3Szrj 
391*fae548d3Szrj void
set_final_data_size()392*fae548d3Szrj Output_merge_data::set_final_data_size()
393*fae548d3Szrj {
394*fae548d3Szrj   // Release the memory we don't need.
395*fae548d3Szrj   this->p_ = static_cast<unsigned char*>(realloc(this->p_, this->len_));
396*fae548d3Szrj   // An Output_merge_data object may be empty and realloc is allowed
397*fae548d3Szrj   // to return a NULL pointer in this case.  An Output_merge_data is empty
398*fae548d3Szrj   // if all its input sections have sizes that are not multiples of entsize.
399*fae548d3Szrj   gold_assert(this->p_ != NULL || this->len_ == 0);
400*fae548d3Szrj   this->set_data_size(this->len_);
401*fae548d3Szrj }
402*fae548d3Szrj 
403*fae548d3Szrj // Write the data of a merged output section with fixed size constants
404*fae548d3Szrj // to the file.
405*fae548d3Szrj 
406*fae548d3Szrj void
do_write(Output_file * of)407*fae548d3Szrj Output_merge_data::do_write(Output_file* of)
408*fae548d3Szrj {
409*fae548d3Szrj   of->write(this->offset(), this->p_, this->len_);
410*fae548d3Szrj }
411*fae548d3Szrj 
412*fae548d3Szrj // Write the data to a buffer.
413*fae548d3Szrj 
414*fae548d3Szrj void
do_write_to_buffer(unsigned char * buffer)415*fae548d3Szrj Output_merge_data::do_write_to_buffer(unsigned char* buffer)
416*fae548d3Szrj {
417*fae548d3Szrj   memcpy(buffer, this->p_, this->len_);
418*fae548d3Szrj }
419*fae548d3Szrj 
420*fae548d3Szrj // Print merge stats to stderr.
421*fae548d3Szrj 
422*fae548d3Szrj void
do_print_merge_stats(const char * section_name)423*fae548d3Szrj Output_merge_data::do_print_merge_stats(const char* section_name)
424*fae548d3Szrj {
425*fae548d3Szrj   fprintf(stderr,
426*fae548d3Szrj 	  _("%s: %s merged constants size: %lu; input: %zu; output: %zu\n"),
427*fae548d3Szrj 	  program_name, section_name,
428*fae548d3Szrj 	  static_cast<unsigned long>(this->entsize()),
429*fae548d3Szrj 	  this->input_count_, this->hashtable_.size());
430*fae548d3Szrj }
431*fae548d3Szrj 
432*fae548d3Szrj // Class Output_merge_string.
433*fae548d3Szrj 
434*fae548d3Szrj // Add an input section to a merged string section.
435*fae548d3Szrj 
436*fae548d3Szrj template<typename Char_type>
437*fae548d3Szrj bool
do_add_input_section(Relobj * object,unsigned int shndx)438*fae548d3Szrj Output_merge_string<Char_type>::do_add_input_section(Relobj* object,
439*fae548d3Szrj 						     unsigned int shndx)
440*fae548d3Szrj {
441*fae548d3Szrj   section_size_type sec_len;
442*fae548d3Szrj   bool is_new;
443*fae548d3Szrj   uint64_t addralign = this->addralign();
444*fae548d3Szrj   const unsigned char* pdata = object->decompressed_section_contents(shndx,
445*fae548d3Szrj 								     &sec_len,
446*fae548d3Szrj 								     &is_new,
447*fae548d3Szrj 								     &addralign);
448*fae548d3Szrj 
449*fae548d3Szrj   const Char_type* p = reinterpret_cast<const Char_type*>(pdata);
450*fae548d3Szrj   const Char_type* pend = p + sec_len / sizeof(Char_type);
451*fae548d3Szrj   const Char_type* pend0 = pend;
452*fae548d3Szrj 
453*fae548d3Szrj   if (sec_len % sizeof(Char_type) != 0)
454*fae548d3Szrj     {
455*fae548d3Szrj       object->error(_("mergeable string section length not multiple of "
456*fae548d3Szrj 		      "character size"));
457*fae548d3Szrj       if (is_new)
458*fae548d3Szrj 	delete[] pdata;
459*fae548d3Szrj       return false;
460*fae548d3Szrj     }
461*fae548d3Szrj 
462*fae548d3Szrj   if (pend[-1] != 0)
463*fae548d3Szrj     {
464*fae548d3Szrj       gold_warning(_("%s: last entry in mergeable string section '%s' "
465*fae548d3Szrj 		     "not null terminated"),
466*fae548d3Szrj 		   object->name().c_str(),
467*fae548d3Szrj 		   object->section_name(shndx).c_str());
468*fae548d3Szrj       // Find the end of the last NULL-terminated string in the buffer.
469*fae548d3Szrj       while (pend0 > p && pend0[-1] != 0)
470*fae548d3Szrj 	--pend0;
471*fae548d3Szrj     }
472*fae548d3Szrj 
473*fae548d3Szrj   Merged_strings_list* merged_strings_list =
474*fae548d3Szrj       new Merged_strings_list(object, shndx);
475*fae548d3Szrj   this->merged_strings_lists_.push_back(merged_strings_list);
476*fae548d3Szrj   Merged_strings& merged_strings = merged_strings_list->merged_strings;
477*fae548d3Szrj 
478*fae548d3Szrj   // Count the number of non-null strings in the section and size the list.
479*fae548d3Szrj   size_t count = 0;
480*fae548d3Szrj   const Char_type* pt = p;
481*fae548d3Szrj   while (pt < pend0)
482*fae548d3Szrj     {
483*fae548d3Szrj       size_t len = string_length(pt);
484*fae548d3Szrj       if (len != 0)
485*fae548d3Szrj 	++count;
486*fae548d3Szrj       pt += len + 1;
487*fae548d3Szrj     }
488*fae548d3Szrj   if (pend0 < pend)
489*fae548d3Szrj     ++count;
490*fae548d3Szrj   merged_strings.reserve(count + 1);
491*fae548d3Szrj 
492*fae548d3Szrj   // The index I is in bytes, not characters.
493*fae548d3Szrj   section_size_type i = 0;
494*fae548d3Szrj 
495*fae548d3Szrj   // We assume here that the beginning of the section is correctly
496*fae548d3Szrj   // aligned, so each string within the section must retain the same
497*fae548d3Szrj   // modulo.
498*fae548d3Szrj   uintptr_t init_align_modulo = (reinterpret_cast<uintptr_t>(pdata)
499*fae548d3Szrj 				 & (addralign - 1));
500*fae548d3Szrj   bool has_misaligned_strings = false;
501*fae548d3Szrj 
502*fae548d3Szrj   while (p < pend)
503*fae548d3Szrj     {
504*fae548d3Szrj       size_t len = p < pend0 ? string_length(p) : pend - p;
505*fae548d3Szrj 
506*fae548d3Szrj       // Within merge input section each string must be aligned.
507*fae548d3Szrj       if (len != 0
508*fae548d3Szrj 	  && ((reinterpret_cast<uintptr_t>(p) & (addralign - 1))
509*fae548d3Szrj 	      != init_align_modulo))
510*fae548d3Szrj 	  has_misaligned_strings = true;
511*fae548d3Szrj 
512*fae548d3Szrj       Stringpool::Key key;
513*fae548d3Szrj       this->stringpool_.add_with_length(p, len, true, &key);
514*fae548d3Szrj 
515*fae548d3Szrj       merged_strings.push_back(Merged_string(i, key));
516*fae548d3Szrj       p += len + 1;
517*fae548d3Szrj       i += (len + 1) * sizeof(Char_type);
518*fae548d3Szrj     }
519*fae548d3Szrj 
520*fae548d3Szrj   // Record the last offset in the input section so that we can
521*fae548d3Szrj   // compute the length of the last string.
522*fae548d3Szrj   merged_strings.push_back(Merged_string(i, 0));
523*fae548d3Szrj 
524*fae548d3Szrj   this->input_count_ += count;
525*fae548d3Szrj   this->input_size_ += i;
526*fae548d3Szrj 
527*fae548d3Szrj   if (has_misaligned_strings)
528*fae548d3Szrj     gold_warning(_("%s: section %s contains incorrectly aligned strings;"
529*fae548d3Szrj 		   " the alignment of those strings won't be preserved"),
530*fae548d3Szrj 		 object->name().c_str(),
531*fae548d3Szrj 		 object->section_name(shndx).c_str());
532*fae548d3Szrj 
533*fae548d3Szrj   // For script processing, we keep the input sections.
534*fae548d3Szrj   if (this->keeps_input_sections())
535*fae548d3Szrj     record_input_section(object, shndx);
536*fae548d3Szrj 
537*fae548d3Szrj   if (is_new)
538*fae548d3Szrj     delete[] pdata;
539*fae548d3Szrj 
540*fae548d3Szrj   return true;
541*fae548d3Szrj }
542*fae548d3Szrj 
543*fae548d3Szrj // Finalize the mappings from the input sections to the output
544*fae548d3Szrj // section, and return the final data size.
545*fae548d3Szrj 
546*fae548d3Szrj template<typename Char_type>
547*fae548d3Szrj section_size_type
finalize_merged_data()548*fae548d3Szrj Output_merge_string<Char_type>::finalize_merged_data()
549*fae548d3Szrj {
550*fae548d3Szrj   this->stringpool_.set_string_offsets();
551*fae548d3Szrj 
552*fae548d3Szrj   for (typename Merged_strings_lists::const_iterator l =
553*fae548d3Szrj 	 this->merged_strings_lists_.begin();
554*fae548d3Szrj        l != this->merged_strings_lists_.end();
555*fae548d3Szrj        ++l)
556*fae548d3Szrj     {
557*fae548d3Szrj       section_offset_type last_input_offset = 0;
558*fae548d3Szrj       section_offset_type last_output_offset = 0;
559*fae548d3Szrj       Relobj *object = (*l)->object;
560*fae548d3Szrj       Object_merge_map* merge_map = object->get_or_create_merge_map();
561*fae548d3Szrj       Object_merge_map::Input_merge_map* input_merge_map =
562*fae548d3Szrj         merge_map->get_or_make_input_merge_map(this, (*l)->shndx);
563*fae548d3Szrj 
564*fae548d3Szrj       for (typename Merged_strings::const_iterator p =
565*fae548d3Szrj 	     (*l)->merged_strings.begin();
566*fae548d3Szrj 	   p != (*l)->merged_strings.end();
567*fae548d3Szrj 	   ++p)
568*fae548d3Szrj 	{
569*fae548d3Szrj 	  section_size_type length = p->offset - last_input_offset;
570*fae548d3Szrj 	  if (length > 0)
571*fae548d3Szrj 	    input_merge_map->add_mapping(last_input_offset, length,
572*fae548d3Szrj                                          last_output_offset);
573*fae548d3Szrj 	  last_input_offset = p->offset;
574*fae548d3Szrj 	  if (p->stringpool_key != 0)
575*fae548d3Szrj 	    last_output_offset =
576*fae548d3Szrj 	        this->stringpool_.get_offset_from_key(p->stringpool_key);
577*fae548d3Szrj 	}
578*fae548d3Szrj       delete *l;
579*fae548d3Szrj     }
580*fae548d3Szrj 
581*fae548d3Szrj   // Save some memory.  This also ensures that this function will work
582*fae548d3Szrj   // if called twice, as may happen if Layout::set_segment_offsets
583*fae548d3Szrj   // finds a better alignment.
584*fae548d3Szrj   this->merged_strings_lists_.clear();
585*fae548d3Szrj 
586*fae548d3Szrj   return this->stringpool_.get_strtab_size();
587*fae548d3Szrj }
588*fae548d3Szrj 
589*fae548d3Szrj template<typename Char_type>
590*fae548d3Szrj void
set_final_data_size()591*fae548d3Szrj Output_merge_string<Char_type>::set_final_data_size()
592*fae548d3Szrj {
593*fae548d3Szrj   const off_t final_data_size = this->finalize_merged_data();
594*fae548d3Szrj   this->set_data_size(final_data_size);
595*fae548d3Szrj }
596*fae548d3Szrj 
597*fae548d3Szrj // Write out a merged string section.
598*fae548d3Szrj 
599*fae548d3Szrj template<typename Char_type>
600*fae548d3Szrj void
do_write(Output_file * of)601*fae548d3Szrj Output_merge_string<Char_type>::do_write(Output_file* of)
602*fae548d3Szrj {
603*fae548d3Szrj   this->stringpool_.write(of, this->offset());
604*fae548d3Szrj }
605*fae548d3Szrj 
606*fae548d3Szrj // Write a merged string section to a buffer.
607*fae548d3Szrj 
608*fae548d3Szrj template<typename Char_type>
609*fae548d3Szrj void
do_write_to_buffer(unsigned char * buffer)610*fae548d3Szrj Output_merge_string<Char_type>::do_write_to_buffer(unsigned char* buffer)
611*fae548d3Szrj {
612*fae548d3Szrj   this->stringpool_.write_to_buffer(buffer, this->data_size());
613*fae548d3Szrj }
614*fae548d3Szrj 
615*fae548d3Szrj // Return the name of the types of string to use with
616*fae548d3Szrj // do_print_merge_stats.
617*fae548d3Szrj 
618*fae548d3Szrj template<typename Char_type>
619*fae548d3Szrj const char*
string_name()620*fae548d3Szrj Output_merge_string<Char_type>::string_name()
621*fae548d3Szrj {
622*fae548d3Szrj   gold_unreachable();
623*fae548d3Szrj   return NULL;
624*fae548d3Szrj }
625*fae548d3Szrj 
626*fae548d3Szrj template<>
627*fae548d3Szrj const char*
string_name()628*fae548d3Szrj Output_merge_string<char>::string_name()
629*fae548d3Szrj {
630*fae548d3Szrj   return "strings";
631*fae548d3Szrj }
632*fae548d3Szrj 
633*fae548d3Szrj template<>
634*fae548d3Szrj const char*
string_name()635*fae548d3Szrj Output_merge_string<uint16_t>::string_name()
636*fae548d3Szrj {
637*fae548d3Szrj   return "16-bit strings";
638*fae548d3Szrj }
639*fae548d3Szrj 
640*fae548d3Szrj template<>
641*fae548d3Szrj const char*
string_name()642*fae548d3Szrj Output_merge_string<uint32_t>::string_name()
643*fae548d3Szrj {
644*fae548d3Szrj   return "32-bit strings";
645*fae548d3Szrj }
646*fae548d3Szrj 
647*fae548d3Szrj // Print merge stats to stderr.
648*fae548d3Szrj 
649*fae548d3Szrj template<typename Char_type>
650*fae548d3Szrj void
do_print_merge_stats(const char * section_name)651*fae548d3Szrj Output_merge_string<Char_type>::do_print_merge_stats(const char* section_name)
652*fae548d3Szrj {
653*fae548d3Szrj   char buf[200];
654*fae548d3Szrj   snprintf(buf, sizeof buf, "%s merged %s", section_name, this->string_name());
655*fae548d3Szrj   fprintf(stderr, _("%s: %s input bytes: %zu\n"),
656*fae548d3Szrj 	  program_name, buf, this->input_size_);
657*fae548d3Szrj   fprintf(stderr, _("%s: %s input strings: %zu\n"),
658*fae548d3Szrj 	  program_name, buf, this->input_count_);
659*fae548d3Szrj   this->stringpool_.print_stats(buf);
660*fae548d3Szrj }
661*fae548d3Szrj 
662*fae548d3Szrj // Instantiate the templates we need.
663*fae548d3Szrj 
664*fae548d3Szrj template
665*fae548d3Szrj class Output_merge_string<char>;
666*fae548d3Szrj 
667*fae548d3Szrj template
668*fae548d3Szrj class Output_merge_string<uint16_t>;
669*fae548d3Szrj 
670*fae548d3Szrj template
671*fae548d3Szrj class Output_merge_string<uint32_t>;
672*fae548d3Szrj 
673*fae548d3Szrj #if defined(HAVE_TARGET_32_LITTLE) || defined(HAVE_TARGET_32_BIG)
674*fae548d3Szrj template
675*fae548d3Szrj void
676*fae548d3Szrj Object_merge_map::initialize_input_to_output_map<32>(
677*fae548d3Szrj     unsigned int shndx,
678*fae548d3Szrj     elfcpp::Elf_types<32>::Elf_Addr starting_address,
679*fae548d3Szrj     Unordered_map<section_offset_type, elfcpp::Elf_types<32>::Elf_Addr>*);
680*fae548d3Szrj #endif
681*fae548d3Szrj 
682*fae548d3Szrj #if defined(HAVE_TARGET_64_LITTLE) || defined(HAVE_TARGET_64_BIG)
683*fae548d3Szrj template
684*fae548d3Szrj void
685*fae548d3Szrj Object_merge_map::initialize_input_to_output_map<64>(
686*fae548d3Szrj     unsigned int shndx,
687*fae548d3Szrj     elfcpp::Elf_types<64>::Elf_Addr starting_address,
688*fae548d3Szrj     Unordered_map<section_offset_type, elfcpp::Elf_types<64>::Elf_Addr>*);
689*fae548d3Szrj #endif
690*fae548d3Szrj 
691*fae548d3Szrj } // End namespace gold.
692