mirror of
https://review.haiku-os.org/buildtools
synced 2024-11-23 07:18:49 +01:00
624 lines
17 KiB
C++
624 lines
17 KiB
C++
// fileread.h -- read files for gold -*- C++ -*-
|
|
|
|
// Copyright (C) 2006-2023 Free Software Foundation, Inc.
|
|
// Written by Ian Lance Taylor <iant@google.com>.
|
|
|
|
// This file is part of gold.
|
|
|
|
// This program is free software; you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation; either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License for more details.
|
|
|
|
// You should have received a copy of the GNU General Public License
|
|
// along with this program; if not, write to the Free Software
|
|
// Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston,
|
|
// MA 02110-1301, USA.
|
|
|
|
// Classes used to read data from binary input files.
|
|
|
|
#ifndef GOLD_FILEREAD_H
|
|
#define GOLD_FILEREAD_H
|
|
|
|
#include <list>
|
|
#include <map>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include "token.h"
|
|
|
|
namespace gold
|
|
{
|
|
|
|
// Since not all system supports stat.st_mtim and struct timespec,
|
|
// we define our own structure and fill the nanoseconds if we can.
|
|
|
|
struct Timespec
|
|
{
|
|
Timespec()
|
|
: seconds(0), nanoseconds(0)
|
|
{ }
|
|
|
|
Timespec(time_t a_seconds, int a_nanoseconds)
|
|
: seconds(a_seconds), nanoseconds(a_nanoseconds)
|
|
{ }
|
|
|
|
time_t seconds;
|
|
int nanoseconds;
|
|
};
|
|
|
|
// Get the last modified time of an unopened file. Returns false if the
|
|
// file does not exist.
|
|
|
|
bool
|
|
get_mtime(const char* filename, Timespec* mtime);
|
|
|
|
class Position_dependent_options;
|
|
class Input_file_argument;
|
|
class Dirsearch;
|
|
class File_view;
|
|
|
|
// File_read manages a file descriptor and mappings for a file we are
|
|
// reading.
|
|
|
|
class File_read
|
|
{
|
|
public:
|
|
File_read()
|
|
: name_(), descriptor_(-1), is_descriptor_opened_(false), object_count_(0),
|
|
size_(0), token_(false), views_(), saved_views_(), mapped_bytes_(0),
|
|
released_(true), whole_file_view_(NULL)
|
|
{ }
|
|
|
|
~File_read();
|
|
|
|
// Open a file.
|
|
bool
|
|
open(const Task*, const std::string& name);
|
|
|
|
// Pretend to open the file, but provide the file contents. No
|
|
// actual file system activity will occur. This is used for
|
|
// testing.
|
|
bool
|
|
open(const Task*, const std::string& name, const unsigned char* contents,
|
|
off_t size);
|
|
|
|
// Return the file name.
|
|
const std::string&
|
|
filename() const
|
|
{ return this->name_; }
|
|
|
|
// Add an object associated with a file.
|
|
void
|
|
add_object()
|
|
{ ++this->object_count_; }
|
|
|
|
// Remove an object associated with a file.
|
|
void
|
|
remove_object()
|
|
{ --this->object_count_; }
|
|
|
|
// Lock the file for exclusive access within a particular Task::run
|
|
// execution. This routine may only be called when the workqueue
|
|
// lock is held.
|
|
void
|
|
lock(const Task* t);
|
|
|
|
// Unlock the file.
|
|
void
|
|
unlock(const Task* t);
|
|
|
|
// Test whether the object is locked.
|
|
bool
|
|
is_locked() const;
|
|
|
|
// Return the token, so that the task can be queued.
|
|
Task_token*
|
|
token()
|
|
{ return &this->token_; }
|
|
|
|
// Release the file. This indicates that we aren't going to do
|
|
// anything further with it until it is unlocked. This is used
|
|
// because a Task which locks the file never calls either lock or
|
|
// unlock; it just locks the token. The basic rule is that a Task
|
|
// which locks a file via the Task::locks interface must explicitly
|
|
// call release() when it is done. This is not necessary for code
|
|
// which calls unlock() on the file.
|
|
void
|
|
release();
|
|
|
|
// Return the size of the file.
|
|
off_t
|
|
filesize() const
|
|
{ return this->size_; }
|
|
|
|
// Return a view into the file starting at file offset START for
|
|
// SIZE bytes. OFFSET is the offset into the input file for the
|
|
// file we are reading; this is zero for a normal object file,
|
|
// non-zero for an object file in an archive. ALIGNED is true if
|
|
// the data must be naturally aligned (i.e., aligned to the size
|
|
// of a target word); this only matters when OFFSET is not zero.
|
|
// The pointer will remain valid until the File_read is unlocked.
|
|
// It is an error if we can not read enough data from the file.
|
|
// The CACHE parameter is a hint as to whether it will be useful
|
|
// to cache this data for later accesses--i.e., later calls to
|
|
// get_view, read, or get_lasting_view which retrieve the same
|
|
// data.
|
|
const unsigned char*
|
|
get_view(off_t offset, off_t start, section_size_type size, bool aligned,
|
|
bool cache);
|
|
|
|
// Read data from the file into the buffer P starting at file offset
|
|
// START for SIZE bytes.
|
|
void
|
|
read(off_t start, section_size_type size, void* p);
|
|
|
|
// Return a lasting view into the file starting at file offset START
|
|
// for SIZE bytes. This is allocated with new, and the caller is
|
|
// responsible for deleting it when done. The data associated with
|
|
// this view will remain valid until the view is deleted. It is an
|
|
// error if we can not read enough data from the file. The OFFSET,
|
|
// ALIGNED and CACHE parameters are as in get_view.
|
|
File_view*
|
|
get_lasting_view(off_t offset, off_t start, section_size_type size,
|
|
bool aligned, bool cache);
|
|
|
|
// Mark all views as no longer cached.
|
|
void
|
|
clear_view_cache_marks();
|
|
|
|
// Discard all uncached views. This is normally done by release(),
|
|
// but not for objects in archives. FIXME: This is a complicated
|
|
// interface, and it would be nice to have something more automatic.
|
|
void
|
|
clear_uncached_views()
|
|
{ this->clear_views(CLEAR_VIEWS_ARCHIVE); }
|
|
|
|
// A struct used to do a multiple read.
|
|
struct Read_multiple_entry
|
|
{
|
|
// The file offset of the data to read.
|
|
off_t file_offset;
|
|
// The amount of data to read.
|
|
section_size_type size;
|
|
// The buffer where the data should be placed.
|
|
unsigned char* buffer;
|
|
|
|
Read_multiple_entry(off_t o, section_size_type s, unsigned char* b)
|
|
: file_offset(o), size(s), buffer(b)
|
|
{ }
|
|
};
|
|
|
|
typedef std::vector<Read_multiple_entry> Read_multiple;
|
|
|
|
// Read a bunch of data from the file into various different
|
|
// locations. The vector must be sorted by ascending file_offset.
|
|
// BASE is a base offset to be added to all the offsets in the
|
|
// vector.
|
|
void
|
|
read_multiple(off_t base, const Read_multiple&);
|
|
|
|
// Dump statistical information to stderr.
|
|
static void
|
|
print_stats();
|
|
|
|
// Write the dependency file listing all files read.
|
|
static void
|
|
write_dependency_file(const char* dependency_file_name,
|
|
const char* output_file_name);
|
|
|
|
// Record that a file was read. File_read::open does this.
|
|
static void
|
|
record_file_read(const std::string& name);
|
|
|
|
// Return the open file descriptor (for plugins).
|
|
int
|
|
descriptor()
|
|
{
|
|
this->reopen_descriptor();
|
|
return this->descriptor_;
|
|
}
|
|
|
|
// Return the file last modification time. Calls gold_fatal if the stat
|
|
// system call failed.
|
|
Timespec
|
|
get_mtime();
|
|
|
|
private:
|
|
// Control for what views to clear.
|
|
enum Clear_views_mode
|
|
{
|
|
// Clear uncached views not used by an archive.
|
|
CLEAR_VIEWS_NORMAL,
|
|
// Clear all uncached views (including in an archive).
|
|
CLEAR_VIEWS_ARCHIVE,
|
|
// Clear all views (i.e., we're destroying the file).
|
|
CLEAR_VIEWS_ALL
|
|
};
|
|
|
|
// This class may not be copied.
|
|
File_read(const File_read&);
|
|
File_read& operator=(const File_read&);
|
|
|
|
// Total bytes mapped into memory during the link if --stats.
|
|
static unsigned long long total_mapped_bytes;
|
|
|
|
// Current number of bytes mapped into memory during the link if
|
|
// --stats.
|
|
static unsigned long long current_mapped_bytes;
|
|
|
|
// High water mark of bytes mapped into memory during the link if
|
|
// --stats.
|
|
static unsigned long long maximum_mapped_bytes;
|
|
|
|
// Set of names of all files read.
|
|
static std::vector<std::string> files_read;
|
|
|
|
// A view into the file.
|
|
class View
|
|
{
|
|
public:
|
|
// Specifies how to dispose the data on destruction of the view.
|
|
enum Data_ownership
|
|
{
|
|
// Data owned by File object - nothing done in destructor.
|
|
DATA_NOT_OWNED,
|
|
// Data allocated with new[] and owned by this object - should
|
|
// use delete[].
|
|
DATA_ALLOCATED_ARRAY,
|
|
// Data mmapped and owned by this object - should munmap.
|
|
DATA_MMAPPED
|
|
};
|
|
|
|
View(off_t start, section_size_type size, const unsigned char* data,
|
|
unsigned int byteshift, bool cache, Data_ownership data_ownership)
|
|
: start_(start), size_(size), data_(data), lock_count_(0),
|
|
byteshift_(byteshift), cache_(cache), data_ownership_(data_ownership),
|
|
accessed_(true)
|
|
{ }
|
|
|
|
~View();
|
|
|
|
off_t
|
|
start() const
|
|
{ return this->start_; }
|
|
|
|
section_size_type
|
|
size() const
|
|
{ return this->size_; }
|
|
|
|
const unsigned char*
|
|
data() const
|
|
{ return this->data_; }
|
|
|
|
void
|
|
lock();
|
|
|
|
void
|
|
unlock();
|
|
|
|
bool
|
|
is_locked();
|
|
|
|
unsigned int
|
|
byteshift() const
|
|
{ return this->byteshift_; }
|
|
|
|
void
|
|
set_cache()
|
|
{ this->cache_ = true; }
|
|
|
|
void
|
|
clear_cache()
|
|
{ this->cache_ = false; }
|
|
|
|
bool
|
|
should_cache() const
|
|
{ return this->cache_; }
|
|
|
|
void
|
|
set_accessed()
|
|
{ this->accessed_ = true; }
|
|
|
|
void
|
|
clear_accessed()
|
|
{ this->accessed_= false; }
|
|
|
|
bool
|
|
accessed() const
|
|
{ return this->accessed_; }
|
|
|
|
// Returns TRUE if this view contains permanent data -- e.g., data that
|
|
// was supplied by the owner of the File object.
|
|
bool
|
|
is_permanent_view() const
|
|
{ return this->data_ownership_ == DATA_NOT_OWNED; }
|
|
|
|
private:
|
|
View(const View&);
|
|
View& operator=(const View&);
|
|
|
|
// The file offset of the start of the view.
|
|
off_t start_;
|
|
// The size of the view.
|
|
section_size_type size_;
|
|
// A pointer to the actual bytes.
|
|
const unsigned char* data_;
|
|
// The number of locks on this view.
|
|
int lock_count_;
|
|
// The number of bytes that the view is shifted relative to the
|
|
// underlying file. This is used to align data. This is normally
|
|
// zero, except possibly for an object in an archive.
|
|
unsigned int byteshift_;
|
|
// Whether the view is cached.
|
|
bool cache_;
|
|
// Whether the view is mapped into memory. If not, data_ points
|
|
// to memory allocated using new[].
|
|
Data_ownership data_ownership_;
|
|
// Whether the view has been accessed recently.
|
|
bool accessed_;
|
|
};
|
|
|
|
friend class View;
|
|
friend class File_view;
|
|
|
|
// The type of a mapping from page start and byte shift to views.
|
|
typedef std::map<std::pair<off_t, unsigned int>, View*> Views;
|
|
|
|
// A simple list of Views.
|
|
typedef std::list<View*> Saved_views;
|
|
|
|
// Open the descriptor if necessary.
|
|
void
|
|
reopen_descriptor();
|
|
|
|
// Find a view into the file.
|
|
View*
|
|
find_view(off_t start, section_size_type size, unsigned int byteshift,
|
|
View** vshifted) const;
|
|
|
|
// Read data from the file into a buffer.
|
|
void
|
|
do_read(off_t start, section_size_type size, void* p);
|
|
|
|
// Add a view.
|
|
void
|
|
add_view(View*);
|
|
|
|
// Make a view into the file.
|
|
View*
|
|
make_view(off_t start, section_size_type size, unsigned int byteshift,
|
|
bool cache);
|
|
|
|
// Find or make a view into the file.
|
|
View*
|
|
find_or_make_view(off_t offset, off_t start, section_size_type size,
|
|
bool aligned, bool cache);
|
|
|
|
// Clear the file views.
|
|
void
|
|
clear_views(Clear_views_mode);
|
|
|
|
// The size of a file page for buffering data.
|
|
static const off_t page_size = 8192;
|
|
|
|
// Given a file offset, return the page offset.
|
|
static off_t
|
|
page_offset(off_t file_offset)
|
|
{ return file_offset & ~ (page_size - 1); }
|
|
|
|
// Given a file size, return the size to read integral pages.
|
|
static off_t
|
|
pages(off_t file_size)
|
|
{ return (file_size + (page_size - 1)) & ~ (page_size - 1); }
|
|
|
|
// The maximum number of entries we will pass to ::readv.
|
|
static const size_t max_readv_entries = 128;
|
|
|
|
// Use readv to read data.
|
|
void
|
|
do_readv(off_t base, const Read_multiple&, size_t start, size_t count);
|
|
|
|
// File name.
|
|
std::string name_;
|
|
// File descriptor.
|
|
int descriptor_;
|
|
// Whether we have regained the descriptor after releasing the file.
|
|
bool is_descriptor_opened_;
|
|
// The number of objects associated with this file. This will be
|
|
// more than 1 in the case of an archive.
|
|
int object_count_;
|
|
// File size.
|
|
off_t size_;
|
|
// A token used to lock the file.
|
|
Task_token token_;
|
|
// Buffered views into the file.
|
|
Views views_;
|
|
// List of views which were locked but had to be removed from views_
|
|
// because they were not large enough.
|
|
Saved_views saved_views_;
|
|
// Total amount of space mapped into memory. This is only changed
|
|
// while the file is locked. When we unlock the file, we transfer
|
|
// the total to total_mapped_bytes, and reset this to zero.
|
|
size_t mapped_bytes_;
|
|
// Whether the file was released.
|
|
bool released_;
|
|
// A view containing the whole file. May be NULL if we mmap only
|
|
// the relevant parts of the file. Not NULL if:
|
|
// - Flag --mmap_whole_files is set (default on 64-bit hosts).
|
|
// - The contents was specified in the constructor. Used only for
|
|
// testing purposes).
|
|
View* whole_file_view_;
|
|
};
|
|
|
|
// A view of file data that persists even when the file is unlocked.
|
|
// Callers should destroy these when no longer required. These are
|
|
// obtained form File_read::get_lasting_view. They may only be
|
|
// destroyed when the underlying File_read is locked.
|
|
|
|
class File_view
|
|
{
|
|
public:
|
|
// This may only be called when the underlying File_read is locked.
|
|
~File_view();
|
|
|
|
// Return a pointer to the data associated with this view.
|
|
const unsigned char*
|
|
data() const
|
|
{ return this->data_; }
|
|
|
|
private:
|
|
File_view(const File_view&);
|
|
File_view& operator=(const File_view&);
|
|
|
|
friend class File_read;
|
|
|
|
// Callers have to get these via File_read::get_lasting_view.
|
|
File_view(File_read& file, File_read::View* view, const unsigned char* data)
|
|
: file_(file), view_(view), data_(data)
|
|
{ }
|
|
|
|
File_read& file_;
|
|
File_read::View* view_;
|
|
const unsigned char* data_;
|
|
};
|
|
|
|
// All the information we hold for a single input file. This can be
|
|
// an object file, a shared library, or an archive.
|
|
|
|
class Input_file
|
|
{
|
|
public:
|
|
enum Format
|
|
{
|
|
FORMAT_NONE,
|
|
FORMAT_ELF,
|
|
FORMAT_BINARY
|
|
};
|
|
|
|
Input_file(const Input_file_argument* input_argument)
|
|
: input_argument_(input_argument), found_name_(), file_(),
|
|
is_in_sysroot_(false), format_(FORMAT_NONE)
|
|
{ }
|
|
|
|
// Create an input file given just a filename.
|
|
Input_file(const char* name);
|
|
|
|
// Create an input file with the contents already provided. This is
|
|
// only used for testing. With this path, don't call the open
|
|
// method.
|
|
Input_file(const Task*, const char* name, const unsigned char* contents,
|
|
off_t size);
|
|
|
|
// Return the command line argument.
|
|
const Input_file_argument*
|
|
input_file_argument() const
|
|
{ return this->input_argument_; }
|
|
|
|
// Return whether this is a file that we will search for in the list
|
|
// of directories.
|
|
bool
|
|
will_search_for() const;
|
|
|
|
// Open the file. If the open fails, this will report an error and
|
|
// return false. If there is a search, it starts at directory
|
|
// *PINDEX. *PINDEX should be initialized to zero. It may be
|
|
// restarted to find the next file with a matching name by
|
|
// incrementing the result and calling this again.
|
|
bool
|
|
open(const Dirsearch&, const Task*, int* pindex);
|
|
|
|
// Return the name given by the user. For -lc this will return "c".
|
|
const char*
|
|
name() const;
|
|
|
|
// Return the file name. For -lc this will return something like
|
|
// "/usr/lib/libc.so".
|
|
const std::string&
|
|
filename() const
|
|
{ return this->file_.filename(); }
|
|
|
|
// Return the name under which we found the file, corresponding to
|
|
// the command line. For -lc this will return something like
|
|
// "libc.so".
|
|
const std::string&
|
|
found_name() const
|
|
{ return this->found_name_; }
|
|
|
|
// Return the position dependent options.
|
|
const Position_dependent_options&
|
|
options() const;
|
|
|
|
// Return the file.
|
|
File_read&
|
|
file()
|
|
{ return this->file_; }
|
|
|
|
const File_read&
|
|
file() const
|
|
{ return this->file_; }
|
|
|
|
// Whether we found the file in a directory in the system root.
|
|
bool
|
|
is_in_sysroot() const
|
|
{ return this->is_in_sysroot_; }
|
|
|
|
// Whether this file is in a system directory.
|
|
bool
|
|
is_in_system_directory() const;
|
|
|
|
// Return whether this file is to be read only for its symbols.
|
|
bool
|
|
just_symbols() const;
|
|
|
|
// Return the format of the unconverted input file.
|
|
Format
|
|
format() const
|
|
{ return this->format_; }
|
|
|
|
// Try to find a file in the extra search dirs. Returns true on success.
|
|
static bool
|
|
try_extra_search_path(int* pindex,
|
|
const Input_file_argument* input_argument,
|
|
std::string filename, std::string* found_name,
|
|
std::string* namep);
|
|
|
|
// Find the actual file.
|
|
static bool
|
|
find_file(const Dirsearch& dirpath, int* pindex,
|
|
const Input_file_argument* input_argument,
|
|
bool* is_in_sysroot,
|
|
std::string* found_name, std::string* namep);
|
|
|
|
private:
|
|
Input_file(const Input_file&);
|
|
Input_file& operator=(const Input_file&);
|
|
|
|
// Open a binary file.
|
|
bool
|
|
open_binary(const Task* task, const std::string& name);
|
|
|
|
// The argument from the command line.
|
|
const Input_file_argument* input_argument_;
|
|
// The name under which we opened the file. This is like the name
|
|
// on the command line, but -lc turns into libc.so (or whatever).
|
|
// It only includes the full path if the path was on the command
|
|
// line.
|
|
std::string found_name_;
|
|
// The file after we open it.
|
|
File_read file_;
|
|
// Whether we found the file in a directory in the system root.
|
|
bool is_in_sysroot_;
|
|
// Format of unconverted input file.
|
|
Format format_;
|
|
};
|
|
|
|
} // end namespace gold
|
|
|
|
#endif // !defined(GOLD_FILEREAD_H)
|