1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
use crate::assembler::resource::{RelaSymbol, Symbol};
use crate::assembler::{
    generator, parser,
    resource::{ELFBuilder, Syntax},
};
use indexmap::map::IndexMap;
use std::fs;

type ELFOrError = Result<elf_utilities::file::ELF64Dumper, Box<dyn std::error::Error>>;

/// Reads the assembly source stored at `input_file` and translates it into an
/// object file.
///
/// # Errors
///
/// Returns an error when the file cannot be read into a string; whatever the
/// internal assembling routine returns is forwarded unchanged.
pub fn assemble_file(input_file: &str, syntax: Syntax) -> ELFOrError {
    assemble(fs::read_to_string(input_file)?, syntax)
}

/// Translates assembly source code held in memory into an object file.
///
/// The text in `assembly_code` is handed, together with the requested
/// `syntax`, to the crate's internal assembling routine, and the outcome of
/// that routine is returned as-is.
///
/// # Examples
///
/// ```
/// use asmpeach::*;
///
/// let s = "    .globl main
///     .type main, @function
/// main:
///     pushq %rbp
///     movq %rsp, %rbp
///     movq $42, %rax
///     popq %rbp
///     ret"
///     .to_string();
/// let elf_builder = assemble_code(s, Syntax::ATANDT).unwrap();
/// elf_builder.generate_elf_file("obj.o", 0o644);
/// ```
pub fn assemble_code(assembly_code: String, syntax: Syntax) -> ELFOrError {
    assemble(assembly_code, syntax)
}

/// Assembles `source` into an in-memory ELF64 object.
///
/// The steps are: parse the source into a symbol map, generate machine code
/// for the symbols (which also produces the relocation symbols), resolve the
/// relocation symbols against the symbol map, and finally lay out the
/// sections and finalize the ELF header.
///
/// # Errors
///
/// Returns an error when `syntax` is `Syntax::INTEL`, which is not
/// implemented yet.
fn assemble(source: String, syntax: Syntax) -> ELFOrError {
    let mut symbols = match syntax {
        // Report the unsupported dialect through the `Result` instead of
        // panicking, so callers can handle it like any other failure.
        Syntax::INTEL => return Err("Intel syntax is not supported yet".into()),
        Syntax::ATANDT => parser::parse_atandt(source),
    };

    // Code generation.
    // The relocation symbols are defined at this point.
    let mut reloc_syms = generator::generate_main(&mut symbols);
    // Walk the relocation table and update every relocation symbol that has a
    // matching entry in the symbol table.
    generator::setup_relocation(&symbols, &mut reloc_syms);

    let mut builder = ELFBuilder::new();

    // NOTE: the order of the calls below determines the section indices, and
    // the section headers / symbols built by `ELFBuilder` hard-code those
    // indices (.text = 1, .symtab = 2, .strtab = 3). Do not reorder.

    // (NULL) section
    builder.add_section(elf_utilities::section::Section64::new_null_section());
    // .text section
    builder.add_text_section(&symbols);
    // .symtab section
    builder.add_symbol_table_section(&symbols);
    // .strtab section
    builder.add_symtab_string_section(&symbols);
    // .rela.text section
    builder.add_relatext_section(&reloc_syms);
    // A .rodata section is not emitted yet.
    // .shstrtab section
    builder.add_shstrtab_string_section();

    // Adjust the ELF header now that every section is in place.
    builder.condition_elf_header();

    Ok(elf_utilities::file::ELF64Dumper::new(builder.give_file()))
}

impl ELFBuilder {
    fn add_text_section(&mut self, symbols: &IndexMap<String, Symbol>) {
        // すべてのシンボルのコードを結合する
        let mut all_symbol_codes: Vec<u8> = Vec::new();

        for (_name, sym) in symbols.iter() {
            let mut symbol_codes = sym.codes.clone();
            all_symbol_codes.append(&mut symbol_codes);
        }

        // .textセクションの生成
        let text_shdr = self.init_text_section_header(all_symbol_codes.len());
        let mut text_section =
            elf_utilities::section::Section64::new(".text".to_string(), text_shdr);
        text_section.bytes = Some(all_symbol_codes);

        self.add_section(text_section);
    }

    fn add_symbol_table_section(&mut self, symbols: &IndexMap<String, Symbol>) {
        // NULLシンボル + .textシンボル (+ .rodataシンボル)
        let mut elf_symbols = vec![
            elf_utilities::symbol::Symbol64::new_null_symbol(),
            self.create_section_symbol(1),
        ];

        // シンボルを走査する
        // name_indexの操作も行う.
        // また,各シンボルのオフセットも計算する.
        let mut symbol_name_index: elf_utilities::Elf64Word = 1; // 最初のnull文字を飛ばす
        let mut symbol_offset: elf_utilities::Elf64Addr = 0; // st_value用

        for (symbol_name, symbol_info) in symbols.iter() {
            let symbol_code_length = symbol_info.codes.len();
            let symbol_name_length = symbol_name.len();

            let mut global_symbol = self.create_global_symbol(
                symbol_name_index,
                symbol_code_length as u64,
                symbol_offset,
            );
            global_symbol.symbol_name = Some(symbol_name.to_string());
            elf_symbols.push(global_symbol);

            // シンボル名を指すインデックスの更新( null byte を見越して+1する)
            symbol_name_index += symbol_name_length as elf_utilities::Elf64Word + 1;

            // オフセットの更新
            // 後ろのシンボルのオフセット <- 前のシンボルのサイズの総合値
            symbol_offset += symbol_code_length as elf_utilities::Elf64Addr;
        }

        let symbol_table_size =
            elf_symbols.len() * elf_utilities::symbol::Symbol64::size() as usize;
        // セクションの追加
        let symtab_section_header = self.init_symbol_table_section_header(symbol_table_size as u64);
        let mut symtab_section =
            elf_utilities::section::Section64::new(".symtab".to_string(), symtab_section_header);
        symtab_section.symbols = Some(elf_symbols);
        self.add_section(symtab_section);
    }

    fn add_symtab_string_section(&mut self, symbols: &IndexMap<String, Symbol>) {
        // シンボルマップをイテレートして,名前を集める.
        let symbol_names: Vec<&str> = symbols
            .iter()
            .map(|(name, _)| name.as_str())
            .collect::<Vec<&str>>();

        let symbol_string_table = elf_utilities::section::build_string_table(symbol_names);
        let strtab_header =
            self.init_string_table_header(symbol_string_table.len() as elf_utilities::Elf64Xword);
        let mut strtab_section =
            elf_utilities::section::Section64::new(".strtab".to_string(), strtab_header);
        strtab_section.bytes = Some(symbol_string_table);
        self.add_section(strtab_section);
    }

    fn add_relatext_section(&mut self, reloc_syms: &IndexMap<String, Vec<RelaSymbol>>) {
        let mut relas = Vec::new();

        for (_rela_name, relocs_in_syms) in reloc_syms.iter() {
            for rela in relocs_in_syms.iter() {
                relas.push(rela.rela64);
            }
        }

        // Relaオブジェクトをバイナリに変換
        let mut rela_table_binary: Vec<u8> = Vec::new();
        for rela in relas.iter() {
            let mut rela_entry_binary = rela.to_le_bytes();
            rela_table_binary.append(&mut rela_entry_binary);
        }

        let relatext_hdr = self.init_relatext_header(rela_table_binary.len() as u64);
        let mut relatext_section =
            elf_utilities::section::Section64::new(".rela.text".to_string(), relatext_hdr);
        relatext_section.rela_symbols = Some(relas);
        self.add_section(relatext_section);
    }

    pub fn add_shstrtab_string_section(&mut self) {
        // TODO: 決め打ち
        let section_names = vec![".text", ".symtab", ".strtab", ".rela.text", ".shstrtab"];

        let section_string_table = elf_utilities::section::build_string_table(section_names);
        let shstrtab_header =
            self.init_string_table_header(section_string_table.len() as elf_utilities::Elf64Xword);
        let mut shstrtab_section =
            elf_utilities::section::Section64::new(".shstrtab".to_string(), shstrtab_header);
        shstrtab_section.bytes = Some(section_string_table);
        self.add_section(shstrtab_section);
    }

    fn condition_elf_header(&mut self) {
        self.file.finalize();
    }

    fn init_text_section_header(&self, length: usize) -> elf_utilities::section::Shdr64 {
        let mut shdr: elf_utilities::section::Shdr64 = Default::default();

        shdr.set_type(elf_utilities::section::Type::ProgBits);
        shdr.sh_size = length as elf_utilities::Elf64Xword;
        shdr.sh_addralign = 1;
        shdr.sh_flags = elf_utilities::section::SHF_ALLOC | elf_utilities::section::SHF_EXECINSTR;

        shdr
    }

    fn init_symbol_table_section_header(
        &self,
        length: elf_utilities::Elf64Xword,
    ) -> elf_utilities::section::Shdr64 {
        let mut shdr: elf_utilities::section::Shdr64 = Default::default();

        shdr.set_type(elf_utilities::section::Type::SymTab);
        shdr.sh_size = length;
        shdr.sh_addralign = 1;
        shdr.sh_entsize = elf_utilities::symbol::Symbol64::size();

        // TODO: .strtabが3番目にあることを決め打ち
        shdr.sh_link = 3;

        // TODO: 最初のグローバルシンボルが3番目にあることを決め打ち
        shdr.sh_info = 2;
        shdr
    }

    fn init_string_table_header(
        &self,
        length: elf_utilities::Elf64Xword,
    ) -> elf_utilities::section::Shdr64 {
        let mut shdr: elf_utilities::section::Shdr64 = Default::default();

        shdr.set_type(elf_utilities::section::Type::StrTab);
        shdr.sh_size = length;
        shdr.sh_addralign = 1;

        shdr
    }

    fn init_relatext_header(
        &self,
        length: elf_utilities::Elf64Xword,
    ) -> elf_utilities::section::Shdr64 {
        let mut shdr: elf_utilities::section::Shdr64 = Default::default();

        shdr.set_type(elf_utilities::section::Type::Rela);
        shdr.sh_size = length;
        shdr.sh_flags = elf_utilities::section::SHF_INFO_LINK;
        shdr.sh_addralign = 8;
        shdr.sh_entsize = elf_utilities::relocation::Rela64::size();

        // TODO: シンボルテーブルが2番目にあることを決め打ち
        shdr.sh_link = 2;

        // TODO: .textセクションが一番目にあることを決め打ち
        shdr.sh_info = 1;

        shdr
    }

    fn create_global_symbol(
        &self,
        st_name: elf_utilities::Elf64Word,
        st_size: elf_utilities::Elf64Xword,
        st_offset: elf_utilities::Elf64Addr,
    ) -> elf_utilities::symbol::Symbol64 {
        let mut symbol: elf_utilities::symbol::Symbol64 = Default::default();
        symbol.st_name = st_name;
        symbol.st_size = st_size;
        symbol.st_value = st_offset;

        // TODO: .textが1番目にあることを決め打ち
        symbol.st_shndx = 1;

        // グローバル + Function属性

        symbol.set_info(
            elf_utilities::symbol::Type::Func,
            elf_utilities::symbol::Bind::Global,
        );

        symbol
    }

    fn create_section_symbol(&self, shndx: u16) -> elf_utilities::symbol::Symbol64 {
        let mut symbol: elf_utilities::symbol::Symbol64 = Default::default();

        symbol.st_shndx = shndx;

        // ローカル + SECTION属性
        symbol.set_info(
            elf_utilities::symbol::Type::Section,
            elf_utilities::symbol::Bind::Local,
        );

        symbol
    }
}