as: input: move pass 1 and 2 to separate modules

This commit is contained in:
Mikael Pettersson 2024-01-27 18:01:38 +01:00
parent 84742bfddc
commit 137ccba768
4 changed files with 810 additions and 732 deletions

View File

@ -1,7 +1,7 @@
%%% -*- erlang-indent-level: 2 -*- %%% -*- erlang-indent-level: 2 -*-
%%% %%%
%%% input processing phase for pdp10-elf as %%% input processing phase for pdp10-elf as
%%% Copyright (C) 2013-2023 Mikael Pettersson %%% Copyright (C) 2013-2024 Mikael Pettersson
%%% %%%
%%% This file is part of pdp10-tools. %%% This file is part of pdp10-tools.
%%% %%%
@ -21,741 +21,18 @@
-module(input). -module(input).
-export([ files/1 -export([ files/1
, format_error/1
]). ]).
-include("tunit.hrl"). -include("tunit.hrl").
-include_lib("lib/include/pdp10_elf36.hrl").
-spec files([string()]) -> {ok, #tunit{}} | {error, {module(), term()}}. -spec files([string()]) -> {ok, #tunit{}} | {error, {module(), term()}}.
files(Files0) -> files(Files) ->
Files = case input_pass1:pass1(fixup_files(Files)) of
case Files0 of {ok, SectionsMap} -> input_pass2:pass2(SectionsMap);
[] -> ["--"]; % alias for stdin
_ -> Files0
end,
pass1(Files).
%% Pass 1 ----------------------------------------------------------------------
%%
%% - scan, parse, annotate stmts with locations
%% - maintain current and previous section and subsection, and stack thereof
%% - interpret sectioning stmts, accumulate annotated stmts in subsections
-type sectionname() :: string().
-type subsectionnr() :: non_neg_integer().
-type locationandstmt() :: {scan:location(), stmt()}.
-type subsectionsmap() :: #{subsectionnr() => [locationandstmt()]}.
-type sectionsmap() :: #{sectionname() => {#section{}, subsectionsmap()}}.
-type sectionandsub() :: {sectionname(), subsectionnr()}.
-record(ctx,
{ sections_map :: sectionsmap()
, stack :: [{Current :: sectionandsub(), Previous :: sectionandsub()}]
, current :: sectionandsub()
, previous :: sectionandsub() | []
, stmts :: [locationandstmt()]
}).
pass1(Files) ->
pass1_files(Files, ctx_init()).
pass1_files([], Ctx) -> pass2(ctx_fini(Ctx));
pass1_files([File | Files], Ctx) ->
case pass1_file(File, Ctx) of
{ok, NewCtx} -> pass1_files(Files, NewCtx);
{error, _Reason} = Error -> Error {error, _Reason} = Error -> Error
end. end.
pass1_file(File, Ctx) -> %% Internal --------------------------------------------------------------------
case scan_state_open(File) of
{ok, ScanState} ->
try pass1_process(ScanState, Ctx)
after scan:fclose(ScanState)
end;
{error, _Reason} = Error -> Error
end.
pass1_process(ScanState, Ctx) -> fixup_files([]) -> ["--"]; % alias for stdin
case parse:stmt(ScanState) of fixup_files(Files) -> Files.
eof -> {ok, Ctx};
{ok, {Location, Stmt}} ->
case pass1_stmt(Location, Ctx, Stmt) of
{ok, NewCtx} -> pass1_process(ScanState, NewCtx);
{error, _Reason} = Error -> Error
end;
{error, _Reason} = Error -> Error
end.
pass1_stmt(Location, Ctx, Stmt) ->
case Stmt of
#s_dot_data{} -> dot_data(Location, Ctx, Stmt);
#s_dot_popsection{} -> dot_popsection(Location, Ctx, Stmt);
#s_dot_previous{} -> dot_previous(Location, Ctx, Stmt);
#s_dot_section{} -> dot_section(Location, Ctx, Stmt);
#s_dot_subsection{} -> dot_subsection(Location, Ctx, Stmt);
#s_dot_text{} -> dot_text(Location, Ctx, Stmt);
_ -> {ok, ctx_append(Ctx, Location, Stmt)}
end.
dot_data(Location, Ctx, #s_dot_data{nr = SubsectionNr}) ->
{ok, ctx_data(Ctx, Location, SubsectionNr)}.
dot_popsection(Location, Ctx0, #s_dot_popsection{}) ->
case ctx_try_popsection(Ctx0) of
{ok, _Ctx} = Result -> Result;
false -> fmterr(Location, ".popsection with empty section stack", [])
end.
dot_previous(Location, Ctx0, #s_dot_previous{}) ->
case ctx_try_previous(Ctx0) of
{ok, _Ctx} = Result -> Result;
false -> fmterr(Location, ".previous with empty section stack", [])
end.
dot_section(Location, Ctx, Stmt) ->
#s_dot_section{ name = SectionName
, nr = SubsectionNrOpt
, sh_flags = ShFlags
, sh_type = ShType
, sh_entsize = ShEntSize
} = Stmt,
ctx_section(Ctx, Location, SectionName, SubsectionNrOpt,
ShFlags, ShType, ShEntSize).
dot_subsection(_Location, Ctx, #s_dot_subsection{nr = SubsectionNr}) ->
{ok, ctx_subsection(Ctx, SubsectionNr)}.
dot_text(Location, Ctx, #s_dot_text{nr = SubsectionNr}) ->
{ok, ctx_text(Ctx, Location, SubsectionNr)}.
%% Context utilities
%% INV: any section name in current/previous/stack is bound in sections_map
ctx_init() ->
SectionName = ".text",
Section = section_dot_text(),
SubsectionsMap = #{},
SubsectionNr = 0,
#ctx{ sections_map = #{SectionName => {Section, SubsectionsMap}}
, stack = []
, current = {SectionName, SubsectionNr}
, previous = []
, stmts = []
}.
ctx_fini(Ctx) ->
(ctx_flush(Ctx))#ctx.sections_map.
ctx_flush(Ctx) ->
#ctx{ sections_map = SectionsMap0
, current = {SectionName, SubsectionNr}
, stmts = Stmts
} = Ctx,
{Section, SubsectionsMap0} = maps:get(SectionName, SectionsMap0), % must exist
SubsectionsMap = maps:put(SubsectionNr, Stmts, SubsectionsMap0),
SectionsMap = maps:put(SectionName, {Section, SubsectionsMap}, SectionsMap0),
Ctx#ctx{sections_map = SectionsMap}.
ctx_try_popsection(Ctx0) -> % implements .popsection
Ctx = ctx_flush(Ctx0),
#ctx{ sections_map = SectionsMap
, stack = Stack
} = Ctx,
case Stack of
[] -> false;
[{Current = {SectionName, SubsectionNr}, Previous} | RestStack] ->
Stmts = get_subsection(SectionName, SubsectionNr, SectionsMap),
{ok, Ctx#ctx{ stack = RestStack
, current = Current
, previous = Previous
, stmts = Stmts
}}
end.
ctx_try_previous(Ctx0) -> % implements .previous
Ctx = ctx_flush(Ctx0),
#ctx{ sections_map = SectionsMap
, current = Current
, previous = Previous
} = Ctx,
case Previous of
[] -> false;
{SectionName, SubsectionNr} ->
Stmts = get_subsection(SectionName, SubsectionNr, SectionsMap),
{ok, Ctx#ctx{ current = Previous
, previous = Current
, stmts = Stmts
}}
end.
ctx_section(Ctx0, Location, SectionName, SubsectionNrOpt,
ShFlags, ShType, ShEntSize) ->
{IsPushsection, SubsectionNr} =
case SubsectionNrOpt of
false -> {false, 0};
_ -> {true, SubsectionNrOpt}
end,
Ctx = ctx_flush(Ctx0),
#ctx{ sections_map = SectionsMap0
, stack = Stack
, current = Current
, previous = Previous
} = Ctx,
case enter_section(Location, SectionName, SubsectionNr, SectionsMap0,
ShFlags, ShType, ShEntSize) of
{ok, {Stmts, SectionsMap}} ->
NewStack =
case IsPushsection of
true -> [{Current, Previous} | Stack];
false -> Stack
end,
{ok, Ctx#ctx{ sections_map = SectionsMap
, stack = NewStack
, current = {SectionName, SubsectionNr}
, previous = Current
, stmts = Stmts
}};
{error, _Reason} = Error -> Error
end.
ctx_subsection(Ctx0, SubsectionNr) -> % implements .subsection <nr>
Ctx = ctx_flush(Ctx0),
#ctx{ sections_map = SectionsMap
, current = Current = {SectionName, _CurSubsectionNr}
} = Ctx,
Stmts = enter_subsection(SectionName, SubsectionNr, SectionsMap),
Ctx#ctx{ current = {SectionName, SubsectionNr}
, previous = Current
, stmts = Stmts
}.
ctx_data(Ctx, Location, SubsectionNr) -> % implements .data <nr>
ctx_enter_section(Ctx, Location, ".data", SubsectionNr).
ctx_text(Ctx, Location, SubsectionNr) -> % implements .text <nr>
ctx_enter_section(Ctx, Location, ".text", SubsectionNr).
%% switch to known system section, e.g. .data or .text
ctx_enter_section(Ctx0, Location, SectionName, SubsectionNr) ->
Ctx = ctx_flush(Ctx0),
#ctx{ sections_map = SectionsMap0
, current = Current
} = Ctx,
{ok, {Stmts, SectionsMap}} =
enter_section(Location, SectionName, SubsectionNr, SectionsMap0),
Ctx#ctx{ sections_map = SectionsMap
, current = {SectionName, SubsectionNr}
, previous = Current
, stmts = Stmts
}.
ctx_append(Ctx, Location, Stmt) ->
#ctx{stmts = Stmts} = Ctx,
Ctx#ctx{stmts = [{Location, Stmt} | Stmts]}.
enter_section(Location, SectionName, SubsectionNr, SectionsMap) ->
enter_section(Location, SectionName, SubsectionNr, SectionsMap,
_ShFlags = 0, _ShType = 0, _ShEntSize = 0).
enter_section(Location, SectionName, SubsectionNr, SectionsMap0,
ShFlags, ShType, ShEntSize) ->
{Section0, SubsectionsMap} = get_section(SectionName, SectionsMap0),
case update_section(Location, Section0, ShFlags, ShType, ShEntSize) of
{ok, Section} ->
SectionsMap = maps:put(SectionName, {Section, SubsectionsMap}, SectionsMap0),
Stmts = maps:get(SubsectionNr, SubsectionsMap, []),
{ok, {Stmts, SectionsMap}};
{error, _Reason} = Error -> Error
end.
get_section(SectionName, SectionsMap) ->
case maps:get(SectionName, SectionsMap, false) of
{_Section, _SubsectionsMap} = Result -> Result;
false ->
case section_from_name(SectionName) of
#section{} = Section ->
SubsectionsMap = #{},
{Section, SubsectionsMap};
false ->
Section = make_section(SectionName),
SubsectionsMap = #{},
{Section, SubsectionsMap}
end
end.
make_section(SectionName) ->
%% update_section/5 will set sh_flags, sh_type, and sh_entsize
#section{ name = SectionName
, data = {stmts, []}
, dot = 0
, shndx = 0
, sh_name = 0
, sh_type = 0
, sh_offset = 0
, sh_flags = 0
, sh_link = ?SHN_UNDEF
, sh_info = 0
, sh_addralign = 1
, sh_entsize = 0
}.
update_section(Location, Section0, ShFlags, ShType, ShEntSize) ->
case update_sh_flags(Location, Section0, ShFlags) of
{ok, Section1} ->
case update_sh_type(Location, Section1, ShType) of
{ok, Section2} ->
update_sh_entsize(Location, Section2, ShEntSize);
{error, _Reason} = Error -> Error
end;
{error, _Reason} = Error -> Error
end.
update_sh_flags(Location, Section, ShFlags) ->
case ShFlags of
0 -> {ok, Section};
_ ->
case Section#section.sh_flags of
0 -> {ok, Section#section{sh_flags = ShFlags}};
ShFlags -> {ok, Section};
ShFlags0 ->
case may_update_sh_flags(Section, ShFlags) of
true -> {ok, Section#section{sh_flags = ShFlags0 bor ShFlags}};
false -> fmterr(Location, "cannot change section flags", [])
end
end
end.
may_update_sh_flags(Section, ShFlags) ->
%% Processor and application-specific flags may be added to an existing
%% section. The range of application-specific flags isn't defined in the
%% ELF spec: we interpret that as any flag outside of the reserved ranges.
ReservedMask = (?SHF_COMPRESSED * 2 - 1) bor ?SHF_MASKOS,
case (ShFlags band ReservedMask) =:= 0 of
true -> true;
false ->
case ShFlags of
?SHF_ALLOC ->
case Section#section.name of
".interp" -> true;
".strtab" -> true;
".symtab" -> true;
_ -> false
end;
?SHF_EXECINSTR -> Section#section.name =:= ".note.GNU-stack";
_ -> false
end
end.
update_sh_type(Location, Section, ShType) ->
case ShType of
0 -> {ok, Section};
_ ->
case Section#section.sh_type of
0 -> {ok, Section#section{sh_type = ShType}};
ShType -> {ok, Section};
_ -> fmterr(Location, "cannot change section type", [])
end
end.
update_sh_entsize(Location, Section, ShEntSize) ->
case ShEntSize of
0 -> {ok, Section};
_ ->
case Section#section.sh_entsize of
0 -> {ok, Section#section{sh_entsize = ShEntSize}};
ShEntSize -> {ok, Section};
_ -> fmterr(Location, "cannot change section element size", [])
end
end.
enter_subsection(SectionName, SubsectionNr, SectionsMap) ->
{_Section, SubsectionsMap} = maps:get(SectionName, SectionsMap), % must exist
maps:get(SubsectionNr, SubsectionsMap, []). % may be absent
get_subsection(SectionName, SubsectionNr, SectionsMap) ->
{_Section, SubsectionsMap} = maps:get(SectionName, SectionsMap), % must exist
maps:get(SubsectionNr, SubsectionsMap). % must exist
%% Scan state utilities
scan_state_open(File) ->
case File of
"--" -> scan:stdin();
"-" -> scan:stdin();
_ -> scan:fopen(File)
end.
%% Pass 2 ----------------------------------------------------------------------
%%
%% - process subsections in order
%% - interpret stmts
%% Entry point of pass 2: walks every section collected by pass 1, starting
%% from a freshly initialised translation unit (see tunit_init/0).
%% Returns {ok, Tunit} or the first {error, Reason} encountered.
pass2(SectionsMap) ->
  Sections = maps:to_list(SectionsMap),
  pass2_sections(Sections, tunit_init()).
%% Process the sections one at a time, threading the translation unit through.
%% Each section record is stored in the tunit and its name becomes `cursect`
%% before the section's subsections are processed. Stops at the first error.
pass2_sections([{Name, {Section, SubsectionsMap}} | Rest], Tunit0) ->
  Registered = tunit:put_section(Tunit0, Section),
  Tunit1 = Registered#tunit{cursect = Name},
  case pass2_subsections(Name, SubsectionsMap, Tunit1) of
    {error, _Reason} = Failure -> Failure;
    {ok, Tunit2} -> pass2_sections(Rest, Tunit2)
  end;
pass2_sections([], Tunit) ->
  {ok, Tunit}.
%% Process all subsections of one section in ascending subsection number.
%% The leading `case` is an assertion on the section name: only names starting
%% with .data, .debug, .rodata or .text are accepted, anything else fails
%% with a case_clause error.
pass2_subsections(SectionName, SubsectionsMap, Tunit) ->
  case SectionName of
    ".data" ++ _ -> ok;
    ".debug" ++ _ -> ok;
    ".rodata" ++ _ -> ok;
    ".text" ++ _ -> ok
  end,
  Ordered = lists:sort(maps:to_list(SubsectionsMap)),
  pass2_subsections(Ordered, Tunit).
%% Process a list of {SubsectionNr, Stmts} pairs in the given order.
%% Pass 1 accumulates statements most-recent-first, so each list is reversed
%% before its statements are interpreted. Stops at the first error.
pass2_subsections([{_Nr, ReversedStmts} | Rest], Tunit0) ->
  case pass2_stmts(lists:reverse(ReversedStmts), Tunit0) of
    {error, _Reason} = Failure -> Failure;
    {ok, Tunit1} ->
      %% GAS documentation states that each sub-section is padded to make its
      %% size a multiple of 4 bytes, but also that other implementations may
      %% do differently. We do not insert any implicit padding.
      pass2_subsections(Rest, Tunit1)
  end;
pass2_subsections([], Tunit) ->
  {ok, Tunit}.
%% Interpret located statements in order, threading the translation unit
%% through pass2_stmt/3. Returns {ok, Tunit} or the first error.
pass2_stmts([{Location, Stmt} | Rest], Tunit0) ->
  case pass2_stmt(Location, Tunit0, Stmt) of
    {error, _Reason} = Failure -> Failure;
    {ok, Tunit1} -> pass2_stmts(Rest, Tunit1)
  end;
pass2_stmts([], Tunit) ->
  {ok, Tunit}.
%% Dispatch one statement to its pass 2 handler, selected by record type.
%% Every handler receives (Location, Tunit, Stmt) and its result is returned
%% unchanged. There is deliberately no catch-all clause: a statement of any
%% other record type fails with a case_clause error.
pass2_stmt(Location, Tunit, Stmt) ->
case Stmt of
#s_dot_ascii{} -> dot_ascii(Location, Tunit, Stmt);
#s_dot_byte{} -> dot_byte(Location, Tunit, Stmt);
#s_dot_file{} -> dot_file(Location, Tunit, Stmt);
#s_dot_globl{} -> dot_globl(Location, Tunit, Stmt);
#s_dot_ident{} -> dot_ident(Location, Tunit, Stmt);
#s_dot_long{} -> dot_long(Location, Tunit, Stmt);
#s_dot_short{} -> dot_short(Location, Tunit, Stmt);
#s_dot_size{} -> dot_size(Location, Tunit, Stmt);
#s_dot_type{} -> dot_type(Location, Tunit, Stmt);
#s_dot_2byte{} -> dot_2byte(Location, Tunit, Stmt);
#s_dot_4byte{} -> dot_4byte(Location, Tunit, Stmt);
#s_label{} -> label(Location, Tunit, Stmt);
#s_local_label{} -> local_label(Location, Tunit, Stmt);
#s_insn{} -> insn(Location, Tunit, Stmt)
end.
%% Append a string statement to the current section and advance its dot by
%% the total length of the strings, plus one per string when `z` is true.
dot_ascii(_Location, Tunit, #s_dot_ascii{z = Z, strings = Strings} = Stmt) ->
  #tunit{cursect = Cursect} = Tunit,
  Section = tunit:get_section(Tunit, Cursect),
  #section{data = {stmts, Stmts}, dot = Dot} = Section,
  CharCount = lists:sum([length(String) || String <- Strings]),
  ExtraCount =
    case Z of
      true -> length(Strings);
      false -> 0
    end,
  Updated = Section#section{ data = {stmts, [Stmt | Stmts]}
                           , dot = Dot + CharCount + ExtraCount
                           },
  {ok, tunit:put_section(Tunit, Updated)}.
%% .byte: one unit per expression, no alignment requirement.
%% Delegates to integer_data_directive/8 with accessors for the exprs field.
dot_byte(Location, Tunit, #s_dot_byte{} = Stmt) ->
  Get = fun(S) -> S#s_dot_byte.exprs end,
  Set = fun(S, Exprs) -> S#s_dot_byte{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Stmt, 1, 1, ".byte", Get, Set).
%% .file: record a local STT_FILE symbol named after the given string,
%% with absolute section index and zero value and size.
dot_file(_Location, Tunit, #s_dot_file{string = String}) ->
  StInfo = ?ELF_ST_INFO(?STB_LOCAL, ?STT_FILE),
  FileSymbol = #symbol{ name = String
                      , section = abs
                      , st_shndx = ?SHN_ABS
                      , st_info = StInfo
                      , st_value = 0
                      , st_size = 0
                      , st_name = 0
                      },
  {ok, tunit:put_symbol(Tunit, FileSymbol)}.
%% .globl: give the named symbol global binding.
%% - unknown symbol: create an undefined global symbol without a type
%% - already global: nothing to do
%% - local: rebind as global, keeping the symbol type
%% - any other binding: error
dot_globl(Location, Tunit, #s_dot_globl{name = Name}) ->
  case tunit:get_symbol(Tunit, Name) of
    #symbol{st_info = StInfo} = Existing ->
      case ?ELF_ST_BIND(StInfo) of
        ?STB_GLOBAL ->
          {ok, Tunit};
        ?STB_LOCAL -> % FIXME: assumed local-by-default, are there hard-local symbols?
          GlobalInfo = ?ELF_ST_INFO(?STB_GLOBAL, ?ELF_ST_TYPE(StInfo)),
          {ok, tunit:put_symbol(Tunit, Existing#symbol{st_info = GlobalInfo})};
        Bind ->
          fmterr(Location, "symbol ~s has previous incompatible binding type ~p", [Name, Bind])
      end;
    false ->
      Undefined = #symbol{ name = Name
                         , section = false
                         , st_value = false
                         , st_size = false
                         , st_info = ?ELF_ST_INFO(?STB_GLOBAL, ?STT_NOTYPE)
                         , st_name = 0
                         , st_shndx = 0
                         },
      {ok, tunit:put_symbol(Tunit, Undefined)}
  end.
%% .ident: prepend the statement to the ".comment" section, creating that
%% section from section_dot_comment/0 when the tunit does not have it yet.
%% The current section and its dot are not touched.
dot_ident(_Location, Tunit, #s_dot_ident{} = Stmt) ->
  Comment =
    case tunit:get_section(Tunit, ".comment") of
      false -> section_dot_comment();
      Section -> Section
    end,
  #section{data = {stmts, Stmts}} = Comment,
  {ok, tunit:put_section(Tunit, Comment#section{data = {stmts, [Stmt | Stmts]}})}.
%% .long: 4 units per expression, and dot must be a multiple of that size.
dot_long(Location, Tunit, #s_dot_long{} = Stmt) ->
  Size = 4, % FIXME: target-specific
  Get = fun(S) -> S#s_dot_long.exprs end,
  Set = fun(S, Exprs) -> S#s_dot_long{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Stmt, Size, Size, ".long", Get, Set).
%% Shared implementation of the integer data directives.
%% - Size: amount dot advances per expression
%% - Align: dot must be a multiple of this, otherwise an error naming Lexeme
%%   is returned
%% - GetExpr / SetExprs: read and replace the statement's expression list
%% On success every expression is passed through expr_fixup/2, the rewritten
%% statement is prepended to the current section, and dot is advanced.
integer_data_directive(Location, Tunit, Stmt, Size, Align, Lexeme, GetExpr, SetExprs) ->
  Exprs = GetExpr(Stmt),
  #tunit{cursect = Cursect} = Tunit,
  Section = tunit:get_section(Tunit, Cursect),
  #section{data = {stmts, Stmts}, dot = Dot} = Section,
  case Dot rem Align of
    0 ->
      FixedExprs = [expr_fixup(Tunit, Expr) || Expr <- Exprs],
      FixedStmt = SetExprs(Stmt, FixedExprs),
      NewDot = Dot + Size * length(FixedExprs),
      Updated = Section#section{data = {stmts, [FixedStmt | Stmts]}, dot = NewDot},
      {ok, tunit:put_section(Tunit, Updated)};
    _ ->
      fmterr(Location, "misaligned address for ~s", [Lexeme])
  end.
%% .short: 2 units per expression, and dot must be a multiple of that size.
dot_short(Location, Tunit, #s_dot_short{} = Stmt) ->
  Size = 2, % FIXME: target-specific
  Get = fun(S) -> S#s_dot_short.exprs end,
  Set = fun(S, Exprs) -> S#s_dot_short{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Stmt, Size, Size, ".short", Get, Set).
%% .size: set the size of the named symbol to the distance from the symbol's
%% value to the current dot.
%% Errors:
%% - the symbol already has a size
%% - the symbol is unknown, or was only declared (e.g. by .globl or .type) and
%%   has no defining label yet; such symbols carry `section = false`
%% - the symbol is defined in another section than the current one
%% - the symbol's value lies beyond dot, which would make the size negative
dot_size(Location, Tunit, #s_dot_size{name = Name}) ->
  #tunit{cursect = Cursect} = Tunit,
  #section{dot = Dot} = tunit:get_section(Tunit, Cursect),
  case tunit:get_symbol(Tunit, Name) of
    #symbol{st_size = StSize} when StSize =/= false ->
      fmterr(Location, "size of symbol ~s already defined", [Name]);
    #symbol{section = false} ->
      %% declared but not defined: report that, rather than falling into the
      %% section comparison below where `false =/= Cursect` is always true
      fmterr(Location, "symbol ~s not defined", [Name]);
    #symbol{section = Section} when Section =/= Cursect ->
      fmterr(Location, "symbol ~s not defined in same section as dot", [Name]);
    #symbol{st_value = StValue} = OldSymbol when StValue =< Dot -> % note: false > integer()
      Symbol = OldSymbol#symbol{st_size = Dot - StValue},
      {ok, tunit:put_symbol(Tunit, Symbol)};
    #symbol{st_value = StValue} when StValue =/= false, StValue > Dot ->
      fmterr(Location, "cannot make symbol ~s negative size", [Name]);
    _ ->
      fmterr(Location, "symbol ~s not defined", [Name])
  end.
%% .type: set the ELF symbol type (function or object) of the named symbol.
%% - unknown symbol: create an undefined local symbol of that type
%% - same type already set: nothing to do
%% - no type yet: set it, keeping the binding
%% - a different type: error
%% Any `type` other than function/object fails with a case_clause error.
dot_type(Location, Tunit, #s_dot_type{name = Name, type = Type}) ->
  StType =
    case Type of
      function -> ?STT_FUNC;
      object -> ?STT_OBJECT
    end,
  case tunit:get_symbol(Tunit, Name) of
    #symbol{st_info = StInfo} = Existing ->
      case ?ELF_ST_TYPE(StInfo) of
        StType ->
          {ok, Tunit};
        ?STT_NOTYPE ->
          TypedInfo = ?ELF_ST_INFO(?ELF_ST_BIND(StInfo), StType),
          {ok, tunit:put_symbol(Tunit, Existing#symbol{st_info = TypedInfo})};
        Other ->
          fmterr(Location, "symbol ~s has previous incompatible type ~p", [Name, Other])
      end;
    false ->
      Undefined = #symbol{ name = Name
                         , section = false
                         , st_value = false
                         , st_size = false
                         , st_info = ?ELF_ST_INFO(?STB_LOCAL, StType)
                         , st_name = 0
                         , st_shndx = 0
                         },
      {ok, tunit:put_symbol(Tunit, Undefined)}
  end.
%% .2byte: 2 units per expression; unlike .short there is no alignment
%% requirement (Align is 1).
dot_2byte(Location, Tunit, #s_dot_2byte{} = Stmt) ->
  Size = 2, % FIXME: target-specific
  Get = fun(S) -> S#s_dot_2byte.exprs end,
  Set = fun(S, Exprs) -> S#s_dot_2byte{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Stmt, Size, 1, ".2byte", Get, Set).
%% .4byte: 4 units per expression; unlike .long there is no alignment
%% requirement (Align is 1).
dot_4byte(Location, Tunit, #s_dot_4byte{} = Stmt) ->
  Size = 4, % FIXME: target-specific
  Get = fun(S) -> S#s_dot_4byte.exprs end,
  Set = fun(S, Exprs) -> S#s_dot_4byte{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Stmt, Size, 1, ".4byte", Get, Set).
%% Define a named label at the current dot.
%% A symbol that exists but has neither section nor value is completed in
%% place; a symbol that has either is a redefinition and yields an error.
label(Location, Tunit, #s_label{name = Name}) ->
  case tunit:get_symbol(Tunit, Name) of
    false ->
      define_new_label(Tunit, Name);
    #symbol{section = false, st_value = false} = Declared ->
      define_label(Tunit, Declared);
    #symbol{} ->
      fmterr(Location, "label ~s already defined", [Name])
  end.
%% Create a fresh symbol for Name and define it at the current dot.
%% The section and value placeholders are filled in by define_label/2.
define_new_label(Tunit, Name) ->
  Blank = #symbol{ name = Name
                 , section = false % overridden by define_label/2
                 , st_value = false % overridden by define_label/2
                 , st_size = false
                 , st_info = 0
                 , st_name = 0
                 , st_shndx = 0
                 },
  define_label(Tunit, Blank).
%% Bind Symbol to the current section and its current dot, and store it.
define_label(Tunit, Symbol) ->
  #tunit{cursect = Cursect} = Tunit,
  #section{dot = Dot} = tunit:get_section(Tunit, Cursect),
  Defined = Symbol#symbol{section = Cursect, st_value = Dot},
  {ok, tunit:put_symbol(Tunit, Defined)}.
%% Define a numeric local label: bump the serial recorded for Number, record
%% the new serial in the tunit, and define a symbol under the generated name.
local_label(_Location, Tunit0, #s_local_label{number = Number}) ->
  NextSerial = local_label_serial(Tunit0, Number) + 1,
  Name = local_label_name(Number, NextSerial),
  Tunit = tunit:put_local_label(Tunit0, Number, NextSerial),
  define_new_label(Tunit, Name).
%% Serial recorded for local label Number, or 0 when the tunit has none.
local_label_serial(Tunit, Number) ->
  case tunit:get_local_label(Tunit, Number) of
    false -> 0;
    Recorded -> Recorded
  end.
%% Symbol name for one definition of a numeric local label: ".L", the label
%% number, a Ctrl-B (code 2) separator, and the serial, as a flat string.
local_label_name(Number, Serial) ->
  Chars = io_lib:format(".L~.10b\^B~.10b", [Number, Serial]),
  lists:flatten(Chars).
%% Append an instruction to the current section and advance dot by 4.
%% Dot must be a multiple of 4, otherwise an error is returned. Local label
%% references in the instruction's address are resolved by insn_fixup/2.
insn(Location, Tunit, #s_insn{} = Stmt) ->
  #tunit{cursect = Cursect} = Tunit,
  Section = tunit:get_section(Tunit, Cursect),
  #section{data = {stmts, Stmts}, dot = Dot} = Section,
  case Dot rem 4 of % FIXME: target-specific
    0 ->
      Fixed = insn_fixup(Tunit, Stmt),
      Updated = Section#section{ data = {stmts, [Fixed | Stmts]}
                               , dot = Dot + 4 % FIXME: target-specific
                               },
      {ok, tunit:put_section(Tunit, Updated)};
    _ ->
      fmterr(Location, "misaligned address for instruction", [])
  end.
%% Rewrite the instruction's address expression with expr_fixup/2.
insn_fixup(Tunit, Insn) ->
  Fixed = expr_fixup(Tunit, Insn#s_insn.address),
  Insn#s_insn{address = Fixed}.
%% Apply operand_fixup/2 to both operands of an expression.
expr_fixup(Tunit, Expr) ->
  #expr{operand1 = Left, operand2 = Right} = Expr,
  FixedLeft = operand_fixup(Tunit, Left),
  FixedRight = operand_fixup(Tunit, Right),
  Expr#expr{operand1 = FixedLeft, operand2 = FixedRight}.
%% Replace a local label reference {Number, Direction} by a generated name.
%% Direction $b refers to the serial currently recorded for Number, $f to the
%% one after it; any other direction fails with a case_clause error.
%% Operands of any other shape are returned unchanged.
operand_fixup(Tunit, {Number, Direction}) ->
  Recorded = local_label_serial(Tunit, Number),
  Offset =
    case Direction of
      $b -> 0;
      $f -> 1
    end,
  local_label_name(Number, Recorded + Offset);
operand_fixup(_Tunit, Operand) ->
  Operand.
%% Initialization --------------------------------------------------------------
%% Initial translation unit: created with ".text" as the current section
%% name, and with the predefined .text section stored in it.
tunit_init() ->
  #section{name = Name} = Text = section_dot_text(),
  tunit:put_section(tunit:new(Name), Text).
%% Predefined Sections ---------------------------------------------------------
%% Predefined section record for a well-known name, or `false` when the name
%% is not one of .data, .rodata or .text.
section_from_name(".data") -> section_dot_data();
section_from_name(".rodata") -> section_dot_rodata();
section_from_name(".text") -> section_dot_text();
section_from_name(_SectionName) -> false.
%% Empty ".comment" section: PROGBITS, mergeable strings, entry size 1,
%% alignment 1.
section_dot_comment() ->
  #section{ name = ".comment"
          , data = {stmts, []}
          , dot = 0
          , shndx = 0
          , sh_name = 0
          , sh_offset = 0
          , sh_info = 0
          , sh_link = ?SHN_UNDEF
          , sh_type = ?SHT_PROGBITS
          , sh_flags = ?SHF_MERGE bor ?SHF_STRINGS
          , sh_entsize = 1
          , sh_addralign = 1
          }.
%% Empty ".data" section: PROGBITS, allocated and writable, alignment 4.
section_dot_data() ->
  #section{ name = ".data"
          , data = {stmts, []}
          , dot = 0
          , shndx = 0
          , sh_name = 0
          , sh_offset = 0
          , sh_info = 0
          , sh_link = ?SHN_UNDEF
          , sh_type = ?SHT_PROGBITS
          , sh_flags = ?SHF_ALLOC bor ?SHF_WRITE
          , sh_entsize = 0
          , sh_addralign = 4 % FIXME: target-specific
          }.
%% Empty ".rodata" section: PROGBITS, allocated only, alignment 4.
section_dot_rodata() ->
  #section{ name = ".rodata"
          , data = {stmts, []}
          , dot = 0
          , shndx = 0
          , sh_name = 0
          , sh_offset = 0
          , sh_info = 0
          , sh_link = ?SHN_UNDEF
          , sh_type = ?SHT_PROGBITS
          , sh_flags = ?SHF_ALLOC
          , sh_entsize = 0
          , sh_addralign = 4 % FIXME: target-specific
          }.
%% Empty ".text" section: PROGBITS, allocated and executable, alignment 4.
section_dot_text() ->
  #section{ name = ".text"
          , data = {stmts, []}
          , dot = 0
          , shndx = 0
          , sh_name = 0
          , sh_offset = 0
          , sh_info = 0
          , sh_link = ?SHN_UNDEF
          , sh_type = ?SHT_PROGBITS
          , sh_flags = ?SHF_ALLOC bor ?SHF_EXECINSTR
          , sh_entsize = 0
          , sh_addralign = 4 % FIXME: target-specific
          }.
%% Error reporting -------------------------------------------------------------
%% Build an error return tagged with this module, carrying the source
%% location and an unformatted message; format_error/1 renders it.
fmterr({FileName, LineNr}, Fmt, Args) ->
  Reason = {FileName, LineNr, Fmt, Args},
  {error, {?MODULE, Reason}}.
%% Render an error reason built by fmterr/3 as "file F line N: <message>".
-spec format_error(term()) -> io_lib:chars().
format_error({FileName, LineNr, Fmt, Args}) ->
  FullFmt = "file ~s line ~p: " ++ Fmt,
  io_lib:format(FullFmt, [FileName, LineNr | Args]).

View File

@ -0,0 +1,467 @@
%%% -*- erlang-indent-level: 2 -*-
%%%
%%% input processing pass 1 for pdp10-elf as
%%% Copyright (C) 2013-2024 Mikael Pettersson
%%%
%%% This file is part of pdp10-tools.
%%%
%%% pdp10-tools is free software: you can redistribute it and/or modify
%%% it under the terms of the GNU General Public License as published by
%%% the Free Software Foundation, either version 3 of the License, or
%%% (at your option) any later version.
%%%
%%% pdp10-tools is distributed in the hope that it will be useful,
%%% but WITHOUT ANY WARRANTY; without even the implied warranty of
%%% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
%%% GNU General Public License for more details.
%%%
%%% You should have received a copy of the GNU General Public License
%%% along with pdp10-tools. If not, see <http://www.gnu.org/licenses/>.
-module(input_pass1).
-export([ format_error/1
, pass1/1
, section_dot_comment/0
, section_dot_text/0
]).
-export_type([ sectionsmap/0
]).
-include("tunit.hrl").
-include_lib("lib/include/pdp10_elf36.hrl").
%% Pass 1 ----------------------------------------------------------------------
%%
%% - scan, parse, annotate stmts with locations
%% - maintain current and previous section and subsection, and stack thereof
%% - interpret sectioning stmts, accumulate annotated stmts in subsections
-type sectionname() :: string().
-type subsectionnr() :: non_neg_integer().
%% a statement paired with the source location it was parsed at
-type locationandstmt() :: {scan:location(), stmt()}.
%% statements accumulated per subsection number
-type subsectionsmap() :: #{subsectionnr() => [locationandstmt()]}.
%% per section name: the section record and its subsections
-type sectionsmap() :: #{sectionname() => {#section{}, subsectionsmap()}}.
-type sectionandsub() :: {sectionname(), subsectionnr()}.

%% Pass 1 state.
%% - sections_map: every section entered so far
%% - stack: saved {Current, Previous} pairs, pushed by ctx_section/7 and
%%   popped by ctx_try_popsection/1
%% - current: section and subsection currently receiving statements
%% - previous: section and subsection that was current before the last
%%   switch, or [] when there has been no switch yet (see ctx_init/0)
%% - stmts: statements of the current subsection, most recent first
-record(ctx,
        { sections_map :: sectionsmap()
          %% Previous is saved as-is by ctx_section/7, so it may still be []
        , stack :: [{Current :: sectionandsub(), Previous :: sectionandsub() | []}]
        , current :: sectionandsub()
        , previous :: sectionandsub() | []
        , stmts :: [locationandstmt()]
        }).
%% Run pass 1 over the given input files, in order, sharing one context so
%% that section state carries over from one file to the next.
-spec pass1([string()]) -> {ok, sectionsmap()} | {error, {module(), term()}}.
pass1(Files) ->
  InitialCtx = ctx_init(),
  pass1_files(Files, InitialCtx).
%% Process each file with pass1_file/2, threading the context through.
%% After the last file the context is finalised into the sections map.
%% Stops at the first error.
pass1_files([File | Rest], Ctx0) ->
  case pass1_file(File, Ctx0) of
    {error, _Reason} = Failure -> Failure;
    {ok, Ctx1} -> pass1_files(Rest, Ctx1)
  end;
pass1_files([], Ctx) ->
  {ok, ctx_fini(Ctx)}.
%% Open one input, process all of its statements, and close it again.
%% The scan state is closed whether processing succeeds, returns an error,
%% or raises an exception.
pass1_file(File, Ctx) ->
  case scan_state_open(File) of
    {error, _Reason} = Failure ->
      Failure;
    {ok, ScanState} ->
      try
        pass1_process(ScanState, Ctx)
      after
        scan:fclose(ScanState)
      end
  end.
%% Parse and handle statements until end of input.
%% Returns {ok, Ctx} at eof, or the first parse or statement error.
pass1_process(ScanState, Ctx0) ->
  case parse:stmt(ScanState) of
    {ok, {Location, Stmt}} ->
      case pass1_stmt(Location, Ctx0, Stmt) of
        {error, _Reason} = Failure -> Failure;
        {ok, Ctx1} -> pass1_process(ScanState, Ctx1)
      end;
    eof ->
      {ok, Ctx0};
    {error, _Reason} = Failure ->
      Failure
  end.
%% Handle one statement in pass 1. Sectioning statements are interpreted
%% here; every other statement is appended, with its location, to the
%% current subsection.
pass1_stmt(Location, Ctx, #s_dot_data{} = Stmt) ->
  dot_data(Location, Ctx, Stmt);
pass1_stmt(Location, Ctx, #s_dot_popsection{} = Stmt) ->
  dot_popsection(Location, Ctx, Stmt);
pass1_stmt(Location, Ctx, #s_dot_previous{} = Stmt) ->
  dot_previous(Location, Ctx, Stmt);
pass1_stmt(Location, Ctx, #s_dot_section{} = Stmt) ->
  dot_section(Location, Ctx, Stmt);
pass1_stmt(Location, Ctx, #s_dot_subsection{} = Stmt) ->
  dot_subsection(Location, Ctx, Stmt);
pass1_stmt(Location, Ctx, #s_dot_text{} = Stmt) ->
  dot_text(Location, Ctx, Stmt);
pass1_stmt(Location, Ctx, Stmt) ->
  {ok, ctx_append(Ctx, Location, Stmt)}.
%% .data <nr>: switch to the given subsection of ".data". Cannot fail.
dot_data(Location, Ctx0, #s_dot_data{nr = Nr}) ->
  Ctx = ctx_data(Ctx0, Location, Nr),
  {ok, Ctx}.
%% .popsection: restore the section state saved on top of the section stack;
%% an empty stack is reported as an error at Location.
dot_popsection(Location, Ctx, #s_dot_popsection{}) ->
  case ctx_try_popsection(Ctx) of
    false -> fmterr(Location, ".popsection with empty section stack", []);
    {ok, _NewCtx} = Popped -> Popped
  end.
%% .previous: swap the current and previous section; an error is reported at
%% Location when there is no previous section.
%% NOTE(review): the message mentions the section stack, but
%% ctx_try_previous/1 checks the context's `previous` field - confirm wording.
dot_previous(Location, Ctx, #s_dot_previous{}) ->
  case ctx_try_previous(Ctx) of
    false -> fmterr(Location, ".previous with empty section stack", []);
    {ok, _NewCtx} = Swapped -> Swapped
  end.
%% Unpack a section statement and hand its fields to ctx_section/7, whose
%% {ok, Ctx} or {error, Reason} result is returned as-is.
dot_section(Location, Ctx, Stmt) ->
  #s_dot_section{ name = Name
                , nr = NrOpt
                , sh_flags = Flags
                , sh_type = Type
                , sh_entsize = EntSize
                } = Stmt,
  ctx_section(Ctx, Location, Name, NrOpt, Flags, Type, EntSize).
%% .subsection <nr>: switch subsection within the current section.
%% Cannot fail.
dot_subsection(_Location, Ctx0, #s_dot_subsection{nr = Nr}) ->
  Ctx = ctx_subsection(Ctx0, Nr),
  {ok, Ctx}.
%% .text <nr>: switch to the given subsection of ".text". Cannot fail.
dot_text(Location, Ctx0, #s_dot_text{nr = Nr}) ->
  Ctx = ctx_text(Ctx0, Location, Nr),
  {ok, Ctx}.
%% Context utilities
%% INV: any section name in current/previous/stack is bound in sections_map
%% Initial context: only the predefined .text section exists, subsection 0 of
%% it is current, and there is neither a previous section nor a saved stack.
ctx_init() ->
  Name = ".text",
  #ctx{ sections_map = #{Name => {section_dot_text(), #{}}}
      , stack = []
      , current = {Name, 0}
      , previous = []
      , stmts = []
      }.
%% Flush the statements of the current subsection and return the resulting
%% sections map.
ctx_fini(Ctx) ->
  Flushed = ctx_flush(Ctx),
  Flushed#ctx.sections_map.
%% Store the pending statements under the current subsection number of the
%% current section. The other context fields, including `stmts`, are left
%% unchanged.
ctx_flush(Ctx) ->
  #ctx{ sections_map = Sections0
      , current = {Name, Nr}
      , stmts = Stmts
      } = Ctx,
  {Section, Subsections0} = maps:get(Name, Sections0), % must exist
  Subsections = Subsections0#{Nr => Stmts},
  Ctx#ctx{sections_map = Sections0#{Name => {Section, Subsections}}}.
%% Implements .popsection: after flushing, restore current and previous from
%% the top of the stack and reload the statements of the restored subsection.
%% Returns `false` when the stack is empty.
ctx_try_popsection(Ctx0) ->
  Flushed = ctx_flush(Ctx0),
  case Flushed#ctx.stack of
    [{{Name, Nr} = Current, Previous} | Rest] ->
      Stmts = get_subsection(Name, Nr, Flushed#ctx.sections_map),
      {ok, Flushed#ctx{ stack = Rest
                      , current = Current
                      , previous = Previous
                      , stmts = Stmts
                      }};
    [] ->
      false
  end.
%% Implements .previous: after flushing, swap current and previous and reload
%% the statements of the subsection that becomes current.
%% Returns `false` when there is no previous section.
ctx_try_previous(Ctx0) ->
  Flushed = ctx_flush(Ctx0),
  case Flushed#ctx.previous of
    {Name, Nr} = Previous ->
      Stmts = get_subsection(Name, Nr, Flushed#ctx.sections_map),
      {ok, Flushed#ctx{ current = Previous
                      , previous = Flushed#ctx.current
                      , stmts = Stmts
                      }};
    [] ->
      false
  end.
%% Switch to a named section, creating it or updating its attributes as
%% needed. When SubsectionNrOpt is `false`, subsection 0 is entered and the
%% stack is left alone; otherwise the given subsection is entered and the old
%% {Current, Previous} pair is pushed on the stack (the pushsection case).
%% Returns {ok, Ctx}, or the error from enter_section/7 when the requested
%% attributes conflict with the existing section.
ctx_section(Ctx0, Location, SectionName, SubsectionNrOpt,
            ShFlags, ShType, ShEntSize) ->
  IsPush = SubsectionNrOpt =/= false,
  Nr =
    case IsPush of
      true -> SubsectionNrOpt;
      false -> 0
    end,
  Flushed = ctx_flush(Ctx0),
  #ctx{ sections_map = Sections0
      , stack = Stack0
      , current = Current
      , previous = Previous
      } = Flushed,
  case enter_section(Location, SectionName, Nr, Sections0,
                     ShFlags, ShType, ShEntSize) of
    {error, _Reason} = Failure ->
      Failure;
    {ok, {Stmts, Sections}} ->
      Stack =
        case IsPush of
          true -> [{Current, Previous} | Stack0];
          false -> Stack0
        end,
      {ok, Flushed#ctx{ sections_map = Sections
                      , stack = Stack
                      , current = {SectionName, Nr}
                      , previous = Current
                      , stmts = Stmts
                      }}
  end.
%% Implements .subsection <nr>: after flushing, stay in the current section
%% but continue in subsection SubsectionNr; the old position becomes previous.
ctx_subsection(Ctx0, SubsectionNr) ->
  Flushed = ctx_flush(Ctx0),
  {Name, _OldNr} = Old = Flushed#ctx.current,
  Stmts = enter_subsection(Name, SubsectionNr, Flushed#ctx.sections_map),
  Flushed#ctx{ current = {Name, SubsectionNr}
             , previous = Old
             , stmts = Stmts
             }.
%% Implements .data <nr> by entering the ".data" section.
ctx_data(Ctx, Location, SubsectionNr) ->
  DataSection = ".data",
  ctx_enter_section(Ctx, Location, DataSection, SubsectionNr).
%% Implements .text <nr> by entering the ".text" section.
ctx_text(Ctx, Location, SubsectionNr) ->
  TextSection = ".text",
  ctx_enter_section(Ctx, Location, TextSection, SubsectionNr).
%% Switch to a known system section, e.g. .data or .text.
%% No attributes are requested from enter_section/4, so the update is
%% expected to succeed; the match on {ok, _} asserts that.
ctx_enter_section(Ctx0, Location, SectionName, SubsectionNr) ->
  Flushed = ctx_flush(Ctx0),
  #ctx{sections_map = Sections0, current = Old} = Flushed,
  {ok, {Stmts, Sections}} =
    enter_section(Location, SectionName, SubsectionNr, Sections0),
  Flushed#ctx{ sections_map = Sections
             , current = {SectionName, SubsectionNr}
             , previous = Old
             , stmts = Stmts
             }.
%% Prepend a located statement to the pending statements, so the list is
%% kept most-recent-first.
ctx_append(Ctx, Location, Stmt) ->
  Ctx#ctx{stmts = [{Location, Stmt} | Ctx#ctx.stmts]}.
%% enter_section/7 without attribute requests: flags, type and entry size
%% are all passed as 0, which the update_sh_* helpers treat as "no change".
enter_section(Location, SectionName, SubsectionNr, SectionsMap) ->
  NoFlags = 0,
  NoType = 0,
  NoEntSize = 0,
  enter_section(Location, SectionName, SubsectionNr, SectionsMap,
                NoFlags, NoType, NoEntSize).
%% Look up or create the section, apply the requested attributes, and store
%% the result in the sections map.
%% Returns {ok, {Stmts, SectionsMap}}, where Stmts are the statements already
%% accumulated for SubsectionNr ([] when none), or the attribute update error.
enter_section(Location, SectionName, SubsectionNr, SectionsMap0,
              ShFlags, ShType, ShEntSize) ->
  {Section0, Subsections} = get_section(SectionName, SectionsMap0),
  case update_section(Location, Section0, ShFlags, ShType, ShEntSize) of
    {error, _Reason} = Failure ->
      Failure;
    {ok, Section} ->
      SectionsMap = SectionsMap0#{SectionName => {Section, Subsections}},
      Stmts = maps:get(SubsectionNr, Subsections, []),
      {ok, {Stmts, SectionsMap}}
  end.
%% Return {Section, SubsectionsMap} for a section name.
%% A section already in the map is returned as stored. Otherwise a new entry
%% with no subsections is built, from the predefined record when the name is
%% well-known and from make_section/1 when it is not. The map is not updated.
get_section(SectionName, SectionsMap) ->
  case maps:get(SectionName, SectionsMap, false) of
    false ->
      Section =
        case section_from_name(SectionName) of
          false -> make_section(SectionName);
          #section{} = Predefined -> Predefined
        end,
      {Section, #{}};
    {_Section, _SubsectionsMap} = Known ->
      Known
  end.
%% Blank record for a section that is not predefined: no statements, no
%% attributes, alignment 1.
make_section(SectionName) ->
  #section{ name = SectionName
          , data = {stmts, []}
          , dot = 0
          , shndx = 0
          , sh_name = 0
          , sh_offset = 0
          , sh_info = 0
          , sh_link = ?SHN_UNDEF
          , sh_addralign = 1
            %% update_section/5 will set sh_flags, sh_type, and sh_entsize
          , sh_flags = 0
          , sh_type = 0
          , sh_entsize = 0
          }.
%% Apply the requested flags, type and entry size to a section, in that
%% order. The first step that reports {error, _} stops the chain and its
%% error is returned; otherwise the result of the last step is returned.
update_section(Location, Section0, ShFlags, ShType, ShEntSize) ->
  Updaters =
    [ fun(Section) -> update_sh_flags(Location, Section, ShFlags) end
    , fun(Section) -> update_sh_type(Location, Section, ShType) end
    , fun(Section) -> update_sh_entsize(Location, Section, ShEntSize) end
    ],
  lists:foldl(
    fun(Updater, {ok, Section}) -> Updater(Section);
       (_Updater, {error, _Reason} = Error) -> Error
    end,
    {ok, Section0},
    Updaters).
%% Merge requested section flags into a section.
%%
%% - 0 requested: nothing to do.
%% - section has no flags yet: take the requested ones.
%% - requested equals existing: nothing to do.
%% - otherwise the requested flags are or-ed in if may_update_sh_flags/2
%%   permits it, else an error is returned.
update_sh_flags(_Location, Section, 0) ->
  {ok, Section};
update_sh_flags(Location, Section, Requested) ->
  case Section#section.sh_flags of
    0 ->
      {ok, Section#section{sh_flags = Requested}};
    Requested ->
      {ok, Section};
    Existing ->
      case may_update_sh_flags(Section, Requested) of
        false -> fmterr(Location, "cannot change section flags", []);
        true -> {ok, Section#section{sh_flags = Existing bor Requested}}
      end
  end.
%% Decide whether ShFlags may be added to a section that already has
%% different flags.
%%
%% Processor and application-specific flags may be added to an existing
%% section. The range of application-specific flags isn't defined in the
%% ELF spec: we interpret that as any flag outside of the reserved ranges.
%% Besides that, exactly SHF_ALLOC may be added to .interp, .strtab and
%% .symtab, and exactly SHF_EXECINSTR may be added to .note.GNU-stack.
may_update_sh_flags(Section, ShFlags) ->
  ReservedMask = (?SHF_COMPRESSED * 2 - 1) bor ?SHF_MASKOS,
  (ShFlags band ReservedMask) =:= 0
    orelse (ShFlags =:= ?SHF_ALLOC
            andalso lists:member(Section#section.name,
                                 [".interp", ".strtab", ".symtab"]))
    orelse (ShFlags =:= ?SHF_EXECINSTR
            andalso Section#section.name =:= ".note.GNU-stack").
%% Set the section type. A requested type of 0 means "unspecified" and
%% changes nothing; a section whose type is still 0 takes the requested one;
%% re-stating the same type is accepted; anything else is an error.
update_sh_type(_Location, Section, 0) ->
  {ok, Section};
update_sh_type(Location, Section, ShType) ->
  Current = Section#section.sh_type,
  if
    Current =:= 0 -> {ok, Section#section{sh_type = ShType}};
    Current =:= ShType -> {ok, Section};
    true -> fmterr(Location, "cannot change section type", [])
  end.
%% Set the section element size. A requested size of 0 means "unspecified"
%% and changes nothing; a section whose size is still 0 takes the requested
%% one; re-stating the same size is accepted; anything else is an error.
update_sh_entsize(_Location, Section, 0) ->
  {ok, Section};
update_sh_entsize(Location, Section, ShEntSize) ->
  Current = Section#section.sh_entsize,
  if
    Current =:= 0 -> {ok, Section#section{sh_entsize = ShEntSize}};
    Current =:= ShEntSize -> {ok, Section};
    true -> fmterr(Location, "cannot change section element size", [])
  end.
%% Fetch the stmts recorded so far for a subsection of an existing section.
%% The section must be present in the map; the subsection may be absent, in
%% which case [] is returned.
enter_subsection(SectionName, SubsectionNr, SectionsMap) ->
  {_Section, Subsections} = maps:get(SectionName, SectionsMap),
  case maps:find(SubsectionNr, Subsections) of
    {ok, Stmts} -> Stmts;
    error -> []
  end.
%% Fetch the stmts of a subsection; both the section and the subsection
%% must already exist (maps:get/2 raises otherwise).
get_subsection(SectionName, SubsectionNr, SectionsMap) ->
  {_Section, Subsections} = maps:get(SectionName, SectionsMap),
  Stmts = maps:get(SubsectionNr, Subsections),
  Stmts.
%% Scan state utilities
%% Open a scan state for an input file name. Both "--" and "-" select
%% scan:stdin/0; every other name is opened with scan:fopen/1.
scan_state_open("--") -> scan:stdin();
scan_state_open("-") -> scan:stdin();
scan_state_open(File) -> scan:fopen(File).
%% Predefined Sections ---------------------------------------------------------
%% Map a section name to its predefined section record, or false when the
%% name has no predefined template.
section_from_name(".data") -> section_dot_data();
section_from_name(".rodata") -> section_dot_rodata();
section_from_name(".text") -> section_dot_text();
section_from_name(_SectionName) -> false.
%% Predefined ".comment" section: PROGBITS, mergeable strings with an
%% element size of 1. All other fields keep the make_section/1 values.
-spec section_dot_comment() -> #section{}.
section_dot_comment() ->
  Blank = make_section(".comment"),
  Blank#section{ sh_type = ?SHT_PROGBITS
               , sh_flags = ?SHF_MERGE bor ?SHF_STRINGS
               , sh_entsize = 1
               }.
%% Predefined ".data" section: PROGBITS, allocated and writable, aligned
%% to 4. All other fields keep the make_section/1 values.
-spec section_dot_data() -> #section{}.
section_dot_data() ->
  Blank = make_section(".data"),
  Blank#section{ sh_type = ?SHT_PROGBITS
               , sh_flags = ?SHF_ALLOC bor ?SHF_WRITE
               , sh_addralign = 4 % FIXME: target-specific
               }.
%% Predefined ".rodata" section: PROGBITS, allocated (not writable),
%% aligned to 4. All other fields keep the make_section/1 values.
-spec section_dot_rodata() -> #section{}.
section_dot_rodata() ->
  Blank = make_section(".rodata"),
  Blank#section{ sh_type = ?SHT_PROGBITS
               , sh_flags = ?SHF_ALLOC
               , sh_addralign = 4 % FIXME: target-specific
               }.
%% Predefined ".text" section: PROGBITS, allocated and executable, aligned
%% to 4. All other fields keep the make_section/1 values.
-spec section_dot_text() -> #section{}.
section_dot_text() ->
  Blank = make_section(".text"),
  Blank#section{ sh_type = ?SHT_PROGBITS
               , sh_flags = ?SHF_ALLOC bor ?SHF_EXECINSTR
               , sh_addralign = 4 % FIXME: target-specific
               }.
%% Error reporting -------------------------------------------------------------
%% Build an error return tagged with this module, so that the reason can
%% later be rendered by this module's format_error/1.
fmterr({FileName, LineNr}, Fmt, Args) ->
  Reason = {FileName, LineNr, Fmt, Args},
  {error, {?MODULE, Reason}}.
%% Render an error reason produced by fmterr/3 as
%% "file <name> line <nr>: <message>".
%%
%% The file name is formatted with ~ts rather than ~s: ~s raises badarg for
%% a string containing code points above 255, which would turn a
%% diagnostic about a Unicode-named file into a crash. Output for Latin-1
%% names is unchanged.
-spec format_error(term()) -> io_lib:chars().
format_error({FileName, LineNr, Fmt, Args}) ->
  io_lib:format("file ~ts line ~p: " ++ Fmt, [FileName, LineNr | Args]).

View File

@ -0,0 +1,333 @@
%%% -*- erlang-indent-level: 2 -*-
%%%
%%% input processing pass 2 for pdp10-elf as
%%% Copyright (C) 2013-2024 Mikael Pettersson
%%%
%%% This file is part of pdp10-tools.
%%%
%%% pdp10-tools is free software: you can redistribute it and/or modify
%%% it under the terms of the GNU General Public License as published by
%%% the Free Software Foundation, either version 3 of the License, or
%%% (at your option) any later version.
%%%
%%% pdp10-tools is distributed in the hope that it will be useful,
%%% but WITHOUT ANY WARRANTY; without even the implied warranty of
%%% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
%%% GNU General Public License for more details.
%%%
%%% You should have received a copy of the GNU General Public License
%%% along with pdp10-tools. If not, see <http://www.gnu.org/licenses/>.
-module(input_pass2).
-export([ format_error/1
, pass2/1
]).
-include("tunit.hrl").
-include_lib("lib/include/pdp10_elf36.hrl").
%% Pass 2 ----------------------------------------------------------------------
%%
%% - process subsections in order
%% - interpret stmts
%% Entry point of pass 2: walk every section collected by pass 1, starting
%% from a freshly initialised translation unit.
-spec pass2(input_pass1:sectionsmap()) -> {ok, #tunit{}} | {error, {module(), term()}}.
pass2(SectionsMap) ->
  Sections = maps:to_list(SectionsMap),
  InitialTunit = tunit_init(),
  pass2_sections(Sections, InitialTunit).
%% Process the sections one at a time: register the section in the tunit,
%% make it the current section, then process its subsections. Stops at the
%% first error.
pass2_sections([], Tunit) ->
  {ok, Tunit};
pass2_sections([{SectionName, {Section, SubsectionsMap}} | Rest], Tunit0) ->
  Tunit1 = tunit:put_section(Tunit0, Section),
  Tunit2 = Tunit1#tunit{cursect = SectionName},
  case pass2_subsections(SectionName, SubsectionsMap, Tunit2) of
    {error, _Reason} = Error -> Error;
    {ok, Tunit3} -> pass2_sections(Rest, Tunit3)
  end.
%% Process all subsections of one section in ascending subsection number.
pass2_subsections(SectionName, SubsectionsMap, Tunit) ->
  %% Only names starting with one of these prefixes get past this point.
  %% NOTE(review): any other section name raises case_clause here rather
  %% than returning {error, _} -- confirm that is the intended way to
  %% reject unsupported sections.
  case SectionName of
    ".data" ++ _ -> ok;
    ".debug" ++ _ -> ok;
    ".rodata" ++ _ -> ok;
    ".text" ++ _ -> ok
  end,
  Unordered = maps:to_list(SubsectionsMap),
  Ordered = lists:sort(Unordered),
  pass2_subsections(Ordered, Tunit).
%% Process a list of {SubsectionNr, Stmts} pairs in the given order. Each
%% stmts list is reversed before processing (ctx_append-style accumulation
%% in pass 1 leaves it in reverse order). Stops at the first error.
pass2_subsections([], Tunit) ->
  {ok, Tunit};
pass2_subsections([{_SubsectionNr, StmtsRev} | Rest], Tunit) ->
  Stmts = lists:reverse(StmtsRev),
  case pass2_stmts(Stmts, Tunit) of
    {error, _Reason} = Error ->
      Error;
    {ok, NewTunit} ->
      %% GAS documentation states that each sub-section is padded to make its
      %% size a multiple of 4 bytes, but also that other implementations may
      %% do differently. We do not insert any implicit padding.
      pass2_subsections(Rest, NewTunit)
  end.
%% Interpret located stmts in order, threading the tunit through; stops at
%% and returns the first error.
pass2_stmts([], Tunit) ->
  {ok, Tunit};
pass2_stmts([{Location, Stmt} | Rest], Tunit) ->
  case pass2_stmt(Location, Tunit, Stmt) of
    {error, _Reason} = Error -> Error;
    {ok, NewTunit} -> pass2_stmts(Rest, NewTunit)
  end.
%% Dispatch one stmt to its handler, selected by the stmt's record type.
%% A stmt of any other type is not handled and makes the call fail.
pass2_stmt(Location, Tunit, #s_dot_ascii{} = Stmt) -> dot_ascii(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_byte{} = Stmt) -> dot_byte(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_file{} = Stmt) -> dot_file(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_globl{} = Stmt) -> dot_globl(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_ident{} = Stmt) -> dot_ident(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_long{} = Stmt) -> dot_long(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_short{} = Stmt) -> dot_short(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_size{} = Stmt) -> dot_size(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_type{} = Stmt) -> dot_type(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_2byte{} = Stmt) -> dot_2byte(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_dot_4byte{} = Stmt) -> dot_4byte(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_label{} = Stmt) -> label(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_local_label{} = Stmt) -> local_label(Location, Tunit, Stmt);
pass2_stmt(Location, Tunit, #s_insn{} = Stmt) -> insn(Location, Tunit, Stmt).
%% Handle an #s_dot_ascii{} stmt: append it to the current section and
%% advance dot by the total length of its strings, plus one per string when
%% the stmt's z field is true.
dot_ascii(_Location, Tunit, #s_dot_ascii{z = Z, strings = Strings} = Stmt) ->
  Section = tunit:get_section(Tunit, Tunit#tunit.cursect),
  #section{data = {stmts, Stmts}, dot = Dot} = Section,
  CharCount = lists:sum([length(String) || String <- Strings]),
  Size =
    case Z of
      false -> CharCount;
      true -> CharCount + length(Strings)
    end,
  Updated = Section#section{data = {stmts, [Stmt | Stmts]}, dot = Dot + Size},
  {ok, tunit:put_section(Tunit, Updated)}.
%% Handle .byte: 1 byte per expression, no alignment requirement.
dot_byte(Location, Tunit, #s_dot_byte{} = Directive) ->
  GetExprs = fun(S) -> S#s_dot_byte.exprs end,
  SetExprs = fun(S, Exprs) -> S#s_dot_byte{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Directive, _Size = 1, _Align = 1,
                         ".byte", GetExprs, SetExprs).
%% Handle .file: record a local STT_FILE symbol named after the given
%% string, absolute (section abs / SHN_ABS) with value and size 0.
dot_file(_Location, Tunit, #s_dot_file{string = FileName}) ->
  StInfo = ?ELF_ST_INFO(?STB_LOCAL, ?STT_FILE),
  FileSymbol =
    #symbol{ name = FileName
           , section = abs
           , st_shndx = ?SHN_ABS
           , st_info = StInfo
           , st_value = 0
           , st_size = 0
           , st_name = 0
           },
  {ok, tunit:put_symbol(Tunit, FileSymbol)}.
%% Handle .globl: give the named symbol global binding.
%%
%% An unknown symbol is created as an undefined global (section, value and
%% size all false). A known local symbol is promoted to global keeping its
%% type; an already-global symbol is left alone; any other binding is an
%% error.
dot_globl(Location, Tunit, #s_dot_globl{name = Name}) ->
  case tunit:get_symbol(Tunit, Name) of
    #symbol{st_info = StInfo} = Known ->
      case ?ELF_ST_BIND(StInfo) of
        ?STB_GLOBAL ->
          {ok, Tunit};
        ?STB_LOCAL -> % FIXME: assumed local-by-default, are there hard-local symbols?
          GlobalInfo = ?ELF_ST_INFO(?STB_GLOBAL, ?ELF_ST_TYPE(StInfo)),
          {ok, tunit:put_symbol(Tunit, Known#symbol{st_info = GlobalInfo})};
        Bind ->
          fmterr(Location, "symbol ~s has previous incompatible binding type ~p", [Name, Bind])
      end;
    false ->
      Undefined =
        #symbol{ name = Name
               , st_info = ?ELF_ST_INFO(?STB_GLOBAL, ?STT_NOTYPE)
               , section = false
               , st_value = false
               , st_size = false
               , st_name = 0
               , st_shndx = 0
               },
      {ok, tunit:put_symbol(Tunit, Undefined)}
  end.
%% Handle .ident: append the stmt to the ".comment" section, creating that
%% section from input_pass1:section_dot_comment/0 if the tunit does not
%% have it yet. The current section and its dot are not touched.
dot_ident(_Location, Tunit, #s_dot_ident{} = Stmt) ->
  Comment =
    case tunit:get_section(Tunit, ".comment") of
      false -> input_pass1:section_dot_comment();
      Existing -> Existing
    end,
  #section{data = {stmts, Stmts}} = Comment,
  Updated = Comment#section{data = {stmts, [Stmt | Stmts]}},
  {ok, tunit:put_section(Tunit, Updated)}.
%% Handle .long: 4 bytes per expression, and dot must be aligned to the
%% same size.
dot_long(Location, Tunit, #s_dot_long{} = Directive) ->
  Bytes = 4, % FIXME: target-specific
  GetExprs = fun(S) -> S#s_dot_long.exprs end,
  SetExprs = fun(S, Exprs) -> S#s_dot_long{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Directive, Bytes, _Align = Bytes,
                         ".long", GetExprs, SetExprs).
%% Common implementation of the integer data directives.
%%
%% Size is the number of bytes per expression and Align the alignment dot
%% must already have; Lexeme is the directive's name for the error message.
%% GetExprs/SetExprs read and replace the expression list of the concrete
%% stmt record. On success the stmt, with its expressions passed through
%% expr_fixup/2, is appended to the current section and dot advances by
%% Size per expression. A misaligned dot yields an error.
integer_data_directive(Location, Tunit, Stmt, Size, Align, Lexeme, GetExprs, SetExprs) ->
  Exprs = GetExprs(Stmt),
  Section = tunit:get_section(Tunit, Tunit#tunit.cursect),
  #section{data = {stmts, Stmts}, dot = Dot} = Section,
  case Dot rem Align =:= 0 of
    false ->
      fmterr(Location, "misaligned address for ~s", [Lexeme]);
    true ->
      FixedExprs = [expr_fixup(Tunit, Expr) || Expr <- Exprs],
      FixedStmt = SetExprs(Stmt, FixedExprs),
      NewDot = Dot + Size * length(FixedExprs),
      Updated = Section#section{data = {stmts, [FixedStmt | Stmts]}, dot = NewDot},
      {ok, tunit:put_section(Tunit, Updated)}
  end.
%% Handle .short: 2 bytes per expression, and dot must be aligned to the
%% same size.
dot_short(Location, Tunit, #s_dot_short{} = Directive) ->
  Bytes = 2, % FIXME: target-specific
  GetExprs = fun(S) -> S#s_dot_short.exprs end,
  SetExprs = fun(S, Exprs) -> S#s_dot_short{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Directive, Bytes, _Align = Bytes,
                         ".short", GetExprs, SetExprs).
%% Handle .size: set the named symbol's size to the distance from its value
%% to the current dot.
%%
%% Errors are returned when the symbol already has a size, is not defined,
%% is defined in a section other than the current one, or lies beyond dot
%% (which would make the size negative).
dot_size(Location, Tunit, #s_dot_size{name = Name}) ->
  #tunit{cursect = Cursect} = Tunit,
  #section{dot = Dot} = tunit:get_section(Tunit, Cursect),
  case tunit:get_symbol(Tunit, Name) of
    #symbol{st_size = StSize} when StSize =/= false ->
      fmterr(Location, "size of symbol ~s already defined", [Name]);
    #symbol{section = false} ->
      %% Declared (.globl and .type create symbols with section = false) but
      %% no label has defined it yet. Without this clause such a symbol
      %% matched the section comparison below and was misreported as being
      %% defined in a different section.
      fmterr(Location, "symbol ~s not defined", [Name]);
    #symbol{section = Section} when Section =/= Cursect ->
      fmterr(Location, "symbol ~s not defined in same section as dot", [Name]);
    #symbol{st_value = StValue} = OldSymbol when StValue =< Dot -> % note: false > integer()
      Symbol = OldSymbol#symbol{st_size = Dot - StValue},
      {ok, tunit:put_symbol(Tunit, Symbol)};
    #symbol{st_value = StValue} when StValue =/= false, StValue > Dot ->
      fmterr(Location, "cannot make symbol ~s negative size", [Name]);
    _ ->
      %% no such symbol at all, or a symbol without a value
      fmterr(Location, "symbol ~s not defined", [Name])
  end.
%% Handle .type: give the named symbol the type STT_FUNC (function) or
%% STT_OBJECT (object).
%%
%% An unknown symbol is created as an undefined local of that type. A known
%% symbol that is still STT_NOTYPE gets the type while keeping its binding;
%% re-stating the same type is accepted; any other existing type is an
%% error.
dot_type(Location, Tunit, #s_dot_type{name = Name, type = Type}) ->
  StType =
    case Type of
      function -> ?STT_FUNC;
      object -> ?STT_OBJECT
    end,
  case tunit:get_symbol(Tunit, Name) of
    #symbol{st_info = StInfo} = Known ->
      case ?ELF_ST_TYPE(StInfo) of
        StType ->
          {ok, Tunit};
        ?STT_NOTYPE ->
          TypedInfo = ?ELF_ST_INFO(?ELF_ST_BIND(StInfo), StType),
          {ok, tunit:put_symbol(Tunit, Known#symbol{st_info = TypedInfo})};
        Other ->
          fmterr(Location, "symbol ~s has previous incompatible type ~p", [Name, Other])
      end;
    false ->
      Undefined =
        #symbol{ name = Name
               , st_info = ?ELF_ST_INFO(?STB_LOCAL, StType)
               , section = false
               , st_value = false
               , st_size = false
               , st_name = 0
               , st_shndx = 0
               },
      {ok, tunit:put_symbol(Tunit, Undefined)}
  end.
%% Handle .2byte: 2 bytes per expression, no alignment requirement
%% (unlike .short).
dot_2byte(Location, Tunit, #s_dot_2byte{} = Directive) ->
  Bytes = 2, % FIXME: target-specific
  GetExprs = fun(S) -> S#s_dot_2byte.exprs end,
  SetExprs = fun(S, Exprs) -> S#s_dot_2byte{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Directive, Bytes, _Align = 1,
                         ".2byte", GetExprs, SetExprs).
%% Handle .4byte: 4 bytes per expression, no alignment requirement
%% (unlike .long).
dot_4byte(Location, Tunit, #s_dot_4byte{} = Directive) ->
  Bytes = 4, % FIXME: target-specific
  GetExprs = fun(S) -> S#s_dot_4byte.exprs end,
  SetExprs = fun(S, Exprs) -> S#s_dot_4byte{exprs = Exprs} end,
  integer_data_directive(Location, Tunit, Directive, Bytes, _Align = 1,
                         ".4byte", GetExprs, SetExprs).
%% Handle a label: define the symbol at the current section and dot.
%% A symbol that exists but has neither section nor value yet is completed;
%% a symbol that is already defined is an error; an unknown name gets a new
%% symbol.
label(Location, Tunit, #s_label{name = Name}) ->
  case tunit:get_symbol(Tunit, Name) of
    false ->
      define_new_label(Tunit, Name);
    #symbol{section = false, st_value = false} = Declared ->
      define_label(Tunit, Declared);
    #symbol{} ->
      fmterr(Location, "label ~s already defined", [Name])
  end.
%% Create a brand-new symbol for Name and define it at the current dot.
%% section and st_value are placeholders that define_label/2 overwrites.
define_new_label(Tunit, Name) ->
  Blank =
    #symbol{ name = Name
           , section = false  % overridden by define_label/2
           , st_value = false % overridden by define_label/2
           , st_size = false
           , st_info = 0
           , st_name = 0
           , st_shndx = 0
           },
  define_label(Tunit, Blank).
%% Bind a symbol to the current section and that section's current dot,
%% and store it in the tunit.
define_label(Tunit, Symbol) ->
  #tunit{cursect = Cursect} = Tunit,
  #section{dot = Dot} = tunit:get_section(Tunit, Cursect),
  Defined = Symbol#symbol{section = Cursect, st_value = Dot},
  {ok, tunit:put_symbol(Tunit, Defined)}.
%% Handle a numeric local label: bump the serial recorded for this number,
%% remember it in the tunit, and define a symbol under the generated name.
local_label(_Location, Tunit0, #s_local_label{number = Number}) ->
  Serial = 1 + local_label_serial(Tunit0, Number),
  Name = local_label_name(Number, Serial),
  Tunit = tunit:put_local_label(Tunit0, Number, Serial),
  define_new_label(Tunit, Name).
%% Latest serial recorded for local label Number, or 0 when
%% tunit:get_local_label/2 reports none (false).
local_label_serial(Tunit, Number) ->
  Found = tunit:get_local_label(Tunit, Number),
  if
    Found =:= false -> 0;
    true -> Found
  end.
%% Symbol name for occurrence Serial of local label Number: ".L", the
%% number in decimal, a control-B character, then the serial in decimal.
local_label_name(Number, Serial) ->
  Chars = io_lib:format(".L~.10b\^B~.10b", [Number, Serial]),
  lists:flatten(Chars).
%% Handle an instruction: dot must be a multiple of 4; the instruction,
%% with its address passed through insn_fixup/2, is appended to the current
%% section and dot advances by 4.
insn(Location, Tunit, #s_insn{} = Stmt) ->
  Section = tunit:get_section(Tunit, Tunit#tunit.cursect),
  #section{data = {stmts, Stmts}, dot = Dot} = Section,
  case Dot rem 4 =:= 0 of % FIXME: target-specific
    false ->
      fmterr(Location, "misaligned address for instruction", []);
    true ->
      Fixed = insn_fixup(Tunit, Stmt),
      Updated =
        Section#section{ data = {stmts, [Fixed | Stmts]}
                       , dot = Dot + 4 % FIXME: target-specific
                       },
      {ok, tunit:put_section(Tunit, Updated)}
  end.
%% Replace the instruction's address expression by its fixed-up form.
insn_fixup(Tunit, Insn) ->
  Fixed = expr_fixup(Tunit, Insn#s_insn.address),
  Insn#s_insn{address = Fixed}.
%% Fix up both operands of an expression; operand1 is processed first.
expr_fixup(Tunit, Expr) ->
  #expr{operand1 = Operand1, operand2 = Operand2} = Expr,
  Fixed1 = operand_fixup(Tunit, Operand1),
  Fixed2 = operand_fixup(Tunit, Operand2),
  Expr#expr{operand1 = Fixed1, operand2 = Fixed2}.
%% Resolve a local-label reference {Number, Direction} to a symbol name.
%% Direction $b refers to the latest serial recorded for Number, $f to the
%% one after it. Any other operand is returned unchanged.
operand_fixup(Tunit, {Number, Direction}) ->
  Latest = local_label_serial(Tunit, Number),
  Wanted =
    case Direction of
      $f -> Latest + 1;
      $b -> Latest
    end,
  local_label_name(Number, Wanted);
operand_fixup(_Tunit, Other) ->
  Other.
%% Initialization --------------------------------------------------------------
%% Initial translation unit: created with the predefined .text section's
%% name as its argument to tunit:new/1, and with that section registered.
tunit_init() ->
  #section{name = Cursect} = Text = input_pass1:section_dot_text(),
  tunit:put_section(tunit:new(Cursect), Text).
%% Error reporting -------------------------------------------------------------
%% Build an error return tagged with this module, so that the reason can
%% later be rendered by this module's format_error/1.
fmterr({FileName, LineNr}, Fmt, Args) ->
  Reason = {FileName, LineNr, Fmt, Args},
  {error, {?MODULE, Reason}}.
%% Render an error reason produced by fmterr/3 as
%% "file <name> line <nr>: <message>".
%%
%% The file name is formatted with ~ts rather than ~s: ~s raises badarg for
%% a string containing code points above 255, which would turn a
%% diagnostic about a Unicode-named file into a crash. Output for Latin-1
%% names is unchanged.
-spec format_error(term()) -> io_lib:chars().
format_error({FileName, LineNr, Fmt, Args}) ->
  io_lib:format("file ~ts line ~p: " ++ Fmt, [FileName, LineNr | Args]).

View File

@ -1,6 +1,6 @@
%% -*- erlang -*- %% -*- erlang -*-
%% rebar.config for pdp10-tools %% rebar.config for pdp10-tools
%% Copyright (C) 2018-2023 Mikael Pettersson %% Copyright (C) 2018-2024 Mikael Pettersson
%% %%
%% This file is part of pdp10-tools. %% This file is part of pdp10-tools.
%% %%
@ -53,7 +53,8 @@
%% indirect calls to Module:format_error/1 %% indirect calls to Module:format_error/1
, {assemble, format_error, 1} , {assemble, format_error, 1}
, {elf2boot, format_error, 1} , {elf2boot, format_error, 1}
, {input, format_error, 1} , {input_pass1, format_error, 1}
, {input_pass2, format_error, 1}
, {ld, format_error, 1} , {ld, format_error, 1}
, {ld_input, format_error, 1} , {ld_input, format_error, 1}
, {ld_output, format_error, 1} , {ld_output, format_error, 1}