4 年之前 · 4d8e94bf5c
--- a/book.tex
+++ b/book.tex
@@ -7500,8 +7500,8 @@ language, whose syntax is defined in Figure~\ref{fig:x86-3}.
 
															 \Arg &::=&  \gray{  \INT{\Int} \mid \REG{\Reg}
														
 
															     \mid (\key{deref}\,\Reg\,\Int) } \\
														
 
															    &\mid& \gray{ (\key{byte-reg}\; \Reg) 
														
 
															-    \mid   (\key{global}\; \itm{name})  } \\
														
 
															-   &\mid& (\key{fun-ref}\; \itm{label})\\
														
 
															+   \mid   (\key{global}\; \itm{name})  }
														
 
															+   \mid (\key{fun-ref}\; \itm{label})\\
														
 
															 \itm{cc} & ::= & \gray{  \key{e} \mid \key{l} \mid \key{le} \mid \key{g} \mid \key{ge}  } \\
														
 
															 \Instr &::=& \gray{  (\key{addq} \; \Arg\; \Arg) \mid
														
 
															              (\key{subq} \; \Arg\; \Arg) \mid
														
@@ -7517,7 +7517,7 @@ language, whose syntax is defined in Figure~\ref{fig:x86-3}.
 
															        \mid (\key{j}\itm{cc} \; \itm{label})
														
 
															        \mid (\key{label} \; \itm{label})  } \\
														
 
															      &\mid& (\key{indirect-callq}\;\Arg ) \mid (\key{tail-jmp}\;\Arg) \\
														
 
															-     &\mid& (\key{leaq}\;\Arg\;\Arg)\\
														
 
															+     &\mid& (\key{leaq}\;\Arg\;\Reg)\\
														
 
															 \Block &::= & \gray{(\key{block} \;\itm{info}\; \Instr\ldots)} \\
														
 
															 \Def &::= & (\key{define} \; (\itm{label}) \;\itm{info}\; ((\itm{label} \,\key{.}\, \Block)\ldots))\\
														
 
															 x86_3 &::= & (\key{program} \;\itm{info} \;\Def\ldots)
														
@@ -7530,12 +7530,28 @@ x86_3 &::= & (\key{program} \;\itm{info} \;\Def\ldots)
 
															 \end{figure}
														
 
															 \begin{figure}[tp]
														
 
															-UNDER CONSTRUCTION
														
 
															+\fbox{
														
 
															+  \begin{minipage}{0.96\textwidth}
														
 
															+    \small
														
 
															+\[
														
 
															+\begin{array}{lcl}
														
 
															+  \Arg &::=&  \gray{  \INT{\Int} \mid \REG{\Reg} \mid \DEREF{\Reg}{\Int}
														
 
															+     \mid \BYTEREG{\Reg} } \\
														
 
															+     &\mid& \gray{ (\key{Global}~\Var) } \mid \FUNREF{\itm{label}} \\
														
 
															+  \Instr &::=& \ldots \mid \INDCALLQ{\itm{label}}
														
 
															+    \mid \TAILJMP{\Arg}\\
														
 
															+    &\mid& \BININSTR{\code{'leaq}}{\Arg}{\REG{\Reg}}\\
														
 
															+  \Def &::= & \DEF{\itm{label}}{([\Var\key{:}\Type]\ldots)}{\Type}{((\itm{label}\,\key{.}\,\Block)\ldots)} \\
														
 
															+x86_3 &::= & \PROGRAMDEFS{\itm{info}}{(\Def\ldots)}
														
 
															+\end{array}
														
 
															+\]
														
 
															+\end{minipage}
														
 
															+}
														
 
															   \caption{The abstract syntax of x86$_3$ (extends x86$_2$ of Figure~\ref{fig:x86-2}).}
														
 
															 \label{fig:x86-3}
														
 
															 \end{figure}
														
 
															-\margincomment{TODO: abstract syntax for $x86_3$.}
														
 
															+
														
 
															 An assignment of a function reference to a variable becomes a
														
 
															 load-effective-address instruction as follows: \\
														
@@ -7598,12 +7614,16 @@ use for them. If you implemented the move-biasing challenge
 
															 (Section~\ref{sec:move-biasing}), the register allocator will try to
														
 
															 assign the parameter variables to the corresponding argument register,
														
 
															 in which case the \code{patch-instructions} pass will remove the
														
 
															-\code{movq} instruction. Also, note that the register allocator will
														
 
															-perform liveness analysis on this sequence of move instructions and
														
 
															-build the interference graph. So, for example, $x_1$ will be marked as
														
 
															-interfering with \code{rsi} and that will prevent the assignment of
														
 
															-$x_1$ to \code{rsi}, which is good, because that would overwrite the
														
 
															-argument that needs to move into $x_2$.
														
 
															+\code{movq} instruction. This happens in the example translation in
														
 
															+Figure~\ref{fig:add-fun} of Section~\ref{sec:functions-example}, in
														
 
															+the \code{add} function.
														
 
															+%
														
 
															+Also, note that the register allocator will perform liveness analysis
														
 
															+on this sequence of move instructions and build the interference
														
 
															+graph. So, for example, $x_1$ will be marked as interfering with
														
 
															+\code{rsi} and that will prevent the assignment of $x_1$ to
														
 
															+\code{rsi}, which is good, because that would overwrite the argument
														
 
															+that needs to move into $x_2$.
														
 
															 Next, consider the compilation of function calls. In the mirror image
														
 
															 of handling the parameters of function definitions, the arguments need
														
@@ -7664,7 +7684,7 @@ graph for each function (not just one for the whole program).
 
															 Recall that in Section~\ref{sec:reg-alloc-gc} we discussed the need to
														
 
															 spill vector-typed variables that are live during a call to the
														
 
															 \code{collect}.  With the addition of functions to our language, we
														
 
															-need to revisit this issue. Many functions will perform allocation and
														
 
															+need to revisit this issue. Many functions perform allocation and
														
 
															 therefore have calls to the collector inside of them. Thus, we should
														
 
															 not only spill a vector-typed variable when it is live during a call
														
 
															 to \code{collect}, but we should spill the variable if it is live
														
@@ -7680,35 +7700,100 @@ In \code{patch-instructions}, you should deal with the x86
 
															 idiosyncrasy that the destination argument of \code{leaq} must be a
														
 
															 register. Additionally, you should ensure that the argument of
														
 
															 \code{TailJmp} is \itm{rax}, our reserved register---this is to make
														
 
															-code generation more convenient, because we will be trampling many
														
 
															-registers before the tail call (as explained below).
														
 
															+code generation more convenient, because we trample many registers
														
 
															+before the tail call (as explained in the next section).
														
 
															 \section{Print x86}
														
 
															-For the \code{print-x86} pass, we recommend the following translations:
														
 
															+For the \code{print-x86} pass, the cases for \code{FunRef} and
														
 
															+\code{IndirectCallq} are straightforward: output their concrete
														
 
															+syntax.
														
 
															 \begin{lstlisting}
														
 
															   (FunRef |\itm{label}|) |$\Rightarrow$| |\itm{label}|(%rip)
														
 
															-  (IndirectCallq |\itm{arg}|) |$\Rightarrow$| callq *|\itm{arg}|
														
 
															+  (IndirectCallq |\itm{arg}|) |$\Rightarrow$| callq *|\itm{arg}'|
														
 
															 \end{lstlisting}
														
 
															-Handling \code{TailJmp} requires a bit more care. A straightforward
														
 
															-translation of \code{TailJmp} would be \code{jmp *$\itm{arg}$}, which
														
 
															-is what we will want to do, but before the jump we need to pop the
														
 
															-current frame. So we need to restore the state of the registers to the
														
 
															-point they were at when the current function was called.  This
														
 
															-sequence of instructions is the same as the code for the conclusion of
														
 
															-a function.
														
 
															+
														
 
															+The \code{TailJmp} node requires a bit work. A straightforward
														
 
															+translation of \code{TailJmp} would be \code{jmp *$\itm{arg}$}, but
														
 
															+before the jump we need to pop the current frame. This sequence of
														
 
															+instructions is the same as the code for the conclusion of a function,
														
 
															+except the \code{retq} is replaced with \code{jmp *$\itm{arg}$}.
														
 
															 Note that your \code{print-x86} pass needs to add the code for saving
														
 
															 and restoring callee-saved registers, if you have not already
														
 
															 implemented that. This is necessary when generating code for function
														
 
															 definitions.
														
 
															+\begin{exercise}\normalfont
														
 
															+Expand your compiler to handle $R_4$ as outlined in this chapter.
														
 
															+Create 5 new programs that use functions, including examples that pass
														
 
															+functions and return functions from other functions and including
														
 
															+recursive functions. Test your compiler on these new programs and all
														
 
															+of your previously created test programs.
														
 
															+\end{exercise}
														
 
															+
														
 
															+
														
 
															+\begin{figure}[tbp]
														
 
															+\begin{tikzpicture}[baseline=(current  bounding  box.center)]
														
 
															+\node (R4) at (0,2)  {\large $R_4$};
														
 
															+\node (R4-2) at (3,2)  {\large $R_4$};
														
 
															+\node (R4-3) at (6,2)  {\large $R_4$};
														
 
															+\node (F1-1) at (12,0)  {\large $F_1$};
														
 
															+\node (F1-2) at (9,0)  {\large $F_1$};
														
 
															+\node (F1-3) at (6,0)  {\large $F_1$};
														
 
															+\node (F1-4) at (3,0)  {\large $F_1$};
														
 
															+\node (C3-1) at (6,-2)  {\large $C_3$};
														
 
															+\node (C3-2) at (3,-2)  {\large $C_3$};
														
 
															+
														
 
															+\node (x86-2) at (3,-4)  {\large $\text{x86}^{*}_3$};
														
 
															+\node (x86-3) at (6,-4)  {\large $\text{x86}^{*}_3$};
														
 
															+\node (x86-4) at (9,-4) {\large $\text{x86}_3$};
														
 
															+\node (x86-5) at (9,-6) {\large $\text{x86}^{\dagger}_3$};
														
 
															+
														
 
															+\node (x86-2-1) at (3,-6)  {\large $\text{x86}^{*}_3$};
														
 
															+\node (x86-2-2) at (6,-6)  {\large $\text{x86}^{*}_3$};
														
 
															+
														
 
															+\path[->,bend left=15] (R4) edge [above] node
														
 
															+     {\ttfamily\footnotesize\color{red} typecheck} (R4-2);
														
 
															+\path[->,bend left=15] (R4-2) edge [above] node
														
 
															+     {\ttfamily\footnotesize uniquify} (R4-3);
														
 
															+\path[->,bend left=15] (R4-3) edge [right] node
														
 
															+     {\ttfamily\footnotesize\color{red} reveal-functions} (F1-1);
														
 
															+\path[->,bend left=15] (F1-1) edge [below] node
														
 
															+     {\ttfamily\footnotesize\color{red} limit-functions} (F1-2);
														
 
															+\path[->,bend right=15] (F1-2) edge [above] node
														
 
															+     {\ttfamily\footnotesize expose-alloc.} (F1-3);
														
 
															+\path[->,bend right=15] (F1-3) edge [above] node
														
 
															+     {\ttfamily\footnotesize\color{red} remove-complex.} (F1-4);
														
 
															+\path[->,bend left=15] (F1-4) edge [right] node
														
 
															+     {\ttfamily\footnotesize\color{red} explicate-control} (C3-1);
														
 
															+\path[->,bend left=15] (C3-1) edge [below] node
														
 
															+     {\ttfamily\footnotesize\color{red} uncover-locals} (C3-2);
														
 
															+\path[->,bend right=15] (C3-2) edge [left] node
														
 
															+     {\ttfamily\footnotesize\color{red} select-instr.} (x86-2);
														
 
															+\path[->,bend left=15] (x86-2) edge [left] node
														
 
															+     {\ttfamily\footnotesize\color{red} uncover-live} (x86-2-1);
														
 
															+\path[->,bend right=15] (x86-2-1) edge [below] node 
														
 
															+     {\ttfamily\footnotesize \color{red}build-inter.} (x86-2-2);
														
 
															+\path[->,bend right=15] (x86-2-2) edge [left] node
														
 
															+     {\ttfamily\footnotesize allocate-reg.} (x86-3);
														
 
															+\path[->,bend left=15] (x86-3) edge [above] node
														
 
															+     {\ttfamily\footnotesize\color{red} patch-instr.} (x86-4);
														
 
															+\path[->,bend right=15] (x86-4) edge [left] node {\ttfamily\footnotesize\color{red} print-x86} (x86-5);
														
 
															+\end{tikzpicture}
														
 
															+\caption{Diagram of the passes for $R_4$, a language with functions.}
														
 
															+\label{fig:R4-passes}
														
 
															+\end{figure}
														
 
															+
														
 
															+Figure~\ref{fig:R4-passes} gives an overview of the passes for
														
 
															+compiling $R_4$ to x86.
														
 
															+
														
 
															 \section{An Example Translation}
														
 
															+\label{sec:functions-example}
														
 
															 Figure~\ref{fig:add-fun} shows an example translation of a simple
														
 
															 function in $R_4$ to x86. The figure also includes the results of the
														
 
															-\code{explicate-control} and \code{select-instructions} passes.  We
														
 
															-have omitted the \code{HasType} AST nodes for readability.
														
 
															+\code{explicate-control} and \code{select-instructions} passes.
														
 
															 \begin{figure}[tbp]
														
 
															 \begin{tabular}{ll}
														
@@ -7805,68 +7890,7 @@ mainconclusion:
 
															 \label{fig:add-fun}
														
 
															 \end{figure}
														
 
															-\begin{exercise}\normalfont
														
 
															-Expand your compiler to handle $R_4$ as outlined in this chapter.
														
 
															-Create 5 new programs that use functions, including examples that pass
														
 
															-functions and return functions from other functions and including
														
 
															-recursive functions. Test your compiler on these new programs and all
														
 
															-of your previously created test programs.
														
 
															-\end{exercise}
														
 
															-
														
 
															-\begin{figure}[p]
														
 
															-\begin{tikzpicture}[baseline=(current  bounding  box.center)]
														
 
															-\node (R4) at (0,2)  {\large $R_4$};
														
 
															-\node (R4-2) at (3,2)  {\large $R_4$};
														
 
															-\node (R4-3) at (6,2)  {\large $R_4$};
														
 
															-\node (F1-1) at (12,0)  {\large $F_1$};
														
 
															-\node (F1-2) at (9,0)  {\large $F_1$};
														
 
															-\node (F1-3) at (6,0)  {\large $F_1$};
														
 
															-\node (F1-4) at (3,0)  {\large $F_1$};
														
 
															-\node (C3-1) at (6,-2)  {\large $C_3$};
														
 
															-\node (C3-2) at (3,-2)  {\large $C_3$};
														
 
															-
														
 
															-\node (x86-2) at (3,-4)  {\large $\text{x86}^{*}_3$};
														
 
															-\node (x86-3) at (6,-4)  {\large $\text{x86}^{*}_3$};
														
 
															-\node (x86-4) at (9,-4) {\large $\text{x86}_3$};
														
 
															-\node (x86-5) at (9,-6) {\large $\text{x86}^{\dagger}_3$};
														
 
															-
														
 
															-\node (x86-2-1) at (3,-6)  {\large $\text{x86}^{*}_3$};
														
 
															-\node (x86-2-2) at (6,-6)  {\large $\text{x86}^{*}_3$};
														
 
															-
														
 
															-\path[->,bend left=15] (R4) edge [above] node
														
 
															-     {\ttfamily\footnotesize\color{red} typecheck} (R4-2);
														
 
															-\path[->,bend left=15] (R4-2) edge [above] node
														
 
															-     {\ttfamily\footnotesize uniquify} (R4-3);
														
 
															-\path[->,bend left=15] (R4-3) edge [right] node
														
 
															-     {\ttfamily\footnotesize\color{red} reveal-functions} (F1-1);
														
 
															-\path[->,bend left=15] (F1-1) edge [below] node
														
 
															-     {\ttfamily\footnotesize\color{red} limit-functions} (F1-2);
														
 
															-\path[->,bend right=15] (F1-2) edge [above] node
														
 
															-     {\ttfamily\footnotesize expose-alloc.} (F1-3);
														
 
															-\path[->,bend right=15] (F1-3) edge [above] node
														
 
															-     {\ttfamily\footnotesize\color{red} remove-complex.} (F1-4);
														
 
															-\path[->,bend left=15] (F1-4) edge [right] node
														
 
															-     {\ttfamily\footnotesize\color{red} explicate-control} (C3-1);
														
 
															-\path[->,bend left=15] (C3-1) edge [below] node
														
 
															-     {\ttfamily\footnotesize\color{red} uncover-locals} (C3-2);
														
 
															-\path[->,bend right=15] (C3-2) edge [left] node
														
 
															-     {\ttfamily\footnotesize\color{red} select-instr.} (x86-2);
														
 
															-\path[->,bend left=15] (x86-2) edge [left] node
														
 
															-     {\ttfamily\footnotesize\color{red} uncover-live} (x86-2-1);
														
 
															-\path[->,bend right=15] (x86-2-1) edge [below] node 
														
 
															-     {\ttfamily\footnotesize \color{red}build-inter.} (x86-2-2);
														
 
															-\path[->,bend right=15] (x86-2-2) edge [left] node
														
 
															-     {\ttfamily\footnotesize allocate-reg.} (x86-3);
														
 
															-\path[->,bend left=15] (x86-3) edge [above] node
														
 
															-     {\ttfamily\footnotesize\color{red} patch-instr.} (x86-4);
														
 
															-\path[->,bend right=15] (x86-4) edge [left] node {\ttfamily\footnotesize\color{red} print-x86} (x86-5);
														
 
															-\end{tikzpicture}
														
 
															-\caption{Diagram of the passes for $R_4$, a language with functions.}
														
 
															-\label{fig:R4-passes}
														
 
															-\end{figure}
														
 
															-Figure~\ref{fig:R4-passes} gives an overview of the passes needed for
														
 
															-the compilation of $R_4$.
														
 
															 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
														
--- a/defs.tex
+++ b/defs.tex
@@ -68,10 +68,12 @@
 
															 \newcommand{\BININSTR}[3]{\key{(Instr}\;#1\;\key{(list}\;#2\;#3\key{))}}
														
 
															 \newcommand{\UNIINSTR}[2]{\key{(Instr}\;#1\;\key{(list}\;#2\key{))}}
														
 
															 \newcommand{\CALLQ}[1]{\key{(Callq}~#1\key{)}}
														
 
															+\newcommand{\INDCALLQ}[1]{\key{(IndirectCallq}~#1\key{)}}
														
 
															 \newcommand{\RETQ}{\key{(Retq)}}
														
 
															 \newcommand{\PUSHQ}[1]{\key{(Pushq}~#1\key{)}}
														
 
															 \newcommand{\POPQ}[1]{\key{(Popq}~#1\key{)}}
														
 
															 \newcommand{\JMP}[1]{\key{(Jmp}~#1\key{)}}
														
 
															+\newcommand{\TAILJMP}[1]{\key{(TailJmp}~#1\key{)}}
														
 
															 \newcommand{\JMPIF}[2]{\key{(JmpIf}~#1~#2\key{)}}