9 年前 · fcf4ac89d6
--- a/book.tex
+++ b/book.tex
@@ -15,7 +15,8 @@
 
				 
			
 
				 \lstset{%
			
 
				 language=Lisp,
			
 
				-basicstyle=\ttfamily\small
			
 
				+basicstyle=\ttfamily\small,
			
 
				+escapechar=@
			
 
				 }
			
 
				 
			
 
				 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
			
@@ -751,26 +752,21 @@ result.
 
				 \chapter{Register Allocation}
			
 
				 \label{ch:register-allocation}
			
 
				 
			
 
				+In Chapter~\ref{ch:int-exp} we simplified the generation of x86
			
 
				+assembly by placing all variables on the stack. We can improve the
			
 
				+performance of the generated code considerably if we instead try to
			
 
				+place as many variables as possible into registers.  The CPU can
			
 
				+access a register in a single cycle, whereas accessing the stack can
			
 
				+take from several cycles (to go to cache) to hundreds of cycles (to go
			
 
				+to main memory).  Figure~\ref{fig:reg-eg} shows a program with four
			
 
				+variables that serves as a running example. We show the source program
			
 
				+and also the output of instruction selection. At that point the
			
 
				+program is almost x86 assembly but not quite; it still contains
			
 
				+variables instead of stack locations or registers.
			
 
				 
			
 
				-% three new passes between instruction selection and spill code
			
 
				-% uncover-live
			
 
				-% build-interference
			
 
				-% allocate registers (uses assign-homes)
			
 
				-
			
 
				-\[
			
 
				-\xymatrix{
			
 
				-  C_0 \ar@/^/[r]^-{\textsf{select\_instr.}}
			
 
				-    & \text{x86}^{*} \ar[d]^-{\textsf{uncover\_live}} \\
			
 
				-    & \text{x86}^{*} \ar[d]^-{\textsf{build\_interference}} \\
			
 
				-    & \text{x86}^{*} \ar[d]_-{\textsf{allocate\_register}} \\
			
 
				-    & \text{x86}^{*} \ar@/^/[r]^-{\textsf{patch\_instr.}} 
			
 
				-    & \text{x86} 
			
 
				-}
			
 
				-\]
			
 
				-
			
 
				-% example
			
 
				-% some vars with disjoint live ranges: x y
			
 
				-% some vars with overlapping live ranges: z
			
 
				+\begin{figure}
			
 
				+\begin{minipage}{0.45\textwidth}
			
 
				+Source program:
			
 
				 \begin{lstlisting}
			
 
				 (let ([x 30])
			
 
				   (let ([z (+ x 4)])
			
@@ -778,8 +774,9 @@ result.
 
				       (let ([w (+ z 10)])
			
 
				         (- w y)))))
			
 
				 \end{lstlisting}
			
 
				-
			
 
				-after select instructions
			
 
				+\end{minipage}
			
 
				+\begin{minipage}{0.45\textwidth}
			
 
				+After instruction selection:
			
 
				 \begin{lstlisting}
			
 
				 (program (x z y w)
			
 
				   (mov (int 30) (var x))
			
@@ -791,50 +788,148 @@ after select instructions
 
				   (mov (var w) (reg rax))
			
 
				   (sub (var y) (reg rax)))
			
 
				 \end{lstlisting}
			
 
				+\end{minipage}
			
 
				+\caption{Program to serve as running example for this chapter.}
			
 
				+\label{fig:reg-eg}
			
 
				+\end{figure}
			
 
				+
			
 
				+
			
 
				+The goal of register allocation is to fit as many variables into
			
 
				+registers as possible. It is often the case that we have more
			
 
				+variables than registers, so we can't naively map each variable to a
			
 
				+register. Fortunately, it is also common for different variables to be
			
 
				+needed during different periods of time, and in such cases the
			
 
				+variables can be mapped to the same register.  Consider variables $x$
			
 
				+and $y$ in Figure~\ref{fig:reg-eg}.  After the variable $x$ is moved
			
 
				+to $z$ it is no longer needed.  Variable $y$, on the other hand, is
			
 
				+used only after this point, so $x$ and $y$ could share the same
			
 
				+register. The topic of the next section is how we compute where a
			
 
				+variable is needed.
			
 
				 
			
 
				 
			
 
				 \section{Liveness Analysis}
			
 
				 
			
 
				-\begin{lstlisting}
			
 
				-(program (x z y w)
			
 
				-; { }
			
 
				-  (mov (int 30) (var x))
			
 
				-; { x }
			
 
				-  (mov (var x) (var z))
			
 
				-; { z }
			
 
				-  (add (int 4) (var z))
			
 
				-; { z }
			
 
				-  (mov (int 2) (var y))
			
 
				-; { y, z }
			
 
				-  (mov (var z) (var w))
			
 
				-; { w, y }
			
 
				-  (add (int 10) (var w))
			
 
				-; { w, y }
			
 
				-  (mov (var w) (reg rax))
			
 
				-; { y, rax }
			
 
				-  (sub (var y) (reg rax)))
			
 
				+A variable is \emph{live} if the variable is used at some later point
			
 
				+in the program and there is not an intervening assignment to the
			
 
				+variable.
			
 
				+%
			
 
				+To understand the latter condition, consider the following code
			
 
				+fragment in which there are two writes to $y$. Are $x$ and
			
 
				+$y$ both live at the same time? 
			
 
				+\begin{lstlisting}[numbers=left,numberstyle=\tiny]
			
 
				+(mov (int 5) (var x))    ; @$x \gets 5$@
			
 
				+(mov (int 30) (var y))   ; @$y \gets 30$@
			
 
				+(mov (var x) (var z))    ; @$z \gets x$@
			
 
				+(mov (int 10) (var y))   ; @$y \gets 10$@
			
 
				+(add (var y) (var z))    ; @$z \gets z + y$@
			
 
				 \end{lstlisting}
			
 
				+The answer is no because the value $30$ written to $y$ on line 2 is
			
 
				+never used. The variable $y$ is read on line 5 and there is an
			
 
				+intervening write to $y$ on line 4, so the read on line 5 receives the
			
 
				+value written on line 4, not line 2.
			
 
				+
			
 
				+The live variables can be computed by traversing the instruction
			
 
				+sequence back to front (i.e., backwards in execution order).  Let
			
 
				+$I_1,\ldots, I_n$ be the instruction sequence. We write
			
 
				+$L_{\mathsf{after}}(k)$ for the set of live variables after
			
 
				+instruction $I_k$ and $L_{\mathsf{before}}(k)$ for the set of live
			
 
				+variables before instruction $I_k$. The live variables after an
			
 
				+instruction are always the same as the live variables before the next
			
 
				+instruction.
			
 
				+\begin{equation*}
			
 
				+  L_{\mathsf{after}}(k) = L_{\mathsf{before}}(k+1)
			
 
				+\end{equation*}
			
 
				+To start things off, there are no live variables after the last
			
 
				+instruction, so 
			
 
				+\begin{equation*}
			
 
				+  L_{\mathsf{after}}(n) = \emptyset 
			
 
				+\end{equation*}
			
 
				+We then apply the following rule repeatedly, traversing the
			
 
				+instruction sequence back to front.
			
 
				+\begin{equation*}
			
 
				+  L_{\mathsf{before}}(k) = (L_{\mathsf{after}}(k) - W(k)) \cup R(k),
			
 
				+\end{equation*}
			
 
				+where $W(k)$ are the variables written to by instruction $I_k$ and
			
 
				+$R(k)$ are the variables read by instruction $I_k$.
			
 
				+Figure~\ref{fig:live-eg} shows the results of live variables analysis
			
 
				+for the running example. Next to each instruction we write its
			
 
				+$L_{\mathsf{after}}$ set.
			
 
				 
			
 
				+\begin{figure}[tbp]
			
 
				+\begin{lstlisting}
			
 
				+(program (x z y w)           ; @$\{ \}$@
			
 
				+  (mov (int 30) (var x))     ; @$\{ x \}$@
			
 
				+  (mov (var x) (var z))      ; @$\{ z \}$@
			
 
				+  (add (int 4) (var z))      ; @$\{ z \}$@
			
 
				+  (mov (int 2) (var y))      ; @$\{ y, z \}$@
			
 
				+  (mov (var z) (var w))      ; @$\{ w, y \}$@
			
 
				+  (add (int 10) (var w))     ; @$\{ w, y \}$@
			
 
				+  (mov (var w) (reg rax))    ; @$\{ y, \itm{rax} \}$@
			
 
				+  (sub (var y) (reg rax)))   ; @$\{ \}$@
			
 
				+\end{lstlisting}
			
 
				+\caption{Running example program annotated with live variables.}
			
 
				+\label{fig:live-eg}
			
 
				+\end{figure}
			
 
				 
			
 
				 
			
 
				 \section{Build Interference Graph}
			
 
				 
			
 
				-%% (hash
			
 
				-%%    'z1498
			
 
				-%%    (set 'rax 'x1497 'y1499)
			
 
				-%%    'x1497
			
 
				-%%    (set 'z1498)
			
 
				-%%    'rax
			
 
				-%%    (set 'z1498 'y1499)
			
 
				-%%    'y1499
			
 
				-%%    (set 'rax 'z1498)))
			
 
				+Based on the liveness analysis, we know the program regions where each
			
 
				+variable is needed.  However, during register allocation, we need to
			
 
				+answer questions of the specific form: are variables $u$ and $v$ ever
			
 
				+live at the same time?  (And therefore cannot be assigned to the same
			
 
				+register.)  To make this question easier to answer, we create an
			
 
				+explicit data structure, an \emph{interference graph}.  An
			
 
				+interference graph is an undirected graph that has an edge between two
			
 
				+variables if they are live at the same time, that is, if they
			
 
				+interfere with each other.
			
 
				+
			
 
				+The most obvious way to compute the interference graph is to look at
			
 
				+the set of live variables between each statement in the program, and
			
 
				+add an edge to the graph for every pair of variables in the same set.
			
 
				+This approach is less than ideal for two reasons. First, it can be
			
 
				+rather expensive because it takes $O(n^2)$ time to look at every pair
			
 
				+in a set of $n$ live variables. Second, there is a special case in
			
 
				+which two variables that are live at the same time do not actually
			
 
				+interfere with each other: when they both contain the same value
			
 
				+because we have assigned one to the other.
			
 
				+
			
 
				+A better way to compute the edges of the interference graph is given
			
 
				+by the following rules.
			
 
				+
			
 
				+\begin{itemize}
			
 
				+\item If instruction $I_k$ is a move: (\key{mov} $s$\, $d$), then add
			
 
				+  the edge $(d,v)$ for every $v \in L_{\mathsf{after}}(k)$ unless $v =
			
 
				+  d$ or $v = s$.
			
 
				+
			
 
				+\item If instruction $I_k$ is not a move but some other arithmetic
			
 
				+  instruction such as (\key{add} $s$\, $d$), then add the edge $(d,v)$
			
 
				+  for every $v \in L_{\mathsf{after}}(k)$ unless $v = d$.
			
 
				+  
			
 
				+\item If instruction $I_k$ is of the form (\key{call}
			
 
				+  $\mathit{label}$), then add an edge $(r,v)$ for every caller-save
			
 
				+  register $r$ and every variable $v \in L_{\mathsf{after}}(k)$.
			
 
				+\end{itemize}
			
 
				+
			
 
				+Working from the top to bottom of Figure~\ref{fig:live-eg}, $y$
			
 
				+interferes with $z$, $w$ interferes with $y$, 
			
 
				+[?? w should not conflict with z! ??]
			
 
				+The resulting interference graph is shown in
			
 
				+Figure~\ref{fig:interfere}.
			
 
				 
			
 
				+\begin{figure}[tbp]
			
 
				+\large
			
 
				 \[
			
 
				-\xymatrix{
			
 
				+\xymatrix@=40pt{
			
 
				   w \ar@{-}[d] \ar@{-}[dr] &  x \ar@{-}[d] \\
			
 
				   y \ar@{-}[r] & z
			
 
				 }
			
 
				 \]
			
 
				+\caption{Interference graph for the example program.}
			
 
				+\label{fig:interfere}
			
 
				+\end{figure}
			
 
				+
			
 
				+
			
 
				 
			
 
				 
			
 
				 \section{Graph Coloring via Sudoku}
			
@@ -867,6 +962,24 @@ patch instructions fixes the move from
 
				 	movq	%rax, -8(%rbp)
			
 
				 \end{lstlisting}
			
 
				 
			
 
				+% three new passes between instruction selection and spill code
			
 
				+% uncover-live
			
 
				+% build-interference
			
 
				+% allocate registers (uses assign-homes)
			
 
				+
			
 
				+\[
			
 
				+\xymatrix{
			
 
				+  C_0 \ar@/^/[r]^-{\textsf{select\_instr.}}
			
 
				+    & \text{x86}^{*} \ar[d]^-{\textsf{uncover\_live}} \\
			
 
				+    & \text{x86}^{*} \ar[d]^-{\textsf{build\_interference}} \\
			
 
				+    & \text{x86}^{*} \ar[d]_-{\textsf{allocate\_register}} \\
			
 
				+    & \text{x86}^{*} \ar@/^/[r]^-{\textsf{patch\_instr.}} 
			
 
				+    & \text{x86} 
			
 
				+}
			
 
				+\]
			
 
				+
			
 
				+
			
 
				+
			
 
				 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
			
 
				 \chapter{Booleans, Conditions, and Type Checking}
			
 
				 \label{ch:bool-types}