The \textit{locking} process is performed using a boolean shared flag $X$ ($X =1\implies$ locked)
which must be coherently accessible from all cores.
The \texttt{TS} operation issues a \texttt{BusRdX} transaction on the bus, which reads
the value of $X$ with the intent to modify it, invalidating every other core's cached copy.
\\
Suppose that $P_0, P_1, \dots, P_n$ attempt to acquire the lock in order to execute a critical section, and that $P_0$ gets there before all the others.
While $P_0$ is executing its own critical section, $P_1, \dots, P_n$ continuously attempt \texttt{TS} in order to check the state of $X$ and see whether the lock is free.
This checking scheme generates high coherence traffic, because every time a processor $P_i$ (for $1\le i \le n$) executes \texttt{TS}, all other caches get invalidated, causing a miss on $X$ for the next processor attempting to read it.
With $n$ waiting processors, each round of checks therefore causes $\mathcal{O}(n)$ invalidations, resulting in coherence traffic in the order of $\mathcal{O}(n^2)$.
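A minimal sketch of this spinning scheme, assuming C11 atomics with \texttt{atomic\_exchange} standing in for the hardware \texttt{TS} primitive (the function names are illustrative, not part of the exercise):
\begin{verbatim}
#include <stdatomic.h>

atomic_int X = 0;                /* shared lock flag: 1 => locked */

void ts_lock(void)
{
    /* Every atomic_exchange is one TS: it issues a BusRdX and
       invalidates all other cached copies of X, even while the
       lock is still held by another core. */
    while (atomic_exchange(&X, 1) == 1)
        ;                        /* spin: retry TS until it reads 0 */
}

void ts_unlock(void)
{
    atomic_store(&X, 0);         /* release: the next TS reads 0 */
}
\end{verbatim}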
Taking the previous example, the main purpose of introducing \texttt{TTS} is to make $P_1, P_2, \dots, P_n$ perform \texttt{BusRd} on $X$
instead of \texttt{BusRdX} while $P_0$ holds the lock.
This small difference allows each $P_i$ to check $X$ locally without invalidating the other caches,
because the read value does not need to be overwritten until the lock is released.
\\
A local cache read works because once $P_0$ stores $1$ in $X$, the next store
should be attempted only after the execution of the critical section. In the meantime,
$P_1, \dots, P_n$ repeatedly read $X$: the first read misses, and all subsequent ones hit.
When $P_0$ releases the lock, $X$ is set to $0$; once this value is read by another processor $P_i$,
$P_i$ performs \texttt{TS} and eventually acquires ownership of the lock.
\\
This way, the coherence traffic is reduced to $\mathcal{O}(n)$ operations.
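Under the same assumptions as the \texttt{TS} sketch in the previous point, a minimal \texttt{TTS} version could look as follows; only the inner read loop differs:
\begin{verbatim}
#include <stdatomic.h>

atomic_int X = 0;                /* shared lock flag: 1 => locked */

void tts_lock(void)
{
    for (;;) {
        /* Inner test: plain loads (BusRd) that spin in the local
           cache; after the first miss the line stays valid until
           the holder releases the lock. */
        while (atomic_load(&X) == 1)
            ;
        /* Lock appears free: attempt the real TS (BusRdX). */
        if (atomic_exchange(&X, 1) == 0)
            return;              /* TS read 0: lock acquired */
    }
}
\end{verbatim}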
\end{homeworkSection}
\begin{homeworkSection}{(3)}
Exponential back-off builds on the same model as \texttt{TS}, but with the addition of an exponentially increasing waiting time after each failed check.
At first glance this looks like good practice, because the invalidations are not all performed at the same time, which reduces traffic.
\\
However, the method leads to a severe fairness problem, and consequently to high latency under contention: processors that started checking later can obtain the lock earlier than ones that have been waiting longer.
\\
Assume the same situation as in the previous points, and suppose a processor $P_i$ performs its first check after $\Delta t$ and fails;
its next check is then scheduled after $2\cdot\Delta t$. If in the meantime $P_0$ releases the lock and another
processor $P_j$ performs a check, then $P_j$ overtakes $P_i$ and takes ownership of the lock before it.
If $m$ other processors act like $P_j$, the time $P_i$ must wait before its $m^{\text{th}}$ check grows to $2^m\cdot\Delta t$,
which can be long enough for all the other processors to take precedence over $P_i$, even though it was the first to request the lock.
In the worst case, under contention, this forces $P_i$ to wait until all other cores have finished their critical sections, an unneeded serialization that causes huge latency.
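A sketch of the back-off variant under the same C11 assumptions; the initial delay and the cap are arbitrary illustrative values:
\begin{verbatim}
#include <stdatomic.h>

#define DELAY_MAX (1u << 16)     /* arbitrary cap on the back-off */

atomic_int X = 0;                /* shared lock flag: 1 => locked */

void backoff_lock(void)
{
    unsigned delay = 1;          /* plays the role of delta t */
    while (atomic_exchange(&X, 1) == 1) {
        for (volatile unsigned i = 0; i < delay; i++)
            ;                    /* idle wait between two checks */
        if (delay < DELAY_MAX)
            delay *= 2;          /* delta t, 2 delta t, 4 delta t, ... */
    }
}
\end{verbatim}
Capping the delay bounds the unfairness described above, but does not eliminate it.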
\end{homeworkSection}
\begin{homeworkSection}{(4)}
Supposing $X$ is the lock flag and that its block is initially missing from both processors' caches, then, in order:
\begin{enumerate}
\item$P_0$ broadcasts \texttt{BusRdX}, reads $0$, stores $1$ in its cache and then enters the critical section.
\item$P_1$ broadcasts \texttt{BusRdX}, but the block holding $X$ must be supplied from $P_0$'s cache.
\item$P_0$ broadcasts \texttt{DataWB} as requested by $P_1$, which then reads $1$.
\item$P_1$ writes $1$, broadcasting \texttt{BusInv} and thus invalidating $P_0$'s copy. \label{repeat}
\item$P_1$ checks $X$ by broadcasting \texttt{BusRdX} and repeats from (\ref{repeat}) while $X =1$. \label{check}
\item$P_0$ writes $0$ to $X$; $P_1$'s next \texttt{BusRdX} then finds $X =0$ and it exits the loop.
\item$P_1$ writes $1$ to $X$, invalidating $P_0$'s cached copy.
\item$P_1$ executes the critical section.
\end{enumerate}
Steps \ref{repeat} and \ref{check} correspond to the waiting loop of $P_1$.
Its attempt to enter the critical section fails because $X \neq0$ throughout the waiting loop, so
each performed store-conditional operation simply writes $1$ back to $X$.
When $P_0$ rewrites $0$ on $X$, the copy in $P_1$'s cache gets invalidated, meaning that the next test would
miss on $X$ and consequently $P_1$ would read $0$ with the intent to write $1$. At that moment the operation succeeds.
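C11 exposes no load-linked/store-conditional pair directly, so the waiting loop of $P_1$ can only be approximated here with a compare-and-swap playing the role of the test plus conditional store (an analogy, not the primitive assumed by the exercise):
\begin{verbatim}
#include <stdatomic.h>

atomic_int X = 0;                /* shared lock flag: 1 => locked */

void llsc_style_lock(void)
{
    int expected;
    do {
        expected = 0;            /* only try to install 1 over 0 */
        /* Fails, like the waiting loop above, as long as X == 1;
           on LL/SC hardware this would be a load-linked of X
           followed by a store-conditional of 1. */
    } while (!atomic_compare_exchange_weak(&X, &expected, 1));
    /* Success: X was 0 and is now 1, the critical section begins. */
}
\end{verbatim}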