NiuTrans / Toy-MT-Introduction · Commits
Commit 5ab166f8, authored May 12, 2020 by xiaotong

Merge branch 'master' of 47.105.50.196:NiuTrans/Toy-MT-Introduction

Parents: 8468cf3c, beb99716
Showing 50 changed files with 39 additions and 57 deletions (+39 -57)
Book/Chapter1/Figures/figure-example-NMT.tex +0 -1
Book/Chapter1/Figures/figure-example-RBMT.tex +0 -1
Book/Chapter1/Figures/figure-example-SMT.tex +0 -1
Book/Chapter1/Figures/figure-required-parts-of-MT.tex +0 -0
Book/Chapter1/chapter1.tex +1 -1
Book/Chapter2/Figures/figure-example-of-word-segmentation-based-on-dictionary.tex +0 -1
Book/Chapter2/Figures/figure-probability-density-function&Distribution-function.tex +0 -1
Book/Chapter2/Figures/figure-self-information-function.tex +0 -0
Book/Chapter4/chapter4.tex +38 -12
Book/Chapter6/Chapter6.tex +0 -0
Book/Chapter6/Figures/figure-a-combination-of-position-encoding-and-word-encoding.tex +0 -1
Book/Chapter6/Figures/figure-a-working-example-of-neural-machine-translation.tex +0 -1
Book/Chapter6/Figures/figure-attention-of-source-and-target-words.tex +0 -1
Book/Chapter6/Figures/figure-automatic-generation-of-ancient-poems-based-on-encoder-decoder-framework.tex +0 -1
Book/Chapter6/Figures/figure-automatically-generate-instances-of-couplets.tex +0 -1
Book/Chapter6/Figures/figure-beam-search-process.tex +0 -1
Book/Chapter6/Figures/figure-calculation-of-context-vector-C.tex +0 -1
Book/Chapter6/Figures/figure-calculation-process-of-context-vector-C.tex +0 -1
Book/Chapter6/Figures/figure-comparison-of-the-number-of-padding-in-batch.tex +0 -1
Book/Chapter6/Figures/figure-data-parallel-process.tex +0 -1
Book/Chapter6/Figures/figure-decode-the-word-probability-distribution-at-the-first-position.tex +0 -1
Book/Chapter6/Figures/figure-decoding-process-based-on-greedy-method.tex +0 -1
Book/Chapter6/Figures/figure-dependencies-between-words-in-a-recurrent-neural-network.tex +0 -1
Book/Chapter6/Figures/figure-dependencies-between-words-of-attention.tex +0 -1
Book/Chapter6/Figures/figure-different-regularization-methods.tex +0 -1
Book/Chapter6/Figures/figure-double-layer-RNN.tex +0 -1
Book/Chapter6/Figures/figure-example-of-automatic-translation-of-classical-chinese.tex +0 -1
Book/Chapter6/Figures/figure-example-of-context-vector-calculation-process.tex +0 -1
Book/Chapter6/Figures/figure-example-of-self-attention-mechanism-calculation.tex +0 -1
Book/Chapter6/Figures/figure-generate-summary.tex +0 -1
Book/Chapter6/Figures/figure-mask-instance-for-future-positions-in-transformer.tex +0 -1
Book/Chapter6/Figures/figure-matrix-representation-of-attention-weights-between-chinese-english-sentence-pairs.tex +0 -1
Book/Chapter6/Figures/figure-model-structure-based-on-recurrent-neural-network-translation.tex +0 -1
Book/Chapter6/Figures/figure-multi-head-attention-model.tex +0 -1
Book/Chapter6/Figures/figure-output-layer-structur.tex +0 -1
Book/Chapter6/Figures/figure-point-product-attention-model.tex +0 -1
Book/Chapter6/Figures/figure-position-of-difference-and-layer-regularization-in-the-model.tex +0 -1
Book/Chapter6/Figures/figure-position-of-feedforward-neural-network-in-the-model.tex +0 -1
Book/Chapter6/Figures/figure-position-of-self-attention-mechanism-in-the-model.tex +0 -1
Book/Chapter6/Figures/figure-presentation-space.tex +0 -0
Book/Chapter6/Figures/figure-query-model-corresponding-to-attention-mechanism.tex +0 -1
Book/Chapter6/Figures/figure-query-model-corresponding-to-traditional-query-model-vs-attention-mechanism.tex +0 -1
Book/Chapter6/Figures/figure-query-model-corresponding-to-traditional-query-model-vs-attention-mechanism02.tex +0 -1
Book/Chapter6/Figures/figure-relationship-between-learning-rate-and-number-of-updates.tex +0 -1
Book/Chapter6/Figures/figure-residual-network-structure.tex +0 -1
Book/Chapter6/Figures/figure-structure-of-a-recurrent-network-model.tex +0 -1
Book/Chapter6/Figures/figure-structure-of-the-network-during-transformer-training.tex +0 -1
Book/Chapter6/Figures/figure-transformer-input-and-position-encoding.tex +0 -1
Book/Chapter6/Figures/figure-word-embedding-structure.tex +0 -1
Book/Chapter7/Figures/figure-underfitting-vs-overfitting.tex +0 -1
Book/Chapter1/Figures/figure-Example-NMT.tex → Book/Chapter1/Figures/figure-example-NMT.tex

\definecolor{ublue}{rgb}{0.152,0.250,0.545}
\definecolor{ugreen}{rgb}{0,0.5,0}
...

Book/Chapter1/Figures/figure-Example-RBMT.tex → Book/Chapter1/Figures/figure-example-RBMT.tex

\definecolor{ublue}{rgb}{0.152,0.250,0.545}
\definecolor{ugreen}{rgb}{0,0.5,0}
...

Book/Chapter1/Figures/figure-Example-SMT.tex → Book/Chapter1/Figures/figure-example-SMT.tex

\definecolor{ublue}{rgb}{0.152,0.250,0.545}
\definecolor{ugreen}{rgb}{0,0.5,0}
...

Book/Chapter1/Figures/figure-Required-parts-of-MT.tex → Book/Chapter1/Figures/figure-required-parts-of-MT.tex

File moved
Book/Chapter1/chapter1.tex

@@ -222,7 +222,7 @@
 \centering
 \input{./Chapter1/Figures/figure-comparison-mt-ht-1}
 \end{figure}
-\begin{figure}[htp]
+\begin{figure}[t]
 \centering
 \input{./Chapter1/Figures/figure-comparison-mt-ht-2}
 \caption{机器翻译与人工翻译实例结果对比}
...
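The hunk above changes a figure's float placement specifier from `[htp]` to `[t]`. For reference, the placement letters are stock LaTeX behavior, not anything specific to this book:

```latex
% h = try to place the float "here", where it appears in the source
% t = allow the top of a text page
% b = allow the bottom of a text page
% p = allow a separate floats-only page
% LaTeX tries the permitted positions in a fixed internal order, so
% [htp] allows several fallbacks while [t] restricts the float to the
% top of a page.
\begin{figure}[t]
\centering
\input{./Chapter1/Figures/figure-comparison-mt-ht-2}
\end{figure}
```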
Book/Chapter2/Figures/figure-Example-of-word-segmentation-based-on-dictionary.tex → Book/Chapter2/Figures/figure-example-of-word-segmentation-based-on-dictionary.tex

\definecolor{ublue}{rgb}{0.152,0.250,0.545}
\definecolor{ugreen}{rgb}{0,0.5,0}
...

Book/Chapter2/Figures/figure-Probability-density-function&Distribution-function.tex → Book/Chapter2/Figures/figure-probability-density-function&Distribution-function.tex

%%% outline
%-------------------------------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter2/Figures/figure-Self-information-function.tex → Book/Chapter2/Figures/figure-self-information-function.tex

File moved
Book/Chapter4/chapter4.tex

@@ -1204,7 +1204,7 @@ h_i (d,\textbf{t},\textbf{s})=\sum_{r \in d}h_i (r)
 \label{eq:4-27}
 \end{eqnarray}
-\parinterval 其中:
+\noindent 其中:
 \begin{itemize}
 \vspace{0.5em}
...
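The hunk above swaps `\parinterval` for `\noindent` in the text following the equation. `\noindent` is standard LaTeX; `\parinterval` is a macro from this book's preamble whose definition is not shown in the diff, so the sketch below only illustrates the visible effect, under the assumption that `\parinterval` starts a fresh indented paragraph:

```latex
% Assumed for illustration only; the real definition lives in the
% book's preamble and may differ:
% \newcommand{\parinterval}{\par ...}
%
% With \noindent, the text after the displayed equation continues
% flush left, reading as part of the same paragraph:
\begin{eqnarray}
h_i (d,\textbf{t},\textbf{s}) = \sum_{r \in d} h_i (r)
\label{eq:4-27}
\end{eqnarray}
\noindent 其中:
```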
@@ -1430,12 +1430,12 @@ span\textrm{[0,4]}&=&\textrm{``猫} \quad \textrm{喜欢} \quad \textrm{吃} \qu
 \parinterval 可以说基于句法的翻译模型贯穿了现代统计机器翻译的发展历程。从概念上讲,不管是层次短语模型,还是语言学句法模型都是基于句法的模型。基于句法的机器翻译模型种类繁多,这里先对相关概念进行简要介绍,以避免后续论述中产生歧义。表\ref{tab:4-2}给出了基于句法的机器翻译中涉及的一些概念。
 %----------------------------------------------
-\begin{table}[htp]{
+\begin{table}[hbp]{
 \begin{center}
 \caption{基于句法的机器翻译中常用概念}
 \label{tab:4-2}
-{\begin{tabular}{l | l}
+{\begin{tabular}{p{6.5em} | l}
 术语 & 说明 \\
 \hline
 \rule{0pt}{15pt} 翻译规则 & 翻译的最小单元(或步骤) \\
...
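The column-spec change in the hunk above (`{l | l}` to `{p{6.5em} | l}`) turns the first column from a natural-width left-aligned column into a fixed-width paragraph column, so long terms wrap within 6.5em instead of widening the table. A minimal standalone sketch using a row from the table above:

```latex
% p{6.5em}: paragraph column of fixed width; cell text wraps.
% l: left-aligned column of natural width.
\begin{tabular}{p{6.5em} | l}
术语 & 说明 \\
\hline
翻译规则 & 翻译的最小单元(或步骤) \\
\end{tabular}
```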
@@ -1454,6 +1454,18 @@ span\textrm{[0,4]}&=&\textrm{``猫} \quad \textrm{喜欢} \quad \textrm{吃} \qu
 \rule{0pt}{15pt} 基于树 & (源语言)使用树结构(大多指句法树) \\
 \rule{0pt}{15pt} 基于串 & (源语言)使用词串,比如串到树翻译系统的解码器一般 \\
 & 都是基于串的解码方法 \\
 \end{tabular}
 }
 \end{center}
 }
 \end{table}
+\vspace{3em}
+\begin{table}[htp]{
+\begin{center}
+\vspace{1em}
+{\begin{tabular}{p{6.5em} | l}
+术语 & 说明 \\
+\hline
+\rule{0pt}{15pt} 基于森林 & (源语言)使用句法森林,这里森林只是对多个句法树的一 \\
+ & 种压缩表示 \\
+\rule{0pt}{15pt} 词汇化规则 & 含有终结符的规则 \\
...
@@ -1626,7 +1638,7 @@ r_9: \quad \textrm{IP(}\textrm{NN}_1\ \textrm{VP}_2) \rightarrow \textrm{S(}\tex
 \end{eqnarray}
 }
-\parinterval 可以得到一个翻译推导:
+\noindent 可以得到一个翻译推导:
 {
 \footnotesize
 \begin{eqnarray}
 && \langle\ \textrm{IP}^{[1]},\ \textrm{S}^{[1]}\ \rangle \nonumber \\
...
@@ -1638,14 +1650,16 @@ r_9: \quad \textrm{IP(}\textrm{NN}_1\ \textrm{VP}_2) \rightarrow \textrm{S(}\tex
 && \ \ \textrm{S(NP(DT(the) NNS(imports))}\ \textrm{VP(VBP}^{[6]}\ \textrm{ADVP(RB(drastically)}\ \textrm{VBN}^{[5]})))\ \rangle \nonumber \\
 & \xrightarrow[r_4]{\textrm{VV}^{[5]} \Leftrightarrow \textrm{VBN}^{[5]}} & \langle\ \textrm{IP(NN(进口)}\ \textrm{VP(AD(大幅度)}\ \textrm{VP(VV(减少)}\ \textrm{AS}^{[6]}))), \hspace{10em} \nonumber \\
 && \ \ \textrm{S(NP(DT(the) NNS(imports))}\ \textrm{VP(VBP}^{[6]}\ \nonumber \\
-&& \ \ \textrm{ADVP(RB(drastically)}\ \textrm{VBN(fallen)})))\ \rangle \nonumber \\
+&& \ \ \textrm{ADVP(RB(drastically)}\ \textrm{VBN(fallen)})))\ \rangle \nonumber
+\end{eqnarray}
+\begin{eqnarray}
 & \xrightarrow[r_6]{\textrm{AS}^{[6]} \Leftrightarrow \textrm{VBP}^{[6]}} & \langle\ \textrm{IP(NN(进口)}\ \textrm{VP(AD(大幅度)}\ \textrm{VP(VV(减少)}\ \textrm{AS(了)}))), \nonumber \\
 && \ \ \textrm{S(NP(DT(the) NNS(imports))}\ \textrm{VP(VBP(have)}\ \nonumber \\
 && \ \ \textrm{ADVP(RB(drastically)}\ \textrm{VBN(fallen)})))\ \rangle \hspace{15em} \nonumber
 \end{eqnarray}
 }
-\parinterval 其中,箭头$\rightarrow$表示推导之意。显然,可以把翻译看作是基于树结构的推导过程(记为$d$)。因此,与层次短语模型一样,基于语言学句法的机器翻译也是要找到最佳的推导$\hat{d}=\arg\max\textrm{P}(d)$。
+\noindent 其中,箭头$\rightarrow$表示推导之意。显然,可以把翻译看作是基于树结构的推导过程(记为$d$)。因此,与层次短语模型一样,基于语言学句法的机器翻译也是要找到最佳的推导$\hat{d}=\arg\max\textrm{P}(d)$。
 %----------------------------------------------------------------------------------------
 % NEW SUBSUB-SECTION
...
@@ -1664,7 +1678,7 @@ r_9: \quad \textrm{IP(}\textrm{NN}_1\ \textrm{VP}_2) \rightarrow \textrm{S(}\tex
 \end{figure}
 %-------------------------------------------
-\parinterval 其中,源语言树片段中的叶子结点NN表示变量,它与右手端的变量NN对应。这里仍然可以使用基于树结构的规则对上面这个树到串的映射进行表示。参照规则形式$\langle\ \alpha_h,\beta_h\ \rangle \to \langle\ \alpha_r,\beta_r,\sim\ \rangle$,有:
+\noindent 其中,源语言树片段中的叶子结点NN表示变量,它与右手端的变量NN对应。这里仍然可以使用基于树结构的规则对上面这个树到串的映射进行表示。参照规则形式$\langle\ \alpha_h,\beta_h\ \rangle \to \langle\ \alpha_r,\beta_r,\sim\ \rangle$,有:
 \begin{eqnarray}
 \alpha_h & = & \textrm{VP} \nonumber \\
 \beta_h & = & \textrm{VP}\ (=\alpha_h) \nonumber \\
...
@@ -1800,7 +1814,7 @@ r_9: \quad \textrm{IP(}\textrm{NN}_1\ \textrm{VP}_2) \rightarrow \textrm{S(}\tex
 \textrm{VP(PP(P(对)}\ \textrm{NP(NN(回答)))}\ \textrm{VP}_1) \rightarrow \textrm{VP}_1\ \textrm{with}\ \textrm{the}\ \textrm{answer} \nonumber
 \end{eqnarray}
-\parinterval 其中,蓝色部分表示可以抽取到的规则,显然它的根节点和叶子非终结符节点都是可信节点。由于源语言树片段中包含一个变量(VP),因此需要对VP节点的Span所表示的目标语言范围进行泛化(红色方框部分)。
+\noindent 其中,蓝色部分表示可以抽取到的规则,显然它的根节点和叶子非终结符节点都是可信节点。由于源语言树片段中包含一个变量(VP),因此需要对VP节点的Span所表示的目标语言范围进行泛化(红色方框部分)。
 %----------------------------------------------
 \begin{figure}[htp]
...
@@ -1985,7 +1999,7 @@ r_9: \quad \textrm{IP(}\textrm{NN}_1\ \textrm{VP}_2) \rightarrow \textrm{S(}\tex
 \textrm{VP(}\textrm{PP}_1\ \textrm{VP(VV(表示)}\ \textrm{NN}_2\textrm{))} \rightarrow \textrm{VP(VBZ(was)}\ \textrm{VP(}\textrm{VBN}_2\ \textrm{PP}_1\textrm{))} \nonumber
 \end{eqnarray}
-\parinterval 其中,规则的左部是源语言句法树结构,右部是目标语言句法树结构,变量的下标表示对应关系。为了获取这样的规则,需要进行树到树规则抽取。最直接的办法是把GHKM方法推广到树到树翻译的情况。比如,可以利用双语结构的约束和词对齐,定义树的切割点,之后找到两种语言树结构的映射关系\cite{liu2009improving}。
+\noindent 其中,规则的左部是源语言句法树结构,右部是目标语言句法树结构,变量的下标表示对应关系。为了获取这样的规则,需要进行树到树规则抽取。最直接的办法是把GHKM方法推广到树到树翻译的情况。比如,可以利用双语结构的约束和词对齐,定义树的切割点,之后找到两种语言树结构的映射关系\cite{liu2009improving}。
 %----------------------------------------------------------------------------------------
 % NEW SUBSUB-SECTION
...
@@ -2007,7 +2021,7 @@ r_9: \quad \textrm{IP(}\textrm{NN}_1\ \textrm{VP}_2) \rightarrow \textrm{S(}\tex
 \parinterval 换一个角度来看,词对齐实际上只是帮助模型找到两种语言句法树中节点的对应关系。如果能够直接得到句法树节点的对应,就可以避免掉词对齐的错误。也就是,可以直接使用节点对齐来进行树到树规则的抽取。首先,利用外部的节点对齐工具获得两棵句法树节点之间的对齐关系。之后,将每个对齐的节点看作是树片段的根节点,再进行规则抽取。图\ref{fig:4-62}展示了基于节点对齐的规则抽取结果。
 %----------------------------------------------
-\begin{figure}[htp]
+\begin{figure}[htb]
 \centering
 \input{./Chapter4/Figures/tree-to-tree-rule-extraction-base-node-alignment}
 \caption{基于节点对齐的树到树规则抽取}
...
@@ -2205,12 +2219,24 @@ d_1 = {d'} \circ {r_5}
 \caption{基于串的解码 vs 基于树的解码}
 \label{tab:4-4}
-{\begin{tabular}{l | l l}
+{\begin{tabular}{l | p{16.5em} l}
 对比 & 基于树的解码 & 基于串的解码 \\
 \hline
 \rule{0pt}{15pt} 解码方法 & $\hat{d} = \arg\max_{d \in D_{\textrm{tree}}} \textrm{score}(d)$ & $\hat{d} = \arg\max_{d \in D} \textrm{score}(d)$ \\
 \rule{0pt}{15pt} 搜索空间 & 与输入的源语句法树兼容的推导$D_{\textrm{tree}}$ & 所有的推导$D$ \\
-\rule{0pt}{15pt} 适用模型 & 树到串、树到树 & 所有的句法模型 \\
+\rule{0pt}{15pt} 适用模型 & 树到串、树到树 & 所有的句法模型
 \end{tabular}
 }
 \end{center}
 }
 \end{table}
+\begin{table}[htp]{
+\begin{center}
+\vspace{1em}
+{\begin{tabular}{l | p{16.5em} l}
+对比 & 基于树的解码 & 基于串的解码 \\
+\hline
+\rule{0pt}{15pt} 解码算法 & Chart解码 & CKY + 规则二叉化 \\
+\rule{0pt}{15pt} 速度 & 快 & 一般较慢
+\end{tabular}
...
Book/Chapter6/Chapter6.tex

(diff collapsed)
Book/Chapter6/Figures/figure-A-combination-of-position-encoding-and-word-encoding.tex → Book/Chapter6/Figures/figure-a-combination-of-position-encoding-and-word-encoding.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{rnode} = [draw,minimum width=3.5em,minimum height=1.2em]
...

Book/Chapter6/Figures/figure-A-working-example-of-neural-machine-translation.tex → Book/Chapter6/Figures/figure-a-working-example-of-neural-machine-translation.tex

\begin{tikzpicture}
\setlength{\base}{1cm}
...

Book/Chapter6/Figures/figure-Attention-of-source-and-target-words.tex → Book/Chapter6/Figures/figure-attention-of-source-and-target-words.tex

%
%---------------------------------------
...

Book/Chapter6/Figures/figure-Automatic-generation-of-ancient-poems-based-on-encoder-decoder-framework.tex → Book/Chapter6/Figures/figure-automatic-generation-of-ancient-poems-based-on-encoder-decoder-framework.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{lnode} = [minimum height=2em,minimum width=8em,inner sep=3pt,rounded corners=2pt,draw,fill=red!20];
...

Book/Chapter6/Figures/figure-Automatically-generate-instances-of-couplets.tex → Book/Chapter6/Figures/figure-automatically-generate-instances-of-couplets.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{lnode} = [minimum height=2.5em,minimum width=12em,inner sep=3pt,rounded corners=2pt,draw=red!75!black,fill=red!5];
...

Book/Chapter6/Figures/figure-Beam-search-process.tex → Book/Chapter6/Figures/figure-beam-search-process.tex

%-----------------------------------------
...

Book/Chapter6/Figures/figure-Calculation-of-context-vector-C.tex → Book/Chapter6/Figures/figure-calculation-of-context-vector-C.tex

\begin{tikzpicture}
\begin{scope}
...

Book/Chapter6/Figures/figure-Calculation-process-of-context-vector-C.tex → Book/Chapter6/Figures/figure-calculation-process-of-context-vector-C.tex

@@ -4,7 +4,6 @@
 \begin{tikzpicture}
 \begin{scope}
...

Book/Chapter6/Figures/figure-Comparison-of-the-number-of-padding-in-batch.tex → Book/Chapter6/Figures/figure-comparison-of-the-number-of-padding-in-batch.tex

\begin{tikzpicture}
\begin{scope}[scale=1.5]
...

Book/Chapter6/Figures/figure-Data-parallel-process.tex → Book/Chapter6/Figures/figure-data-parallel-process.tex

%----------------------------------
...

Book/Chapter6/Figures/figure-Decode-the-word-probability-distribution-at-the-first-position.tex → Book/Chapter6/Figures/figure-decode-the-word-probability-distribution-at-the-first-position.tex

@@ -3,7 +3,6 @@
 \begin{tikzpicture}
 \begin{scope}
 \tikzstyle{rnnnode} = [minimum height=1.1em,minimum width=3.5em,inner sep=2pt,rounded corners=1pt,draw,fill=red!20];
...

Book/Chapter6/Figures/figure-Decoding-process-based-on-greedy-method.tex → Book/Chapter6/Figures/figure-decoding-process-based-on-greedy-method.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{rnnnode} = [minimum height=1.1em,minimum width=2.1em,inner sep=2pt,rounded corners=1pt,draw,fill=red!20];
...

Book/Chapter6/Figures/figure-Dependencies-between-words-in-a-recurrent-neural-network.tex → Book/Chapter6/Figures/figure-dependencies-between-words-in-a-recurrent-neural-network.tex

\begin{tikzpicture}
\begin{scope}
\node [anchor=west] (w0) at (0,0) {$w_1$};
...

Book/Chapter6/Figures/figure-Dependencies-between-words-of-Attention.tex → Book/Chapter6/Figures/figure-dependencies-between-words-of-attention.tex

\begin{tikzpicture}
\begin{scope}
\node [anchor=west] (w0) at (0,-2) {$w_1$};
...

Book/Chapter6/Figures/figure-Different-regularization-methods.tex → Book/Chapter6/Figures/figure-different-regularization-methods.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{lnode} = [minimum height=1.5em,minimum width=3em,inner sep=3pt,rounded corners=1.5pt,draw,fill=orange!20];
...

Book/Chapter6/Figures/figure-Double-layer-RNN.tex → Book/Chapter6/Figures/figure-double-layer-RNN.tex

%--------------------------------------------------------------------------------
\begin{tikzpicture}
\setlength{\base}{0.9cm}
...

Book/Chapter6/Figures/figure-Example-of-automatic-translation-of-classical-Chinese.tex → Book/Chapter6/Figures/figure-example-of-automatic-translation-of-classical-chinese.tex

%---------------------------------------
\begin{frame}{}
...

Book/Chapter6/Figures/figure-Example-of-context-vector-calculation-process.tex → Book/Chapter6/Figures/figure-example-of-context-vector-calculation-process.tex

%-------------------------------------------
...

Book/Chapter6/Figures/figure-Example-of-self-attention-mechanism-calculation.tex → Book/Chapter6/Figures/figure-example-of-self-attention-mechanism-calculation.tex

\begin{tikzpicture}
\begin{scope}
...

Book/Chapter6/Figures/figure-Generate-summary.tex → Book/Chapter6/Figures/figure-generate-summary.tex

%%% outline
%-------------------------------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter6/Figures/figure-Mask-instance-for-future-positions-in-Transformer.tex → Book/Chapter6/Figures/figure-mask-instance-for-future-positions-in-transformer.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{attnode} = [minimum size=1.5em,inner sep=0pt,rounded corners=1pt,draw]
...

Book/Chapter6/Figures/figure-Matrix-Representation-of-Attention-Weights-Between-Chinese-English-Sentence-Pairs.tex → Book/Chapter6/Figures/figure-matrix-representation-of-attention-weights-between-chinese-english-sentence-pairs.tex

@@ -3,7 +3,6 @@
 %-------------------------------------------
 \begin{tikzpicture}
...

Book/Chapter6/Figures/figure-Model-structure-based-on-recurrent-neural-network-translation.tex → Book/Chapter6/Figures/figure-model-structure-based-on-recurrent-neural-network-translation.tex

%--------------------------------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter6/Figures/figure-Multi-Head-Attention-Model.tex → Book/Chapter6/Figures/figure-multi-head-attention-model.tex

\begin{tikzpicture}
\begin{scope}
...

Book/Chapter6/Figures/figure-Output-layer-structur.tex → Book/Chapter6/Figures/figure-output-layer-structur.tex

% not compatible with [scale=?]
...

Book/Chapter6/Figures/figure-Point-product-attention-model.tex → Book/Chapter6/Figures/figure-point-product-attention-model.tex

@@ -3,7 +3,6 @@
 \begin{tikzpicture}
 \begin{scope}
...

Book/Chapter6/Figures/figure-Position-of-difference-and-layer-regularization-in-the-model.tex → Book/Chapter6/Figures/figure-position-of-difference-and-layer-regularization-in-the-model.tex

@@ -2,7 +2,6 @@
 \begin{tikzpicture}
 \begin{scope}
 \tikzstyle{Sanode} = [minimum height=1.4em,minimum width=7em,inner sep=3pt,rounded corners=1.5pt,draw,fill=orange!20];
...

Book/Chapter6/Figures/figure-Position-of-feedforward-neural-network-in-the-model.tex → Book/Chapter6/Figures/figure-position-of-feedforward-neural-network-in-the-model.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{Sanode} = [minimum height=1.4em,minimum width=7em,inner sep=3pt,rounded corners=1.5pt,draw,fill=orange!20];
...

Book/Chapter6/Figures/figure-Position-of-self-attention-mechanism-in-the-model.tex → Book/Chapter6/Figures/figure-position-of-self-attention-mechanism-in-the-model.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{Sanode} = [minimum height=1.4em,minimum width=7em,inner sep=3pt,rounded corners=1.5pt,draw,fill=orange!20];
...

Book/Chapter6/Figures/figure-Presentation-space.tex → Book/Chapter6/Figures/figure-presentation-space.tex

File moved

Book/Chapter6/Figures/figure-Query-model-corresponding-to-attention-mechanism.tex → Book/Chapter6/Figures/figure-query-model-corresponding-to-attention-mechanism.tex

@@ -7,7 +7,6 @@
 \begin{tikzpicture}
 \begin{scope}
...

Book/Chapter6/Figures/figure-Query-model-corresponding-to-traditional-query-model-vs-attention-mechanism.tex → Book/Chapter6/Figures/figure-query-model-corresponding-to-traditional-query-model-vs-attention-mechanism.tex

%-----------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter6/Figures/figure-Query-model-corresponding-to-traditional-query-model-vs-attention-mechanism02.tex → Book/Chapter6/Figures/figure-query-model-corresponding-to-traditional-query-model-vs-attention-mechanism02.tex

%-----------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter6/Figures/figure-Relationship-between-learning-rate-and-number-of-updates.tex → Book/Chapter6/Figures/figure-relationship-between-learning-rate-and-number-of-updates.tex

\begin{tikzpicture}
\footnotesize{
\begin{axis}[
...

Book/Chapter6/Figures/figure-Residual-network-structure.tex → Book/Chapter6/Figures/figure-residual-network-structure.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{lnode} = [minimum height=1.5em,minimum width=3em,inner sep=3pt,rounded corners=1.5pt,draw,fill=orange!20];
...

Book/Chapter6/Figures/figure-Structure-of-a-recurrent-network-model.tex → Book/Chapter6/Figures/figure-structure-of-a-recurrent-network-model.tex

%------------------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter6/Figures/figure-Structure-of-the-network-during-Transformer-training.tex → Book/Chapter6/Figures/figure-structure-of-the-network-during-transformer-training.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{rnnnode} = [minimum height=1.1em,minimum width=2.1em,inner sep=2pt,rounded corners=1pt,draw,fill=red!20];
...

Book/Chapter6/Figures/figure-Transformer-input-and-position-encoding.tex → Book/Chapter6/Figures/figure-transformer-input-and-position-encoding.tex

\begin{tikzpicture}
\begin{scope}
\tikzstyle{Sanode} = [minimum height=1.4em,minimum width=7em,inner sep=3pt,rounded corners=1.5pt,draw];
...

Book/Chapter6/Figures/figure-Word-embedding-structure.tex → Book/Chapter6/Figures/figure-word-embedding-structure.tex

%------------------------------------------------------
\begin{tikzpicture}
...

Book/Chapter7/Figures/figure-Underfitting-vs-Overfitting.tex → Book/Chapter7/Figures/figure-underfitting-vs-overfitting.tex

\begin{tabular}{l l l}
\begin{tikzpicture}
\draw [->, thick] (0,0) to (3,0);
...