Merge branch 'master' into liyanyang

bdcfc769 · Lee · b041e362 · abfdaf38 · bdcfc769 · bdcfc769
Commit bdcfc769 authored Dec 16, 2019 by Lee
--- a/Section04-Phrasal-and-Syntactic-Models/section04-test.tex
+++ b/Section04-Phrasal-and-Syntactic-Models/section04-test.tex
--- a/Section04-Phrasal-and-Syntactic-Models/section04.tex
+++ b/Section04-Phrasal-and-Syntactic-Models/section04.tex
@@ -1067,10 +1067,11 @@ $d$是一个$(\textbf{s},\textbf{t})$上基于短语的翻译推导，$\textrm{P
 %%%------------------------------------------------------------------------------------------------------------
 %%% 翻译推导的建模
 \begin{frame}{对翻译推导进行建模}
+\vspace{-0.4em}
 \begin{itemize}
 \item $\textrm{P}(\textbf{t}|\textbf{s}) = \sum_{d} \textrm{P}(d,\textbf{t}|\textbf{s})$带来新的问题：如何描述$\textrm{P}(d,\textbf{t}|\textbf{s})$ \\
-\vspace{0.5em}
+\vspace{0.0em}
 \begin{center}
 \begin{tikzpicture}
@@ -1105,6 +1106,7 @@ $d$是一个$(\textbf{s},\textbf{t})$上基于短语的翻译推导，$\textrm{P
 \item<2-> 希望有这样一种模型可以对任意的因素进行方便的建模。经典的判别式模型成为了不二的选择
 \end{itemize}
+\vspace{-0.2em}
 \visible<2->{
 \textbf{Discriminative Training and Maximum Entropy Models for Statistical Machine Translation}\\
 \textbf{Franz Och and Hermann Ney, 2002, In Proc of ACL}
@@ -1364,7 +1366,19 @@ $d$是一个$(\textbf{s},\textbf{t})$上基于短语的翻译推导，$\textrm{P
 %%%------------------------------------------------------------------------------------------------------------
 %%%  短语系统的问题
 \begin{frame}{基于短语的方法的不足}
-% David Chiang ACL2005的论文
+\begin{itemize}
+\item 短语可以很好的捕捉词语之间的局部搭配和调序，但是长距离依赖需要更长的短语
+    \begin{itemize}
+    \item 实践中发现使用超过长度3的短语作用不大
+    \item 短语非常稀疏，包含多个词的短语大多非常低频
+    \end{itemize}
+    \begin{tabular}{l | r}
+    短语(中文) & 训练数据中频次 \hline \\
+    包含 & 3341 \\
+    包含 多个 & 213 \\
+    \end{tabular}
+\end{itemize}
 \end{frame}
 %%%------------------------------------------------------------------------------------------------------------

--- a/Section06-Neural-Machine-Translation/section06.tex
+++ b/Section06-Neural-Machine-Translation/section06.tex