Commit 3ff225fd by 姜雨帆

Merge branch 'master' into jiangyufan

parents 82369ec5 c947c3e9
...@@ -108,20 +108,20 @@ ...@@ -108,20 +108,20 @@
\centering \centering
%\includegraphics[scale=0.7]{./Chapter6/Figures/mTER of different systems.png} %\includegraphics[scale=0.7]{./Chapter6/Figures/mTER of different systems.png}
\input{./Chapter6/Figures/figure-score-of-mTER} \input{./Chapter6/Figures/figure-score-of-mTER}
\caption{不同系统在不同长度句子的mTER分值(神经机器翻译系统:NMT;统计机器翻译系统:SPB、HPB、PBSY)} \caption{不同系统在不同长度句子上的mTER分值}
\label{fig:6-3} \label{fig:6-3}
\end{figure} \end{figure}
%---------------------------------------------- %----------------------------------------------
\parinterval 除了上面例子中展示的流畅度和准确度外,NMT的译文质量已全面优于统计机器翻译\cite{Bentivogli2016NeuralVP}。在IWSLT 2015英语-德语任务中,与三个最先进的统计机器翻译系统(PBSY、HPB、SPB)相比,NMT译文的mTER得分在不同长度句子上都得到了明显的下降,如图\ref{fig:6-3}(mTER越低越好)。其次,NMT翻译的单词的形态错误率(表\ref{tab:HTER} ``\%Δ'')和单词词义错误率(表\ref{tab:HTER}``word'')都远低于统计机器翻译系统。并且,NMT译文与参考译文之间的KRS得分(88.3)大于表\ref{tab:KRS}中任何一个PBMT系统(KRS得分表明了系统翻译的句子与标准句子之间的字序相关性,其分值越高越好) \parinterval 除了上面例子中展示的流畅度和准确度外,神经机器翻译在其它评价指标上的表现也全面超越统计机器翻译\cite{Bentivogli2016NeuralVP}。比如,在IWSLT 2015英语-德语任务中,与三个最先进的统计机器翻译系统(PBSY、HPB、SPB)相比,神经机器翻译系统的mTER得分在不同长度句子上都得到了明显的下降,如图\ref{fig:6-3}\footnote{mTER是一种错误率度量,值越低表明译文越好。}。其次,神经机器翻译的单词形态错误率和单词词义错误率都远低于统计机器翻译系统(表\ref{tab:HTER} )。并且,神经机器翻译系统的KRS得分也优于统计机器翻译系统(表\ref{tab:KRS}\footnote{KRS得分度量了了机器翻译译文与参考译文之间的字序相关性,其分值越高越好。}
%---------------------------------------------- %----------------------------------------------
% 表 % 表
\begin{table}[htp] \begin{table}[htp]
\centering \centering
\caption{NMT与最优秀的统计机器翻译系统译文的错误率得分} \caption{NMT与SMT系统的译文错误率\cite{Bentivogli2016NeuralVP}}
\label{tab:HTER} \label{tab:HTER}
\begin{tabular}{c|ccc} \begin{tabular}{r|llc}
% & \multicolumn{2}{c}{HTERnoShift} & \\ % & \multicolumn{2}{c}{HTERnoShift} & \\
\textbf{system} & \textbf{word} & \textbf{lemma} & \textbf{\%Δ} \\ \hline \textbf{system} & \textbf{word} & \textbf{lemma} & \textbf{\%Δ} \\ \hline
PBSY &27.1 & 22.5 & -16.9 \\ PBSY &27.1 & 22.5 & -16.9 \\
...@@ -135,9 +135,9 @@ NMT & $ 21.7^{\ast}$ & $18.7^{\ast}$ & -1 ...@@ -135,9 +135,9 @@ NMT & $ 21.7^{\ast}$ & $18.7^{\ast}$ & -1
% 表 % 表
\begin{table}[htp] \begin{table}[htp]
\centering \centering
\caption{根据HTER计算和KRS中的移位运算对单词重新排序进行评估。对于每个系统,将报告生成的单词数,移位错误数及其相应的百分比} \caption{NMT与SMT系统的KRS得分、移位错误数和百分比\cite{Bentivogli2016NeuralVP}}
\label{tab:KRS} \label{tab:KRS}
\begin{tabular}{l | l l l l} \begin{tabular}{r | l l l l}
\textbf{system} &\textbf{\#words} & \textbf{\#shifts} & \textbf{\%shifts} & \textbf{KRS}\\ \hline \textbf{system} &\textbf{\#words} & \textbf{\#shifts} & \textbf{\%shifts} & \textbf{KRS}\\ \hline
PBSY & 11.517 & 354 & 3.1 &84.6 \\ PBSY & 11.517 & 354 & 3.1 &84.6 \\
HPB & 11.417 & 415 & 3.6 &84.3 \\ HPB & 11.417 & 415 & 3.6 &84.3 \\
...@@ -169,13 +169,13 @@ NMT & $ 21.7^{\ast}$ & $18.7^{\ast}$ & -1 ...@@ -169,13 +169,13 @@ NMT & $ 21.7^{\ast}$ & $18.7^{\ast}$ & -1
%-------------------------------------- %--------------------------------------
\parinterval 在最近两年,神经机器翻译的发展更加迅速,新的模型、方法层出不穷。表\ref{tab:result-of-wmt14}就给了2019年对当时一些主流的神经机器翻译模型的对比\cite{WangLearning}。可以看到,相比2017年,2018-2019年中机器翻译仍然有明显的进步。 \parinterval 在最近两年,神经机器翻译的发展更加迅速,新的模型、方法层出不穷。表\ref{tab:result-of-wmt14}给出了2019年一些主流的神经机器翻译模型的对比\cite{WangLearning}。可以看到,相比2017年,2018-2019年中机器翻译仍然有明显的进步。
%---------------------------------------------- %----------------------------------------------
% 表 % 表
\begin{table}[htp] \begin{table}[htp]
\centering \centering
\caption{WMT14英德数据集上神经机器翻译系统的表现\cite{WangLearning}} \caption{WMT14英德数据集上不同神经机器翻译系统的表现\cite{WangLearning}}
\label{tab:result-of-wmt14} \label{tab:result-of-wmt14}
\begin{tabular}{ l | l l l} \begin{tabular}{ l | l l l}
\textbf{模型} &\textbf{作者} & \textbf{年份} & \textbf{BLEU} \\ \hline \textbf{模型} &\textbf{作者} & \textbf{年份} & \textbf{BLEU} \\ \hline
......
...@@ -6,28 +6,32 @@ ...@@ -6,28 +6,32 @@
\begin{tikzpicture} \begin{tikzpicture}
\begin{scope}[local bounding box=WMT] \begin{scope}[local bounding box=WMT]
\draw[->,thick] (0.4,0) to (9.5,0); \draw[->,thick] (0.4,0) to (9.5,0);
\draw[->,thick] (0.4,-0) to (0.4,3.5); \draw[->,thick] (0.4,-0) to (0.4,4.3);
\draw[thick] (0.4,2) to (0.6,2);
\draw[thick] (0.4,4) to (0.6,4);
\node[font=\scriptsize] at (0,2) {10};
\node[font=\scriptsize] at (0,4) {20};
% 2015 % 2015
\node[minimum width=0.5cm,thick,minimum height=7*0.2cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2015) at (1.5*0.7,0.5pt) {}; \node[minimum width=0.5cm,thick,minimum height=7*0.2cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2015) at (1.5*0.7,0.5pt) {};
\node[minimum width=0.5cm,thick,minimum height=2*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2015) at (smt2015.south east) {}; \node[minimum width=0.5cm,thick,minimum height=2*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2015) at (smt2015.south east) {};
\node[font=\normalsize,anchor=north] () at (smt2015.south east) {2015}; \node[font=\scriptsize,anchor=north] () at ([yshift=-0.2em]smt2015.south east) {2015};
% 2016 % 2016
\node[minimum width=0.5cm,thick,minimum height=3*0.2cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2016) at ($(nmt2015.south east)+(0.7,0)$) {}; \node[minimum width=0.5cm,thick,minimum height=3*0.2cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2016) at ($(nmt2015.south east)+(0.7,0)$) {};
\node[minimum width=0.5cm,thick,minimum height=8*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2016) at (smt2016.south east) {}; \node[minimum width=0.5cm,thick,minimum height=8*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2016) at (smt2016.south east) {};
\node[font=\normalsize,anchor=north] () at (smt2016.south east) {2016}; \node[font=\scriptsize,anchor=north] () at ([yshift=-0.2em]smt2016.south east) {2016};
% 2017 % 2017
\node[minimum width=0.5cm,thick,minimum height=3*0.2cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2017) at ($(nmt2016.south east)+(0.7,0)$) {}; \node[minimum width=0.5cm,thick,minimum height=3*0.2cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2017) at ($(nmt2016.south east)+(0.7,0)$) {};
\node[minimum width=0.5cm,thick,minimum height=13*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2017) at (smt2017.south east) {}; \node[minimum width=0.5cm,thick,minimum height=13*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2017) at (smt2017.south east) {};
\node[font=\normalsize,anchor=north] () at (smt2017.south east) {2017}; \node[font=\scriptsize,anchor=north] () at ([yshift=-0.2em]smt2017.south east) {2017};
% 2018 % 2018
\node[minimum width=0.5cm,thick,minimum height=0cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2018) at ($(nmt2017.south east)+(0.7,0)$) {}; \node[minimum width=0.5cm,thick,minimum height=0cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2018) at ($(nmt2017.south east)+(0.7,0)$) {};
\node[minimum width=0.5cm,thick,minimum height=14*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2018) at (smt2018.south east) {}; \node[minimum width=0.5cm,thick,minimum height=14*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2018) at (smt2018.south east) {};
\node[font=\normalsize,anchor=north] () at (smt2018.south east) {2018}; \node[font=\scriptsize,anchor=north] () at ([yshift=-0.2em]smt2018.south east) {2018};
% 2019 % 2019
\node[minimum width=0.5cm,thick,minimum height=0cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2019) at ($(nmt2018.south east)+(0.7,0)$) {}; \node[minimum width=0.5cm,thick,minimum height=0cm,draw,fill=blue!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (smt2019) at ($(nmt2018.south east)+(0.7,0)$) {};
\node[minimum width=0.5cm,thick,minimum height=15*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2019) at (smt2019.south east) {}; \node[minimum width=0.5cm,thick,minimum height=21*0.2cm,draw,fill=red!30!white,inner sep=0pt,outer sep=0pt,anchor=south west] (nmt2019) at (smt2019.south east) {};
\node[font=\normalsize,anchor=north] () at (smt2019.south east) {2019}; \node[font=\scriptsize,anchor=north] () at ([yshift=-0.2em]smt2019.south east) {2019};
\end{scope} \end{scope}
% legend % legend
...@@ -38,5 +42,9 @@ ...@@ -38,5 +42,9 @@
\node[minimum width=0.5cm,rectangle,draw,fill=red!30!white,anchor=north west,label={[label distance=1pt,font=\scriptsize]0:神经机器翻译}] () at (\XCoord,\YCoord) {}; \node[minimum width=0.5cm,rectangle,draw,fill=red!30!white,anchor=north west,label={[label distance=1pt,font=\scriptsize]0:神经机器翻译}] () at (\XCoord,\YCoord) {};
\node[font=\normalsize,rotate=90] () at ([xshift=-1em]WMT.west) {数量}; % \node[font=\normalsize,rotate=90] () at ([xshift=-1em]WMT.west) {数量};
\node[font=\normalsize] () at (0.4,4.5) {数量};
\node[font=\normalsize] () at (9.5,-0.3) {年份};
\end{tikzpicture} \end{tikzpicture}
\ No newline at end of file
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
\definecolor{ublue}{rgb}{0.152,0.250,0.545} \definecolor{ublue}{rgb}{0.152,0.250,0.545}
\begin{tikzpicture} \begin{tikzpicture}
\begin{axis}[ \begin{axis}[
width=10cm, height=6cm, width=10cm, height=5cm,
symbolic x coords={1-15,16-25,26-35,>35}, symbolic x coords={1-15,16-25,26-35,>35},
xtick=data, xtick=data,
ytick={10,12,...,28}, ytick={10,12,...,28},
...@@ -17,14 +17,14 @@ tick align=inside, ...@@ -17,14 +17,14 @@ tick align=inside,
ymajorgrids, ymajorgrids,
major grid style={draw=ublue,dashed}, major grid style={draw=ublue,dashed},
legend pos=outer north east, legend pos=outer north east,
legend style={anchor=north west,yshift=-2.5cm}, legend style={anchor=north west,yshift=-1cm},
ymin=10, ymin=10,
ymax=28] ymax=28]
\addplot [sharp plot,very thick,red!60,mark=diamond*] coordinates{(1-15,11.3) (16-25,16.4) (26-35,17) (>35,19.8)}; \addplot [sharp plot,very thick,red!60,mark=diamond*] coordinates{(1-15,11.3) (16-25,16.4) (26-35,17) (>35,19.8)};
\addplot [sharp plot,very thick,purple!60,mark=triangle*] coordinates{(1-15,14.4) (16-25,22.6) (26-35,23.8) (>35,25.9)}; \addplot [sharp plot,very thick,purple!60,mark=triangle*] coordinates{(1-15,14.4) (16-25,22.6) (26-35,23.8) (>35,25.9)};
\addplot [sharp plot,very thick,green!60,mark=square*] coordinates{(1-15,14.9) (16-25,23.7) (26-35,24.7) (>35,26.4)}; \addplot [sharp plot,very thick,green!60,mark=square*] coordinates{(1-15,14.9) (16-25,23.7) (26-35,24.7) (>35,26.4)};
\addplot [sharp plot,very thick,blue!60,mark=*] coordinates{(1-15,17.5) (16-25,24) (26-35,25) (>35,27)}; \addplot [sharp plot,very thick,blue!60,mark=*] coordinates{(1-15,17.5) (16-25,24) (26-35,25) (>35,27)};
\legend{\scriptsize{NMT},\scriptsize{SPB},\scriptsize{HPB},\scriptsize{PBSY}} \legend{\scriptsize{NMT},\scriptsize{SPB},\scriptsize{HPB},\scriptsize{PBSY}}
\end{axis} \end{axis}
\end{tikzpicture} \end{tikzpicture}
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论