-
Notifications
You must be signed in to change notification settings - Fork 0
/
thesis.tex.bak
370 lines (314 loc) · 16 KB
/
thesis.tex.bak
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
\documentclass[12pt,final,twoside]{report}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Some credits:
% The template initially was created by Prof. Dr. Holger Karl/Uni Paderborn '2006
% and was expanded and updated by Dipl.-Inform. Stefan Heinrich/Uni Paderborn/Uni Hamburg since 2008.
% Suggestions for changes are always welcome.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Meta information:
\newcommand{\trtitle}{Word2Vec and Echo State Network For Thematic Role Assignment}
\newcommand{\trtype}{Master Thesis} %{Diplomarbeit} %{Dissertation}
\newcommand{\trcourseofstudies}{Intelligent Adaptive Systems} %{Bioinformatik}
\newcommand{\trauthor}{Surender Kumar}
\newcommand{\trauthortitle}{} %{Dipl.-Inform.\ }
\newcommand{\tremail}{[email protected]}
\newcommand{\trmatrikelnummer}{6519753}
\newcommand{\trstreet}{Kaemmererufer 13}
\newcommand{\trcity}{22303 Hamburg}
\newcommand{\trevaluatorA}{\href{mailto:[email protected]}{Prof. Dr. Stefan Wermter}}
\newcommand{\trevaluatorB}{\href{mailto:[email protected]}{ Dr. Sven Magg}}
%\newcommand{\trbetreuung}{\href{mailto:[email protected]}{Dipl.-Inform. To Be Defined}}
\newcommand{\trdepartment}{Knowledge Technology, WTM}
\newcommand{\trdate}{14.10.2016}
\newcommand{\trkeywords}{Word2Vec, ESN, NLP, TRA, Language, Semantic role labelling}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Languages:
% If the thesis is written in English:
\usepackage[english]{babel}
\selectlanguage{english}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Bind packages:
\usepackage{acronym} % Acronyms
\usepackage{algorithmic} % Algorithms and Pseudocode
\usepackage{algorithm} % Algorithms and Pseudocode
\usepackage{amsfonts} % AMS Math Packet (Fonts)
\usepackage{amsmath} % AMS Math Packet
\usepackage{amssymb} % Additional mathematical symbols
\usepackage{amsthm}
\usepackage{booktabs} % Nicer tables
%\usepackage[font=small,labelfont=bf]{caption} % Numbered captions for figures
\usepackage{color} % Enables defining of colours via \definecolor
\definecolor{uhhRed}{RGB}{226,0,26} % Official Uni Hamburg Red
\definecolor{uhhGrey}{RGB}{136,136,136} % Official Uni Hamburg Grey
\definecolor{uhhLightGrey}{RGB}{220, 220, 220}
\usepackage{fancybox} % Put equations in a frame
\usepackage{fancyhdr} % Packet for nicer headers
%\usepackage{fancyheadings} % Nicer numbering of headlines
\usepackage[body={5.8in,9in}]{geometry} % Type area (size, margins...)
\usepackage[inline, shortlabels]{enumitem}
\setlist{itemjoin ={,\enspace},itemjoin* = { and\enspace}}
%\geometry{a4paper,outer=3.35cm} % !!!Release version (Normal margins)
\geometry{a4paper,outer=2.5cm} % !!!Print version (Additional margin on the left for the binding)
%\geometry{a4paper} % !!!Proofread version (Additional margin on the right for corrections)
%\geometry{a4paper,outer=3.15cm} % !!!Draft version (Same margins on left and right)
%\geometry{paperheight=10.0in,paperwidth=6.4in,top=0.51in,left=0.3in} % !!!Developer version (Minimal margins)
\usepackage{graphicx} % Inclusion of graphics
\usepackage{latexsym} % Special symbols
\usepackage{longtable} % Allow tables over several parges
\usepackage{listings} % Nicer source code listings
\usepackage{multicol} % Content of a table over several columns
\usepackage{multirow} % Content of a table over several rows
\usepackage{rotating} % Alows to rotate text and objects
\usepackage[hang]{subfigure} % Allows to use multiple (partial) figures in a fig
%HINT: subfigure may be outdated already - maybe try subfig instead
%\usepackage[font=footnotesize,labelfont=rm]{subfig} % Pictures in a floating environment
\usepackage{tabularx} % Tables with fixed width but variable rows
\usepackage{tabulary}
\usepackage{url,xspace,boxedminipage} % Accurate display of URLs
\usepackage[table,xcdraw]{xcolor}
\usepackage{booktabs,caption,fixltx2e}
\usepackage[flushleft]{threeparttable}
\usepackage{color, colortbl}
\usepackage{hhline}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% PDF Information und Definitions:
\author{\trauthor}
\ifx\pdftexversion\undefined
\usepackage{hyperref}
\else
\usepackage[colorlinks=false, % link is colores (true) or has colored frame (false)
linkcolor=uhhRed, % case colorlinks=true: define color.
urlcolor=uhhRed,
citecolor=uhhRed,
bookmarks, % Place bookmarks erstellen
bookmarksopen=true, % Bookmarks will be shown at start (true/false)
pdfpagemode=UseOutlines,
bookmarksopenlevel=1, % Define the depth of shown links
bookmarksnumbered, % Numbers of chapers in Bookmarks
pdftitle={\trtitle},
pdfsubject={\trtype},
pdfkeywords={\trkeywords},
pdfauthor={\trauthor},
plainpages=false
]{hyperref}
\fi
\ifx\pdftexversion\undefined
\else
\pdfoutput=1 % Disable PDF-Output
\pdfimageresolution=1200
\pdfcompresslevel=2 % 0 = no compression, 9 = strongest compression
\fi
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Configurationen:
\hyphenation{whe-ther} % Manually use: "\-" in a word: Staats\-ver\-trag
\numberwithin{equation}{section}
%\lstloadlanguages{C} % Set the default language for listings
\DeclareGraphicsExtensions{.pdf,.jpg,.png,.eps} % first try pdf, then eps, png and jpg
\graphicspath{{./src/}} % Path to a folder where all pictures are located
\pagestyle{fancy} % Use nicer header and footer
% Redefine the environments for floating objects:
\setcounter{topnumber}{3}
\setcounter{bottomnumber}{2}
\setcounter{totalnumber}{4}
\renewcommand{\topfraction}{0.9} %Standard: 0.7
\renewcommand{\bottomfraction}{0.5} %Standard: 0.3
\renewcommand{\textfraction}{0.1} %Standard: 0.2
\renewcommand{\floatpagefraction}{0.8} %Standard: 0.5
% Tables with a nicer padding:
\renewcommand{\arraystretch}{1.2}
\newcolumntype{Y}{>{\centering\arraybackslash}X}
% Chapter and Sections will not be written in capitals
\renewcommand{\chaptermark}[1]{\markboth{\chaptername \ \thechapter.\ #1}{}}
\renewcommand{\sectionmark}[1]{\markright{\thesection.\ #1}}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Additional 'theorem' and 'definition' blocks:
\theoremstyle{plain}
\newtheorem{theorem}{Theorem}[chapter]
%\newtheorem{theorem}{Satz}[chapter] % Wenn in Deutsch geschrieben wird.
\newtheorem{axiom}{Axiom}[chapter]
%\newtheorem{axiom}{Fakt}[chapter] % Wenn in Deutsch geschrieben wird.
%Usage:%\begin{axiom}[optional description]%Main part%\end{fakt}
\theoremstyle{definition}
\newtheorem{definition}{Definition}[chapter]
%Additional types of axioms:
\newtheorem{lemma}[axiom]{Lemma}
\newtheorem{observation}[axiom]{Observation}
%Additional types of definitions:
\theoremstyle{remark}
%\newtheorem{remark}[definition]{Bemerkung} % Wenn in Deutsch geschrieben wird.
\newtheorem{remark}[definition]{Remark}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Provides TODOs within the margin:
\newcommand{\TODO}[1]{\marginpar{\emph{\small{{\bf TODO: } #1}}}}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Abbreviations and mathematical symbols
\newcommand{\modd}{\text{ mod }}
\newcommand{\RS}{\mathbb{R}}
\newcommand{\NS}{\mathbb{N}}
\newcommand{\ZS}{\mathbb{Z}}
\newcommand{\dnormal}{\mathit{N}}
\newcommand{\duniform}{\mathit{U}}
\newcommand{\erdos}{Erd\H{o}s}
\newcommand{\renyi}{-R\'{e}nyi}
% it is recommented to define complex terms as expression/newcommand and use the expression in the tex instead.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Document:
\begin{document}
\pagenumbering{Roman} % Roman pagenumbering for lists and meta pages
\renewcommand{\headheight}{14.5pt} % Size of headings
\thispagestyle{empty}
\fancyhead[LO,RE]{} % Define the header style for the meta pages
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Cover sheet
\begin{titlepage}
%---Possibility 1:
\begin{flushleft}
\includegraphics[width=85mm]{uhhLogoL.pdf}\\
\end{flushleft}
%---Possibility 2:
%\includegraphics*[width=0.09\textwidth]{uhhIconR_}
%\parbox[c]{10cm}{
% \begin{center}
% Universit\"at Hamburg --- MIN-Fakult\"at\\
% \trfachgruppe
% \end{center}
% }\hfill
%\includegraphics*[width=0.09\textwidth]{infIcon_}
%\vspace{0.2cm}
%---
\rule{\textwidth}{0.4pt}
\newline
\vspace{2.0cm}
\begin{center}
\LARGE \textbf{\trtitle}
\end{center}
\vspace{2.0cm}
\begin{center}
\textbf{\trtype}\\
%am Fachgebiet \trdepartment\\
at the Research Group \trdepartment\\
\trevaluatorA\medskip\\
Department Informatik\\
MIN-Fakult\"at\\
Universit\"at Hamburg \\[0.5cm]
Submitted by \\
\textbf{\trauthortitle\href{mailto:\tremail}{\trauthor}}\\
on\\
\trdate
\end{center}
\vspace{1cm}
\begin{center}
\begin{tabular}{ll}
Evaluators: & \trevaluatorA \\
& \trevaluatorB \\
%Betreuung: & \trbetreuung \\ % Adviser are not allowed to demand getting credited, but are happy getting credited by the students initiative
\end{tabular}
\end{center}
\vfill
\begin{tabular}{l}
\trauthor \\
Matriculation Number: \trmatrikelnummer \\
\trstreet \\
\trcity
\end{tabular}
\newline
\rule{\textwidth}{0.4pt}
\newpage
\end{titlepage}
%backsite of cover sheet is empty!
\thispagestyle{empty}
\hspace{1cm}
\newpage
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Abstract:
\section*{Abstract}\label{sec:abstract}
%\fancyhead[LE,RO]{\it Abstract}
%\addcontentsline{toc}{chapter}{\numberline{}Abstract}
Humans have a remarkable capability of acquiring language and in particular more than one language. More interestingly, they learn it within the same neural computing substrate. But, how the structure of a sentence is mapped to its meaning within the brain is still an open issue? To understand this process of language acquisition, several neural language models have been proposed. Most of the existing models are either using syntactic parse trees to create handcrafted features or using localist vector representation of words to process the sentences. Hinaut et al. \cite{xavier:2013:RT} proposed the $\theta$RARes (Thematic Role Assignment Reservoir) neural language acquisition model, for the Thematic Role Assignment (TRA) task. The model learns the thematic roles, i.e., ``Who did what to whom", purely from the grammatical structure of the sentences. The semantic information was removed from the sentences by replacing semantic words with a unique token (`SW'). The model process the transformed sentences considering the words as discrete atomic symbols i.e. using localist word representation. The localist representation of the words does not carry any semantic and syntactic information about the words. This thesis proposes an end-to-end neural language model, Word2Vec-$\theta$RARes, in an extension of $\theta$RARes model. In addition to utilizing syntactic information and modeling temporal aspect of the input sentences, the proposed model also takes into account the semantics of the words. The model contains a Word2Vec unit to generate the distributed vector representation of words which captures the semantic and syntactic relationships. The model also contains a Recurrent Neural Network namely, Echo state Network (ESN), with fixed random connections, which is capable of modeling the sequential data. Thus, the model receives a raw sentence as an input which is processed word by word across time, and the meaning of the sentence is generated as an output. The results of the experiments conducted using the Word2Vec-$\theta$RARes model shows that the exposure of semantic and syntactic information to the ESN increases the performance on the TRA task. Apart from this, the Word2Vec-$\theta$RARes model also re-analyse the meaning of the sentence on arrival of words. Also, in some cases, the model correctly predicts the meaning of the sentences even before the sentences are finished.
\cleardoublepage
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Lists:
%\setcounter{tocdepth}{1} % depth of the table of contents (for BSc and MSc Thesis 1 is recommented)
\fancyhead[LE,RO]{\it Contents}
\tableofcontents
\cleardoublepage
% List of Figures and List of tables are optional. -> Not needed in most theses.
\fancyhead[LE,RO]{\it List of Figures}
\listoffigures
\cleardoublepage
\fancyhead[LE,RO]{\it List of Tables}
\listoftables
\cleardoublepage
\fancyhead[LE,RO]{\it Abbreviations}
\input{glossary.tex}
\cleardoublepage
%\lstlistoflistings
%\cleardoublepage
\fancyhead[LE]{\it \leftmark} % Define the header style for the text pages
\fancyhead[RO]{\it \rightmark} % Define the header style for the text pages
\fancyhead[LO,RE]{} % Define the header style for the text pages
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% The content will be included here:
\pagenumbering{arabic}
\input{1introduction.tex}
\cleardoublepage
\input{2basics.tex}
\cleardoublepage
\input{3openIssues.tex}
\cleardoublepage
\input{4approach.tex}
\cleardoublepage
\input{5experiments.tex}
\cleardoublepage
\input{6results.tex}
\cleardoublepage
\input{7conclusions.tex}
\cleardoublepage
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Appendices:
% these are optional! For most Bachelor-theses and some Master-thesis none of them is needed.
% Just comment them if not needed.
\appendix
\fancyhead[LO,RE]{} % Define the header style for the appendixpages
\fancyhead[LE,RO]{\it Appendix A. Complete Simulation Results}%Adapt letter!
\input{appA.tex}
\cleardoublepage
% ... add as much appendices as you need (one can also add source code, for example)
%\fancyhead[LE]{\it \leftmark}
%\chapter{}
\fancyhead[LE,RO]{\it Bibliography} % A bibliography never have a letter or numbering!
\bibliographystyle{plain} % Style for presenting the literature
\addcontentsline{toc}{chapter}{Bibliography}% Add to the TOC
\bibliography{thesis,esn,word2vec}
\cleardoublepage
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Formal page 1
\vspace{2cm}
\chapter*{Erkl\"arung der Urheberschaft}
\label{sec:urheber}
\fancyhead[LE]{\it Erkl\"arung der Urheberschaft}
Ich versichere an Eides statt, dass ich die \trtype{} im Studiengang \trcourseofstudies{} selbstst\"andig verfasst und keine anderen als die angegebenen Hilfsmittel -- insbesondere keine im Quellenverzeichnis nicht benannten Internet-Quellen -- benutzt habe. Alle Stellen, die w\"ortlich oder sinngem\"a{\ss} aus Ver\"offentlichungen entnommen wurden, sind als solche kenntlich gemacht. Ich versichere weiterhin, dass ich die Arbeit vorher nicht in einem anderen Pr\"ufungsverfahren eingereicht habe und die eingereichte schriftliche Fassung der auf dem elektronischen Speichermedium entspricht.
%Ich versichere an Eides statt, dass ich die vorliegende \trtype{} selbstst\"andig und ohne unerlaubte Hilfe Dritter angefertigt habe. Alle Stellen, die inhaltlich oder w\"ortlich aus anderen Ver\"offentlichungen stammen, sind kenntlich gemacht. Diese Arbeit lag in gleicher oder \"ahnlicher Weise noch keiner Pr\"ufungsbeh\"orde vor und wurde bisher noch nicht ver\"offentlicht.
\vspace{4cm}
\noindent Ort, Datum \hfill Unterschrift
%The backcover is always empty
\newpage
\thispagestyle{empty}
\hspace{1cm}
\newpage
%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Formal page 2
\vspace{2cm}
\chapter*{Erkl\"arung zur Ver\"offentlichung}
\label{sec:urheber}
\fancyhead[LE]{\it Erkl\"arung zur Ver\"offentlichung}
Ich erkl\"are mein Einverst\"andnis mit der Einstellung dieser \trtype{} in den Bestand der Bibliothek.
\vspace{4cm}
\noindent Ort, Datum \hfill Unterschrift
%The backcover is always empty
\newpage
\thispagestyle{empty}
\hspace{1cm}
\newpage
\end{document}
%EOF