Bachelor-Final-Presentation: Added first draft

2025-04-26 06:48:04 +02:00 · 2014-10-31 06:48:58 +01:00 · 2014-10-31 06:48:58 +01:00 · 1ee32917ab
commit 1ee32917ab
parent 22b5998d56
30 changed files with 544 additions and 0 deletions
--- a/presentations/Bachelor-Final-Presentation/LaTeX/Bachelor-Final-Presentation.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/Bachelor-Final-Presentation.tex
@ -0,0 +1,47 @@
+\documentclass[hyperref={pdfpagelabels=false},usepdftitle=false]{beamer}
+\usepackage{../templates/myStyle}
+
+\begin{document}
+\selectlanguage{english}
+
+\title{\titleText}
+\subtitle{Bachelor's thesis of Martin Thoma}
+\author{\tutor}
+\date{5th of June, 2014}
+%\subject{Programmieren}
+
+\frame{\titlepage}
+
+\frame{
+    \frametitle{Contents}
+    \setcounter{tocdepth}{1}
+    \tableofcontents
+    \setcounter{tocdepth}{2}
+}
+
+%\AtBeginSection[]{
+%    \InsertToC[sections={\thesection}]  % shows only subsubsections of one subsection
+%}
+
+\section{What is my Bachelor's thesis about?}
+\input{introduction}
+
+\section{write-math.com and HWRT}
+\input{write-math}
+
+% \section{Preprocessing and Features}
+% \input{preprocessing}
+% \input{features}
+
+\section{Evaluation}
+\input{evaluation}
+
+% \section{What will I do next?}
+% \input{will-do}
+
+\section*{End}
+\subsection{End}
+\input{sources}
+\framedgraphic{Thanks for Your Attention!}{../images/xi.png}
+
+\end{document}
--- a/presentations/Bachelor-Final-Presentation/LaTeX/Makefile
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/Makefile
@ -0,0 +1,10 @@
+# Base name (without extension) of the main LaTeX document.
+SOURCE := Bachelor-Final-Presentation
+
+# Neither target names a file produced by its recipe, so always run them,
+# even if a file called "make" or "clean" happens to exist.
+.PHONY: make clean
+
+# Default target: build the PDF, then remove the auxiliary files.
+#  - pdflatex options are given before the file name.
+#  - -shell-escape is needed for the logo.
+#  - pdflatex runs twice so that the table of contents is up to date.
+#  - $(MAKE) instead of a literal "make" passes flags such as -n and -j
+#    on to the sub-make.
+# Alternative using latexmk (kept for reference, not executed):
+#   latexmk -pdf -pdflatex="pdflatex -interaction=nonstopmode" -use-make $(SOURCE).tex
+make:
+	pdflatex -shell-escape -output-format=pdf $(SOURCE).tex
+	pdflatex -shell-escape -output-format=pdf $(SOURCE).tex
+	$(MAKE) clean
+
+# Remove auxiliary files written by LaTeX and related tools; the PDF is kept.
+# The former $(TARGET) argument is dropped: this Makefile never defines
+# TARGET, so it expanded to nothing.
+clean:
+	rm -rf *.class *.html *.log *.aux *.out *.glo *.glg *.gls *.ist *.xdy *.1 *.toc *.snm *.nav *.vrb *.fls *.fdb_latexmk *.pyg
--- a/presentations/Bachelor-Final-Presentation/LaTeX/evaluation.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/evaluation.tex
@ -0,0 +1,111 @@
+\subsection{Merged Symbols}
+\begin{frame}[fragile]{Merged symbols (MER error)}
+\begin{table}[ht]
+    \centering
+    \begin{tabular}{lc|lc}
+        \toprule
+        \multicolumn{2}{c}{Base symbol} & \multicolumn{2}{c}{equivalent symbols}\\
+        \LaTeX         & Rendered       & \LaTeX                 & Rendered  \\\midrule
+        \verb+\sum+    & $\sum$         & \verb+$\Sigma$+        & $\Sigma$\\
+        \verb+\prod+   & $\prod$        & \verb+$\Pi$+           & $\Pi$\\
+        ~              & ~              & \verb+$\sqcap$+        & $\sqcap$\\
+        \verb+\coprod+ & $\coprod$      & \verb+$\amalg$+        & $\amalg$\\
+        ~              & ~              & \verb+$\sqcup$+        & $\sqcup$\\
+        \verb+\perp+   & $\perp$        & \verb+$\bot$+          & $\bot$\\
+        \verb+\models+ & $\models$      & \verb+$\vDash$+        & $\vDash$\\
+        \verb+|+       & $|$            & \verb+\mid+            & $\mid$  \\
+        \verb+\Delta+  & $\Delta$       & \verb+$\triangle$+     & $\triangle$\\
+        ~              & ~              & \verb+$\vartriangle$+  & $\vartriangle$\\
+        \bottomrule
+    \end{tabular}
+\end{table}
+\end{frame}
+
+\begin{frame}[fragile]{Merged symbols (MER error)}
+\begin{table}[ht]
+    \centering
+    \begin{tabular}{lc|lc}
+        \toprule
+        \multicolumn{2}{c}{Base symbol} & \multicolumn{2}{c}{equivalent symbols}\\
+        \LaTeX         & Rendered       & \LaTeX                 & Rendered  \\\midrule
+        \verb+\|+      & $\|$           & \verb+$\parallel$+     & $\parallel$\\
+        \verb+\ohm+    & $\Omega$         & \verb+$\Omega$+      & $\Omega$\\
+        \verb+\setminus+ & $\setminus$  & \verb+$\backslash$+    & $\backslash$\\
+        \verb+\checked+ & {\mbox {\wasyfamily \char 8}} & \verb+$\checkmark$+    & $\checkmark$\\
+        \verb+\&+      & $\&$           & \verb+$\with$+         & $\&$\\
+        \verb+\#+      & $\#$           & \verb+$\sharp$+        & $\sharp$\\
+        \verb+\S+      & $\S$           & \verb+$\mathsection$+  & $\mathsection$\\
+        \verb+\nabla+  & $\nabla$       & \verb+\triangledown+   & $\triangledown$\\
+        \verb+\lhd+    & $\lhd$         & \verb+$\triangleleft$+ & $\triangleleft$\\
+        ~              & ~              & \verb+$\vartriangleleft$+ & $\vartriangleleft$\\
+        \verb+\oiint+  & $\oiint$       & \verb+$\varoiint$+     & $\varoiint$\\
+        \bottomrule
+    \end{tabular}
+\end{table}
+\end{frame}
+
+
+\begin{frame}[fragile]{Merged symbols (MER error)}
+\begin{table}[ht]
+    \centering
+    \begin{tabular}{lc|lc}
+        \toprule
+        \multicolumn{2}{c}{Base symbol} & \multicolumn{2}{c}{equivalent symbols}\\
+        \LaTeX         & Rendered       & \LaTeX                 & Rendered  \\\midrule
+        \verb+\mathbb{R}+ & $\mathbb{R}$ & \verb+$\mathds{R}$+   & $\mathds{R}$\\
+        \verb+\mathbb{Q}+ & $\mathbb{Q}$ & \verb+\mathds{Q}+     & $\mathds{Q}$\\
+        \verb+\mathbb{Z}+ & $\mathbb{Z}$ & \verb+\mathds{Z}+     & $\mathds{Z}$\\
+        \verb+\mathcal{A}+ & $\mathcal{A}$ & \verb+\mathscr{A}+  & $\mathscr{A}$\\
+        \verb+\mathcal{D}+ & $\mathcal{D}$ & \verb+\mathscr{D}+  & $\mathscr{D}$\\
+        \verb+\mathcal{N}+ & $\mathcal{N}$ & \verb+\mathscr{N}+  & $\mathscr{N}$\\
+        \verb+\mathcal{R}+ & $\mathcal{R}$ & \verb+\mathscr{R}+  & $\mathscr{R}$\\
+        \verb+\propto+ & $\propto$      & \verb+$\varpropto$+    & $\varpropto$\\
+        \bottomrule
+    \end{tabular}
+\end{table}
+\end{frame}
+
+\subsection{Evaluation}
+\begin{frame}{Experiments}
+    \textbf{Preprocessing:} Scaling, shifting and linear interpolation\\
+    \textbf{Features:} Coordinates of 80 points (4 strokes with 20 points each)\\
+    \textbf{Learning:} MLP, 1000 epochs, LR $\eta=0.1$, Momentum $\alpha=0.1$
+\begin{table}[h]
+    \centering
+    \begin{tabular}{clrrr}
+    \toprule
+    \multirow{2}{*}{System}  & \multirow{2}{*}{Topology} & \multicolumn{3}{c}{Classification error}\\ 
+          &                         & TOP1                   & TOP3                  & MER \\\midrule
+    $B_1$ & 160:500:369             & $\SI{23.34}{\percent}$ & $\SI{6.80}{\percent}$ & $\SI{6.64}{\percent}$ \\
+    $B_2$ & 160:500:500:369         & \underline{$\SI{21.51}{\percent}$} & $\SI{5.75}{\percent}$ & $\SI{5.67}{\percent}$ \\
+    $B_3$ & 160:500:500:500:369     & $\SI{21.93}{\percent}$ & \underline{$\SI{5.74}{\percent}$} & \underline{$\SI{5.64}{\percent}$} \\
+    $B_4$ & 160:500:500:500:500:369 & $\SI{23.88}{\percent}$ & $\SI{6.12}{\percent}$ & $\SI{6.04}{\percent}$ \\
+    \bottomrule
+    \end{tabular}
+    \caption{Baseline systems with three different classification error measures.
+             All errors were measured on the test set.}
+\label{table:baseline-systems}
+\end{table}
+\end{frame}
+
+\subsection{Complex classifier}
+\begin{frame}{Complex classifier}
+    \textbf{Preprocessing:} Connect strokes, scale, shift and linear interpolation\\
+    \textbf{Features:} Coordinates of 80 points (4 strokes with 20 points each), re-curvature per stroke, ink, stroke count, aspect ratio\\
+    \textbf{Learning:} MLP, 1000 epochs, LR $\eta=0.1$, Momentum $\alpha=0.1$
+\begin{table}[htb]
+    \centering
+    \begin{tabular}{lrrrrrr}
+    \toprule
+    \multirow{2}{*}{System}  & \multicolumn{6}{c}{Classification error}\\
+              & TOP1                   & change                 & TOP3                  & change                 & MER                   & change \\\midrule
+    $B_{1,c}$ & $\SI{20.96}{\percent}$ & $\SI{-2.38}{\percent}$ & $\SI{5.24}{\percent}$ & $\SI{-1.56}{\percent}$ & $\SI{5.13}{\percent}$ & $\SI{-1.51}{\percent}$ \\
+    $B_{2,c}$ & $\SI{20.10}{\percent}$ & $\SI{-1.41}{\percent}$ & $\SI{4.44}{\percent}$ & $\SI{-1.31}{\percent}$ & $\SI{4.36}{\percent}$ & $\SI{-1.31}{\percent}$ \\
+    $B_{3,c}$ & $\SI{21.51}{\percent}$ & $\SI{-0.42}{\percent}$ & $\SI{4.89}{\percent}$ & $\SI{-0.85}{\percent}$ & $\SI{4.80}{\percent}$ & $\SI{-0.84}{\percent}$ \\
+    $B_{4,c}$ & $\SI{00.00}{\percent}$ & $\SI{-0.00}{\percent}$ & $\SI{0.00}{\percent}$ & $\SI{-0.00}{\percent}$ & $\SI{0.00}{\percent}$ & $\SI{-0.00}{\percent}$ \\
+    \bottomrule
+    \end{tabular}
+    \caption{Error rates of the complex recognizer systems.}
+\label{table:complex-recognizer-systems-evaluation}
+\end{table}
+\end{frame}
--- a/presentations/Bachelor-Final-Presentation/LaTeX/features.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/features.tex
@ -0,0 +1,23 @@
+\subsection{Features}
+\begin{frame}{Features}
+    \begin{itemize}
+        \item Local
+        \begin{itemize}
+            \item Coordinates
+            \item Speed
+            \item Binary pen pressure
+            \item Direction
+            \item Curvature
+            \item Bitmap-environment
+            \item Hat-Feature
+        \end{itemize}
+        \item Global
+        \begin{itemize}
+            \item \# of points
+            \item \# of strokes
+            \item Center point
+            \item Bitmap
+            \item Bounding box (width, height, time)
+        \end{itemize}
+    \end{itemize}
+\end{frame}
--- a/presentations/Bachelor-Final-Presentation/LaTeX/formula-recognition-logo.png
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/formula-recognition-logo.png
--- a/presentations/Bachelor-Final-Presentation/LaTeX/introduction.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/introduction.tex
@ -0,0 +1,30 @@
+\subsection{Online and offline recognition}
+
+\begin{frame}{What is my Bachelor's thesis about?}
+    \begin{itemize}
+        \item Recognition of handwritten mathematical symbols
+        \item On-line recognition, not OCR!
+        \item Given a series of points $(x(t), y(t), b(t))$\\
+              I want to get the proper \LaTeX{} command.
+    \end{itemize}
+\end{frame}
+
+\begin{frame}{Why did I work on this topic?}
+    \begin{itemize}
+        \item \LaTeX{} is easy as soon as you know the \textbackslash{}commands.
+        \item It's hard to find the \LaTeX{} command of single symbols.
+        \item It's much harder to find complete formulas.
+    \end{itemize}
+
+    % I want to
+    % \begin{itemize}
+    %     \item provide a tool that enables beginners to get the best \LaTeX{} command
+    %           for their formula,
+    %     \item find out what works best for symbol recognition
+    %     \item and provide data and a platform to test new ideas for classifiers
+    % \end{itemize}
+
+    For now: recognition of isolated symbols. That means:
+
+    single-symbol \enquote{formulas} rather than multi-symbol formulas
+\end{frame}
--- a/presentations/Bachelor-Final-Presentation/LaTeX/logos/formula-recognition-logo.png
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/logos/formula-recognition-logo.png
--- a/presentations/Bachelor-Final-Presentation/LaTeX/preprocessing.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/preprocessing.tex
@ -0,0 +1,18 @@
+\subsection{Preprocessing}
+\begin{frame}{Preprocessing}
+    \begin{itemize}
+        \item Normalizing
+        \begin{itemize}
+            \item Scaling
+            \item Shifting
+            \item Resampling
+        \end{itemize}
+        \item Noise reduction
+        \begin{itemize}
+            \item Smoothing (e.g. moving average)
+            \item Dot reduction
+            \item Filtering (by distance, speed or angle)
+            \item Stroke connection
+        \end{itemize}
+    \end{itemize}
+\end{frame}
--- a/presentations/Bachelor-Final-Presentation/LaTeX/sources.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/sources.tex
@ -0,0 +1,12 @@
+\subsection{Sources}
+\begin{frame}{Image Sources}
+    \begin{itemize}
+	\item \href{https://commons.wikimedia.org/wiki/File:Server-multiple.svg}{Server} by RRZEicons
+    \item \href{https://commons.wikimedia.org/wiki/File:Computer-aj_aj_ashton_01.svg}{Desktop Computer} by Ed g2s,
+          Ironbrother, Kierancassel and Msgj
+    \item \href{https://commons.wikimedia.org/wiki/File:Server_by_mimooh.svg}{Server} by Mimooh
+    \end{itemize}
+
+    The presentation can be found at \url{http://tinyurl.com/write-math-short-presentation}
+\end{frame}
+
--- a/presentations/Bachelor-Final-Presentation/LaTeX/will-do.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/will-do.tex
@ -0,0 +1,24 @@
+\subsection{What will I do next?}
+\begin{frame}{What will I do next?}
+    \begin{itemize}
+        \item Include the currently best model in write-math.com
+        \item Evaluate preprocessing steps
+        \item Try other features
+        \item Try other topologies / trainings (e.g. pretraining, newbob)
+        \item Eventually try convolutional neural nets
+    \end{itemize}
+\end{frame}
+
+% \subsection{Far future}
+% \begin{frame}{What could be done?}
+%     \begin{itemize}
+%         \item Make use of audio data in a multimodal approach\\
+%               e.g. $R$ and $\mathcal{R}$
+%         \item Currently, the Lecture Translation system doesn't recognize math.\\
+%               You get \enquote{integral of e raised to the power of x d x} instead
+%               of $\int e^x \mathrm{d} x$.
+%         \item Spoken math is ambiguous: $\sqrt{a+b}$ vs. $\sqrt{a} + b$
+%         \item The language model I create could help to find probable formulas
+%         \item The platform could be used to get more input data of users
+%     \end{itemize}
+% \end{frame}
--- a/presentations/Bachelor-Final-Presentation/LaTeX/write-math.tex
+++ b/presentations/Bachelor-Final-Presentation/LaTeX/write-math.tex
@ -0,0 +1,149 @@
+\subsection{Write Math}
+
+\begin{frame}{write-math.com}
+    \begin{itemize}
+        \item a website where users can add labeled training data and unlabeled
+              data which they want to classify. I call this data \enquote{recording}
+        \begin{figure}[ht]
+            \centering
+            \subfloat{
+                \includegraphics[height=0.1\textwidth]{../images/279952.pdf}
+            }%
+            \qquad
+            \subfloat{
+                \includegraphics[height=0.1\textwidth]{../images/281507.pdf}
+            }%
+            \qquad
+            \subfloat{
+                \includegraphics[height=0.1\textwidth]{../images/287612.pdf}
+            }%
+            \qquad
+            \subfloat{
+                \includegraphics[height=0.1\textwidth]{../images/292175.pdf}
+            }%
+            \caption*{4 recordings}
+        \end{figure}
+        \item works with desktop computers and touch devices
+        \item symbol recognition can be done by multiple classifiers
+        \item users can contribute formulas as recordings and as \LaTeX{} answers
+              for recordings
+        \item users can vote for \LaTeX{} answers:
+              \Large $\leq$, $\leqq$, $\leqslant$, \dots \normalsize
+        \item user who entered the recording can accept one answer
+    \end{itemize}
+\end{frame}
+
+% \framedgraphic{Classify}{../images/classify.png}
+% \framedgraphic{Workflow}{../images/workflow.png}
+% \framedgraphic{User page}{../images/user-page.png}
+% \framedgraphic{Information about recordings}{../images/view.png}
+% \framedgraphic{Symbol page}{../images/symbol.png}
+% \framedgraphic{Training}{../images/train.png}
+% \framedgraphic{Ranking}{../images/ranking.png}
+
+
+\begin{frame}[fragile]{Statistics}
+    \begin{itemize}
+        \item 127 users with at least 5 recordings
+        \item $\num{1111}$ symbols, but only $\num{369}$ used for experiments
+        \item $\num{235831}$ recordings (e.g. $\num{3489}$ times \verb+\int+, but only 50 times \verb+X+)
+    \end{itemize}
+\end{frame}
+
+% \begin{frame}{First classification worker}
+%     \begin{itemize}
+%         \item preprocessing: Scale to fit into unit square while keeping the aspect
+%               ratio
+%         \item applies greedy time warping
+%         \item compares a new recording with every recording
+%               in the database
+%         \item[$\Rightarrow$] Classification time is in $\mathcal{O}(\text{recordings})$,
+%               but we rather would like $\mathcal{O}(\text{symbols})$
+%         \item the current server / workflow can only handle about 4000 recordings
+%         \item[$\Rightarrow$] Another way to classify is necessary
+%     \end{itemize}
+% \end{frame}
+
+\begin{frame}[fragile]{Handwriting Recognition Toolkit (hwrt)}
+    \begin{itemize}
+        \item Many preprocessing algorithms / features implemented
+        \item Plug-in system for preprocessing algorithms / features
+        \item Needs neural network toolkit
+        \item Hosted at \url{https://github.com/MartinThoma/hwrt}
+        \item Installable via \verb+pip+ (Python package installer):\\
+              \verb+$ pip install hwrt+
+    \end{itemize}
+\end{frame}
+
+\begin{frame}[fragile]{hwrt preprocessing configuration file}
+    \begin{verbatim}
+data-source: raw-datasets/2014-08-26-20-14-data-raw.pickle
+queue:
+  - RemoveDuplicateTime: null
+  - ScaleAndShift:
+      - max_width: 1.0
+      - max_height: 1.0
+      - center: true
+  - SpaceEvenlyPerStroke:
+      - kind: linear
+      - number: 20
+    \end{verbatim}
+\end{frame}
+
+\subsection{Preprocessing algorithms}
+\begin{frame}{Preprocessing algorithms}
+    \begin{itemize}
+        \item Normalizing
+        \begin{itemize}
+            \item Scaling
+            \item Shifting
+            \item Resampling
+        \end{itemize}
+        \item Noise reduction
+        \begin{itemize}
+            \item Smoothing (e.g. moving average)
+            \item Dot reduction
+            \item Filtering (by distance, speed or angle)
+            \item Stroke connection
+        \end{itemize}
+    \end{itemize}
+\end{frame}
+
+\begin{frame}[fragile]{hwrt feature configuration file}
+    \begin{verbatim}
+data-source: preprocessed/baseline
+data-multiplication:
+  - Multiply:
+      - nr: 1
+features:
+  - ConstantPointCoordinates:
+      - strokes: 4
+      - points_per_stroke: 20
+      - fill_empty_with: 0
+      - pen_down: false
+    \end{verbatim}
+\end{frame}
+
+\subsection{Features}
+\begin{frame}{Features}
+    \begin{itemize}
+        \item Local
+        \begin{itemize}
+            \item Coordinates
+            \item Speed
+            \item Binary pen pressure
+            \item Direction
+            \item Curvature
+            \item Bitmap-environment
+            \item Hat-Feature
+        \end{itemize}
+        \item Global
+        \begin{itemize}
+            \item \# of points
+            \item \# of strokes
+            \item Center point
+            \item Bitmap
+            \item Bounding box (width, height, time)
+        \end{itemize}
+    \end{itemize}
+\end{frame}