Преглед изворни кода

added short presentation of my bachelors thesis

Martin Thoma пре 11 година
родитељ
комит
bf45366b88

+ 5 - 0
presentations/Bachelor-Short/.gitignore

@@ -0,0 +1,5 @@
+logos/kitlogo*
+templates/*kit*.sty
+templates/example.bib
+templates/semirounded.sty
+templates/tikzuml.sty

+ 10 - 0
presentations/Bachelor-Short/LaTeX/Makefile

@@ -0,0 +1,10 @@
+SOURCE = bachelor-short
+.PHONY: make clean # both targets are commands, not files on disk
+make: # default target: build the PDF, then remove the auxiliary files
+	#latexmk -pdf -pdflatex="pdflatex -interaction=nonstopmode" -use-make $(SOURCE).tex
+	pdflatex -shell-escape -output-format=pdf $(SOURCE).tex # shell escape is needed for the logo
+	pdflatex -shell-escape -output-format=pdf $(SOURCE).tex # second run so the table of contents is up to date
+	$(MAKE) clean
+
+clean: # remove auxiliary build files only; the generated PDF is kept
+	rm -rf *.class *.html *.log *.aux *.out *.glo *.glg *.gls *.ist *.xdy *.1 *.toc *.snm *.nav *.vrb *.fls *.fdb_latexmk *.pyg

+ 40 - 0
presentations/Bachelor-Short/LaTeX/bachelor-short.tex

@@ -0,0 +1,40 @@
+\documentclass[hyperref={pdfpagelabels=false},usepdftitle=false]{beamer}
+\usepackage{../templates/myStyle}
+
+\begin{document}
+\selectlanguage{english}
+
+\title{\titleText}
+\subtitle{Bachelor's thesis of Martin Thoma}
+\author{\tutor}
+\date{5th of June, 2014}
+%\subject{Programmieren}
+
+\frame{\titlepage}
+
+\frame{
+    \frametitle{Contents}
+    \setcounter{tocdepth}{1}
+    \tableofcontents
+    \setcounter{tocdepth}{2}
+}
+
+%\AtBeginSection[]{
+%    \InsertToC[sections={\thesection}]  % shows only subsubsections of one subsection
+%}
+
+\section{What is my Bachelor's thesis about?}
+\input{introduction}
+
+\section{What did I do so far?}
+\input{work-done}
+
+\section{What will I do next?}
+\input{will-do}
+
+\section{End}
+\subsection{End}
+\input{sources}
+\framedgraphic{Thanks for Your Attention!}{../images/xi.png}
+
+\end{document}

+ 29 - 0
presentations/Bachelor-Short/LaTeX/introduction.tex

@@ -0,0 +1,29 @@
+\subsection{Online and offline recognition}
+
+\begin{frame}{What is my Bachelor's thesis about?}
+    \begin{itemize}
+        \item Handwriting recognition of mathematical formulas
+        \item On-line recognition, not OCR!
+        \item Given a series of points $(x(t), y(t), b)$\\
+              I want to get the proper \LaTeX{} code.
+    \end{itemize}
+\end{frame}
+
+\begin{frame}{Why do I work on this topic?}
+    \begin{itemize}
+        \item \LaTeX{} is easy as soon as you know the \textbackslash{}codes.
+        \item It's hard to find the \LaTeX{} code of single symbols.
+        \item It's much harder to find complete formulas.
+    \end{itemize}
+
+    I want to
+    \begin{itemize}
+        \item provide a tool that enables beginners to get the best \LaTeX{} code
+              for their formula,
+        \item find out what works best for symbol recognition
+        \item and provide data and a platform to test new ideas for classifiers
+    \end{itemize}
+
+    As soon as symbol recognition works well in terms of classification time and
+    performance, I will continue with formula recognition.
+\end{frame}

+ 9 - 0
presentations/Bachelor-Short/LaTeX/sources.tex

@@ -0,0 +1,9 @@
+\subsection{Image Sources}
+\begin{frame}{Image Sources}
+    \begin{itemize}
+	\item \href{https://commons.wikimedia.org/wiki/File:Server-multiple.svg}{Server} by RRZEicons
+    \item \href{https://commons.wikimedia.org/wiki/File:Computer-aj_aj_ashton_01.svg}{Desktop Computer} by Ed g2s,
+          Ironbrother, Kierancassel and Msgj
+    \item \href{https://commons.wikimedia.org/wiki/File:Server_by_mimooh.svg}{Server} by Mimooh
+    \end{itemize}
+\end{frame}

+ 32 - 0
presentations/Bachelor-Short/LaTeX/will-do.tex

@@ -0,0 +1,32 @@
+\subsection{What will I do next?}
+\begin{frame}{What will I do next?}
+    \begin{itemize}
+        \item Get classification performance with cross-validation
+        \item Implement neural net for classification
+        \begin{itemize}
+            \item preprocessing: compute cubic spline for each line
+            \begin{itemize}
+                \item equi-spaced points or
+                \item get equi-timed points
+            \end{itemize}
+            \item 5 - 20 input neurons for each line
+            \item 1076 output neurons (one for each symbol)
+        \end{itemize}
+        \item Get a language model (e.g. by parsing Wikipedia)
+        \item Use ANN with HMM (?)
+    \end{itemize}
+\end{frame}
+
+\subsection{Far future}
+\begin{frame}{What could be done?}
+    \begin{itemize}
+        \item Make use of audio data in a multimodal approach\\
+              e.g. $R$ and $\mathcal{R}$
+        \item Currently, the Lecture Translation system doesn't recognize math.\\
+              You get \enquote{integral of e raised to the power of x d x} instead
+              of $\int e^x \mathrm{d} x$.
+        \item Spoken math is ambiguous: $\sqrt{a+b}$ vs. $\sqrt{a} + b$
+        \item The language model I create could help to find probable formulas
+        \item The platform could be used to get more input data of users
+    \end{itemize}
+\end{frame}

+ 51 - 0
presentations/Bachelor-Short/LaTeX/work-done.tex

@@ -0,0 +1,51 @@
+\subsection{Write Math}
+
+\begin{frame}{write-math.com}
+    \begin{itemize}
+        \item a website where users can add labeled training data
+        \item works with desktop computers and touch devices
+        \item symbol recognition can be done by multiple classifiers
+        \item users can contribute formulas
+        \item users can vote for formulas
+        \item user who wrote the formula can accept one formula
+    \end{itemize}
+\end{frame}
+
+\framedgraphic{Classify}{../images/classify.png}
+\framedgraphic{Workflow}{../images/workflow.png}
+\framedgraphic{User page}{../images/user-page.png}
+\framedgraphic{Information about handwritten-data}{../images/view.png}
+\framedgraphic{Non-mathematical symbols}{../images/yinyang.png}
+\framedgraphic{Training}{../images/train.png}
+\framedgraphic{Ranking}{../images/ranking.png}
+\framedgraphic{Symbol page}{../images/symbol.png}
+
+\begin{frame}{Statistics}
+    \begin{itemize}
+        \item 40 users
+        \item 1076 symbols
+        \item 5519 handwritten symbols (e.g. 195 times the letter \enquote{A})
+        \begin{itemize}
+            \item only 264 have 4 lines
+            \item only 36 have 5 lines
+            \item only 16 have 6 lines
+            \item only 19 have 7 lines or more
+            \item none has more than 12 lines
+        \end{itemize}
+    \end{itemize}
+\end{frame}
+
+\begin{frame}{First classification worker}
+    \begin{itemize}
+        \item preprocessing: Scale to fit into unit square while keeping the aspect
+              ratio
+        \item applies dynamic time warping
+        \item compares a new handwritten symbol with every handwritten symbol
+              in the database
+        \item[$\Rightarrow$] Classification time is in $\mathcal{O}(\text{handwritten symbols})$,
+              but we would rather have $\mathcal{O}(\text{symbols})$
+        \item the current server / workflow can only handle about 4000 handwritten
+              symbols
+        \item[$\Rightarrow$] Another way to classify is necessary
+    \end{itemize}
+\end{frame}

+ 12 - 0
presentations/Bachelor-Short/README.md

@@ -0,0 +1,12 @@
+About
+-----
+This is a short presentation for an English course. We explained
+the PageRank algorithm in 8 minutes.
+
+KIT-Style
+---------
+This one doesn't compile, as you need the KIT-Style (logos, layout,
+color theme).
+
+Please take a look at the presentation "Tutorenschulung" for further
+information.

BIN
presentations/Bachelor-Short/images/classify.png


BIN
presentations/Bachelor-Short/images/golden-ratio-continued-fraction.png


BIN
presentations/Bachelor-Short/images/golden-ratio.png


BIN
presentations/Bachelor-Short/images/ranking.png


BIN
presentations/Bachelor-Short/images/symbol.png


BIN
presentations/Bachelor-Short/images/train.png


BIN
presentations/Bachelor-Short/images/user-page.png


BIN
presentations/Bachelor-Short/images/view.png


BIN
presentations/Bachelor-Short/images/workflow.png


BIN
presentations/Bachelor-Short/images/workflow.xcf


BIN
presentations/Bachelor-Short/images/xi.png


BIN
presentations/Bachelor-Short/images/yinyang.png


BIN
presentations/Bachelor-Short/logos/formula-recognition-logo.png


+ 100 - 0
presentations/Bachelor-Short/templates/myStyle.sty

@@ -0,0 +1,100 @@
+% use KIT-Theme
+% see http://sdqweb.ipd.kit.edu/wiki/Dokumentvorlagen
+%\usetheme{Frankfurt} % see http://deic.uab.es/~iblanes/beamer_gallery/index_by_theme.html as fallback
+\InputIfFileExists{../templates/beamerthemekit.sty}{\usepackage{../templates/beamerthemekit}}{\usetheme{Frankfurt}}
+\usefonttheme{professionalfonts}
+
+\usepackage{hyperref}
+\usepackage{lmodern}
+\usepackage{listings}
+\usepackage{wrapfig}        % see http://en.wikibooks.org/wiki/LaTeX/Floats,_Figures_and_Captions
+\usepackage[utf8]{inputenc} % this is needed for german umlauts
+\usepackage[english]{babel} % language support; provides \selectlanguage{english}
+\usepackage[T1]{fontenc}    % this is needed for correct output of umlauts in pdf
+\usepackage{verbatim}
+\usepackage{tikz}
+\usetikzlibrary{arrows,shapes}
+\usepackage{relsize}
+\usepackage{subfigure}
+\usepackage{algorithm,algpseudocode}
+\usepackage{minted}         % needed for the inclusion of source code
+\usepackage{menukeys}
+\usepackage{xcolor}
+\usepackage{pifont}% http://ctan.org/pkg/pifont
+\usepackage{soul}
+\usepackage[babel]{csquotes}
+\usepackage{algorithm,algpseudocode}
+
+% Define some styles for graphs
+\tikzstyle{vertex}=[circle,fill=black!25,minimum size=20pt,inner sep=0pt]
+\tikzstyle{selected vertex} = [vertex, fill=red!24]
+\tikzstyle{blue vertex} = [vertex, fill=blue!24]
+\tikzstyle{edge} = [draw,thick,-]
+\tikzstyle{weight} = [font=\small]
+\tikzstyle{selected edge} = [draw,line width=5pt,-,red!50]
+\tikzstyle{ignored edge} = [draw,line width=5pt,-,black!20]
+
+%\algdef{SE}[IF]{NoThenIf}{EndIf}[1]{\algorithmicif\ #1\textbf{:}}{\algorithmicend\ \algorithmicif}%
+\algtext*{EndIf}        % Remove "end if" text
+\algtext*{EndWhile}     % Remove "end while" text
+\algtext*{EndFunction}  % Remove "end function" text
+\algnewcommand\Global{\textbf{global }}
+
+% http://tex.stackexchange.com/a/8388/5645
+\newcommand{\alertline}{%
+ \usebeamercolor[fg]{normal text}%
+ \only{\usebeamercolor[fg]{alerted text}}}
+
+\newcommand {\framedgraphic}[2] {
+    \begin{frame}{#1}
+        \begin{center}
+            \includegraphics[width=\textwidth,height=0.8\textheight,keepaspectratio]{#2}
+        \end{center}
+    \end{frame}
+}
+
+\hypersetup{%
+    breaklinks=true,
+    linktocpage=false,
+    colorlinks=true,
+    urlcolor=blue,
+    linkcolor=blue,
+    citecolor=black
+}
+
+\newcommand{\myCode}[1]{\colorbox{gray!30}{#1}}
+
+%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+% Make source code easier to copy                                   %
+%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+% from http://tex.stackexchange.com/questions/57151/how-do-i-prevent-conflicts-between-accsupp-and-hyperref
+\usepackage{accsupp}
+\newcommand\emptyaccsupp[1]{\BeginAccSupp{ActualText={}}#1\EndAccSupp{}}
+
+
+%default definition is: \def\theFancyVerbLine{\rmfamily\tiny\arabic{FancyVerbLine}}
+\let\theHFancyVerbLine\theFancyVerbLine% don't apply our patch to hyperref's version
+\def\theFancyVerbLine{\rmfamily\tiny\emptyaccsupp{\arabic{FancyVerbLine}}}
+
+%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+% Add some shortcuts                                                %
+%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+\newcommand{\cmark}{\ding{51}}% a checkmark
+\newcommand{\xmark}{\ding{55}}% a cross
+
+%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+% Set some template options - other tutors will have to adjust this %
+%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+\newcommand\tutor{Martin Thoma}
+\newcommand\titleText{On-line recognition of handwritten mathematical symbols}
+\institute{}
+\titleimage{formula-recognition-logo}
+
+\hypersetup{pdftitle={\titleText}}
+\beamertemplatenavigationsymbolsempty
+
+\newcommand\InsertToC[1][]{
+  \begin{frame}{Outline}
+    \tableofcontents[subsectionstyle=show/show/show, subsubsectionstyle=show/show/show, #1]
+  \end{frame}
+}