From 072d26e766931007a0f243674f7dfdff5c3104e9 Mon Sep 17 00:00:00 2001 From: Thomas Mesnard Date: Mon, 28 Dec 2015 20:51:50 +0100 Subject: Add plot More TIMIT ; log domain TIMIT: more complexity Nice poster Beautify code (mostly, add comments) Add final stuff. --- prez/Makefile | 8 + prez/azerty1.png | Bin 0 -> 51063 bytes prez/azerty1.svg | 888 ++++++++++++++++++ prez/azerty2.png | Bin 0 -> 23320 bytes prez/azerty2.svg | 524 +++++++++++ prez/azerty3.png | Bin 0 -> 89245 bytes prez/azerty3.svg | 989 ++++++++++++++++++++ prez/azerty4.png | Bin 0 -> 60795 bytes prez/azerty4.svg | 1968 ++++++++++++++++++++++++++++++++++++++++ prez/beamerposter.sty | 219 +++++ prez/beamerthemeconfposter.sty | 275 ++++++ prez/ctc_cost.png | Bin 0 -> 27263 bytes prez/ctc_cost_best.png | Bin 0 -> 47726 bytes prez/logo.png | Bin 0 -> 21710 bytes prez/placeholder.jpg | Bin 0 -> 20279 bytes prez/prez.tex | 449 +++++++++ prez/sample.bib | 8 + 17 files changed, 5328 insertions(+) create mode 100644 prez/Makefile create mode 100644 prez/azerty1.png create mode 100644 prez/azerty1.svg create mode 100644 prez/azerty2.png create mode 100644 prez/azerty2.svg create mode 100644 prez/azerty3.png create mode 100644 prez/azerty3.svg create mode 100644 prez/azerty4.png create mode 100644 prez/azerty4.svg create mode 100644 prez/beamerposter.sty create mode 100644 prez/beamerthemeconfposter.sty create mode 100644 prez/ctc_cost.png create mode 100644 prez/ctc_cost_best.png create mode 100644 prez/logo.png create mode 100644 prez/placeholder.jpg create mode 100644 prez/prez.tex create mode 100644 prez/sample.bib (limited to 'prez') diff --git a/prez/Makefile b/prez/Makefile new file mode 100644 index 0000000..0f6940d --- /dev/null +++ b/prez/Makefile @@ -0,0 +1,8 @@ +# IMG=azerty1.pdf_tex azerty2.pdf_tex azerty3.pdf_tex +IMG= + +prez.pdf: prez.tex $(IMG) + pdflatex prez.tex + +%.pdf_tex: %.svg + inkscape -z -D --file=$< --export-pdf=$(basename $@).pdf --export-latex diff --git a/prez/azerty1.png 
b/prez/azerty1.png new file mode 100644 index 0000000..9e2e283 Binary files /dev/null and b/prez/azerty1.png differ diff --git a/prez/azerty1.svg b/prez/azerty1.svg new file mode 100644 index 0000000..d86e525 --- /dev/null +++ b/prez/azerty1.svg @@ -0,0 +1,888 @@ + + + + + + + + + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/prez/azerty2.png b/prez/azerty2.png new file mode 100644 index 0000000..c2636bb Binary files /dev/null and b/prez/azerty2.png differ diff --git a/prez/azerty2.svg b/prez/azerty2.svg new file mode 100644 index 0000000..0ccb650 --- /dev/null +++ b/prez/azerty2.svg @@ -0,0 +1,524 @@ + + + + + + + + + + + + + + image/svg+xml + + + + + + + + + + + + + + (b) + + + + + + + + error + + + + + + + + + + + output + (c) + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + (a) + + + + + + + + + + + diff --git a/prez/azerty3.png b/prez/azerty3.png new file mode 100644 index 0000000..13a7cd2 Binary files /dev/null and b/prez/azerty3.png differ diff --git a/prez/azerty3.svg b/prez/azerty3.svg new file mode 100644 index 0000000..d83e4d3 --- /dev/null +++ b/prez/azerty3.svg @@ -0,0 +1,989 @@ + + + + + + + + + + + + + + image/svg+xml + + + + + + + + + + + + + + 0 + + + + + + + + + + label probability + + + + + + + + + + + + + + + + """""" + + + 1 + 0 + 1 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + n 
+ + + dcl + + + dixv + Framewise + + + the sound of + + + Waveform + CTC + dhaxsaw + + + + + + + + + diff --git a/prez/azerty4.png b/prez/azerty4.png new file mode 100644 index 0000000..97e0b7b Binary files /dev/null and b/prez/azerty4.png differ diff --git a/prez/azerty4.svg b/prez/azerty4.svg new file mode 100644 index 0000000..317171a --- /dev/null +++ b/prez/azerty4.svg @@ -0,0 +1,1968 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + image/svg+xml + + + + + + + Input Sequence + + + + + + + + + + CTC layer + + + + + + + + + + + + + + + + + + + + + + + + ... + + + + + + + + + + + + + + + + ... + + + + h + + + + h + + + + h + + + + h + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + ... + + + + h + + + + h + + + + h + + + + h + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Cost + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + Target Seq. + + + diff --git a/prez/beamerposter.sty b/prez/beamerposter.sty new file mode 100644 index 0000000..cbfe229 --- /dev/null +++ b/prez/beamerposter.sty @@ -0,0 +1,219 @@ +% Copyright 2007 by +% Philippe Dreuw and +% Thomas Deselaers +% Slight modifications made in August 2009 by Nathaniel Johnston (nathaniel@nathanieljohnston.com) +% +% This file may be distributed and/or modified +% +% 1. under the LaTeX Project Public License and/or +% 2. under the GNU Public License. 
+% +% +% ChangeLog: +% +% 1.07 - bugfixed custom size handling, portrait or landscape settings are ignored now +% 1.06 - added the type1cm package for scalable math fonts +% 1.05 - added version check for xkeyval package +% 1.04 - added custom size handling +% 1.03 - improved predefined size handling +% 1.02 - minor bugfixes +% 1.01 - bugfixed size handling +% 1.00 - first beamerposter release +% +\def\beamerposter@version{1.07} +\def\beamerposter@date{2008/03/11} +\def\beamerposter@msg{beamerposter: latex-beamer poster extension} +\typeout{Package: \beamerposter@date. v.\beamerposter@version. \beamerposter@msg} + +\NeedsTeXFormat{LaTeX2e} +\ProvidesPackage{beamerposter}[\beamerposter@date. v.\beamerposter@version. \beamerposter@msg] +\RequirePackage{xkeyval}[2006/11/18] +\RequirePackage{type1cm} %% get it from ftp://cam.ctan.org/tex-archive/macros/latex/contrib/type1cm.zip + +\newif\ifportrait +\newif\ifcustomsize +\newif\ifdebug + +\DeclareOptionX{size}[a0]{ + \typeout{beamerposter: checking size input, please wait.} + \XKV@cc*+[\val\nr]{#1}{a0b,a0,a1,a2,a3,a4,custom}{% + \typeout{beamerposter: the input \val\ \nr\ was correct, we proceed.} + \ifcase\nr\relax + %a0b + \setlength{\paperheight}{119cm} + \setlength{\paperwidth}{88cm} + \setlength{\textheight}{116cm} + \setlength{\textwidth}{88cm} + \or + %a0 + \setlength{\paperheight}{118.82cm} + \setlength{\paperwidth}{83.96cm} + \setlength{\textheight}{117.82cm} + \setlength{\textwidth}{82.96cm} + \or + %a1 + \setlength{\paperheight}{83.96cm} + \setlength{\paperwidth}{59.4cm} + \setlength{\textheight}{82.96cm} + \setlength{\textwidth}{58.4cm} + \or + %a2 + \setlength{\paperheight}{59.4cm} + \setlength{\paperwidth}{41.98cm} + \setlength{\textheight}{58.4cm} + \setlength{\textwidth}{40.98cm} + \or + %a3 + \setlength{\paperwidth}{41.98cm} + \setlength{\paperheight}{29.7cm} + \setlength{\textwidth}{40.98cm} + \setlength{\textheight}{28.7cm} + \or + %a4 + \setlength{\paperheight}{29.7cm} + 
\setlength{\paperwidth}{21.0cm} + \setlength{\textheight}{28.7cm} + \setlength{\textwidth}{20.0cm} + \or + \customsizetrue + \fi + }{% + \PackageWarning{beamerposter}{the input \val\ was incorrect and was ignored.} + }% + \typeout{beamerposter: finished size input check.} +} +\DeclareOptionX{orientation}[portrait]{ + \typeout{beamerposter: checking orientation input, please wait.} + \XKV@cc*+[\val\nr]{#1}{portrait,landscape}{% + \typeout{beamerposter: the input \val\ \nr\ was correct, we proceed.} + \ifcase\nr\relax + \portraittrue + \or + \portraitfalse + \fi + }{% + \PackageWarning{beamerposter}{the input \val\ was incorrect and was ignored.} + }% + \typeout{beamerposter: finished orientation check.} +} +\DeclareOptionX{scale}[1.0]{\edef\myfontscale{#1}\typeout{beamerposter: myfontscale=\myfontscale}} +\DeclareOptionX{width}{\edef\customwidth{#1}\typeout{beamerposter: custom poster width=\customwidth}} +\DeclareOptionX{height}{\edef\customheight{#1}\typeout{beamerposter: custom poster height=\customheight}} +\DeclareOptionX{debug}{\typeout{beamerposter: enabled debug mode}\debugtrue} +\DeclareOptionX*{\PackageWarning{beamerposter}{Unknown option ignored: \CurrentOption}} +%\DeclareOptionX*{\PassOptionsToClass{\CurrentOption}{beamer}} +\ExecuteOptionsX{size=a0,scale=1.0} +\ProcessOptionsX\relax + +\ifdebug + \RequirePackage[debug]{fp} +\else + \RequirePackage{fp} +\fi + +%% swap sizes for portrait orientation +\ifportrait + \newdimen\tmp + \setlength{\tmp}{\paperwidth} + \setlength{\paperwidth}{\paperheight} + \setlength{\paperheight}{\tmp} + \setlength{\tmp}{\textwidth} + \setlength{\textwidth}{\textheight} + \setlength{\textheight}{\tmp} +\else\relax +\fi + +%% overwrite dimensions if custom size +\ifcustomsize + \setlength{\paperwidth}{\customwidth cm} + \setlength{\paperheight}{\customheight cm} + \FPupn{\resulttextwidth}{1 customwidth -} + \FPupn{\resulttextheight}{1 customheight -} + \setlength{\textwidth}{\resulttextwidth cm} + 
\setlength{\textheight}{\resulttextheight cm} +\fi + +%% Setting proper dimensions for a DIN A0 printer +\setlength{\headheight}{0 cm} +\setlength{\headsep}{0 cm} +\setlength{\topmargin}{-12.7 mm} % -1in +1.47cm +\setlength{\oddsidemargin}{-25.4 mm} % -1in +0.4cm + +%% For the page layout +\ifdebug +\typeout{beamerposter: paperwidth=\the\paperwidth, paperheight=\the\paperheight} +\typeout{beamerposter: textwidth=\the\textwidth, textwidth=\the\textheight} +\fi +\geometry{ + paperwidth=\the\paperwidth, + paperheight=\the\paperheight, + hmargin=1cm,% + vmargin=0cm,% + head=0.5cm, % + headsep=0pt,% + foot=0.5cm % +} + +%% scalable vector fonts +\edef\fontSizeX{14.4}\edef\fontSizeY{18} +\FPupn{\resultscriptsizeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultscriptsizeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\tiny}{\fontsize{\resultscriptsizeX}{\resultscriptsizeY}\selectfont} + +\edef\fontSizeX{17.28}\edef\fontSizeY{22} +\FPupn{\resultfootnotesizeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultfootnotesizeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\scriptsize}{\fontsize{\resultfootnotesizeX}{\resultfootnotesizeY}\selectfont} + +\edef\fontSizeX{20.74}\edef\fontSizeY{25} +\FPupn{\resultsmallX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultsmallY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\footnotesize}{\fontsize{\resultsmallX}{\resultsmallY}\selectfont} + +\edef\fontSizeX{24.88}\edef\fontSizeY{30} +\FPupn{\resultnormalsizeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultnormalsizeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\small}{\fontsize{\resultnormalsizeX}{\resultnormalsizeY}\selectfont} + +\edef\fontSizeX{29.86}\edef\fontSizeY{37} +\FPupn{\resultlargeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultlargeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\normalsize}{\fontsize{\resultlargeX}{\resultlargeY}\selectfont} + +\edef\fontSizeX{35.83}\edef\fontSizeY{45} +\FPupn{\resultLargeX}{myfontscale fontSizeX * 2 round} 
+\FPupn{\resultLargeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\large}{\fontsize{\resultLargeX}{\resultLargeY}\selectfont} + +\edef\fontSizeX{43}\edef\fontSizeY{54} +\FPupn{\resultLARGEX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultLARGEY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\Large}{\fontsize{\resultLARGEX}{\resultLARGEY}\selectfont} + +\edef\fontSizeX{51.6}\edef\fontSizeY{64} +\FPupn{\resulthugeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resulthugeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\LARGE}{\fontsize{\resulthugeX}{\resulthugeY}\selectfont} + +\edef\fontSizeX{61.92}\edef\fontSizeY{77} +\FPupn{\resultHugeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultHugeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\huge}{\fontsize{\resultHugeX}{\resultHugeY}\selectfont} + +\edef\fontSizeX{74.3}\edef\fontSizeY{93} +\FPupn{\resultveryHugeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultveryHugeY}{myfontscale fontSizeY * 2 round} +\renewcommand*{\Huge}{\fontsize{\resultveryHugeX}{\resultveryHugeY}\selectfont} + +\edef\fontSizeX{80.3}\edef\fontSizeY{101} +\FPupn{\resultVeryHugeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultVeryHugeY}{myfontscale fontSizeY * 2 round} +\newcommand*{\veryHuge}{\fontsize{\resultVeryHugeX}{\resultVeryHugeY}\selectfont} + +\edef\fontSizeX{107}\edef\fontSizeY{134} +\FPupn{\resultVERYHugeX}{myfontscale fontSizeX * 2 round} +\FPupn{\resultVERYHugeY}{myfontscale fontSizeY * 2 round} +\newcommand*{\VeryHuge}{\fontsize{\resultVERYHugeX}{\resultVERYHugeY}\selectfont} + +% set the normalfont (default) +\renewcommand*{\normalfont}{\normalsize} \ No newline at end of file diff --git a/prez/beamerthemeconfposter.sty b/prez/beamerthemeconfposter.sty new file mode 100644 index 0000000..2affaf1 --- /dev/null +++ b/prez/beamerthemeconfposter.sty @@ -0,0 +1,275 @@ +%============================================================================== +% Beamer style for the poster template posted at +% 
http://www.nathanieljohnston.com/2009/08/latex-poster-template/ +% +% Created by the Computational Physics and Biophysics Group at Jacobs University +% https://teamwork.jacobs-university.de:8443/confluence/display/CoPandBiG/LaTeX+Poster +% Modified by Nathaniel Johnston (nathaniel@nathanieljohnston.com) in August 2009 +% ============================================================================= + +\ProvidesPackage{beamerthemeconfposter} +\RequirePackage{tikz} % for drawing the nice rounded boxes +\usetikzlibrary{arrows,backgrounds} +\RequirePackage[T1]{fontenc} +\RequirePackage{lmodern} +\RequirePackage{textcomp} +\RequirePackage{amsmath,amssymb} +\usefonttheme{professionalfonts} +\newcommand{\makeruleinbox}{{\usebeamercolor[bg]{block alerted title}\centering\hspace*{-0.7cm}\rule{\inboxrule}{0.5cm}}} +\usepackage{ragged2e} + +% Spacing before and inside list environments to add white space before lists and between items inside lists +\makeatletter +\def\@listi{\leftmargin\leftmarginii +\topsep 1ex % Spacing before lists +\parsep 0\p@ \@plus\p@ +\itemsep 6pt} % Spacing between items +\makeatother + +\usecaptiontemplate{\small\structure{\insertcaptionname~\insertcaptionnumber: }\insertcaption} % A fix for figure numbering + +%----------------------------------------------------------- +% Define a whole bunch of custom colours and fonts +%----------------------------------------------------------- + +\definecolor{lgreen} {RGB}{180,210,100} +\definecolor{dblue} {RGB}{20,66,129} +\definecolor{ddblue} {RGB}{11,36,69} +\definecolor{lred} {RGB}{220,0,0} +\definecolor{nred} {RGB}{224,0,0} +\definecolor{norange}{RGB}{230,120,20} +\definecolor{nyellow}{RGB}{255,221,0} +\definecolor{ngreen} {RGB}{98,158,31} +\definecolor{dgreen} {RGB}{78,138,21} +\definecolor{nblue} {RGB}{28,130,185} +\definecolor{jblue} {RGB}{20,50,100} + + +%---------------------------------------------------------------------------- +% More colours added due to conflict with Colordvi package +% Addition 
done by Nishan Mudalige (math.mudalige@uoguelph.ca) in April 2011 +%---------------------------------------------------------------------------- + +\definecolor{GreenYellow} {RGB}{217, 229, 6} % GreenYellow Approximate PANTONE 388 +\definecolor{Yellow} {RGB}{254, 223, 0} % Yellow Approximate PANTONE YELLOW +\definecolor{Goldenrod} {RGB}{249, 214, 22} % Goldenrod Approximate PANTONE 109 +\definecolor{Dandelion} {RGB}{253, 200, 47} % Dandelion Approximate PANTONE 123 +\definecolor{Apricot} {RGB}{255, 170, 123} % Apricot Approximate PANTONE 1565 +\definecolor{Peach} {RGB}{255, 127, 69} % Peach Approximate PANTONE 164 +\definecolor{Melon} {RGB}{255, 129, 141} % Melon Approximate PANTONE 177 +\definecolor{YellowOrange} {RGB}{240, 171, 0} % YellowOrange Approximate PANTONE 130 +\definecolor{Orange} {RGB}{255, 88, 0} % Orange Approximate PANTONE ORANGE-021 +\definecolor{BurntOrange} {RGB}{199, 98, 43} % BurntOrange Approximate PANTONE 388 +\definecolor{Bittersweet} {RGB}{189, 79, 25} % Bittersweet Approximate PANTONE 167 +\definecolor{RedOrange} {RGB}{222, 56, 49} % RedOrange Approximate PANTONE 179 +\definecolor{Mahogany} {RGB}{152, 50, 34} % Mahogany Approximate PANTONE 484 +\definecolor{Maroon} {RGB}{152, 30, 50} % Maroon Approximate PANTONE 201 +\definecolor{BrickRed} {RGB}{170, 39, 47} % BrickRed Approximate PANTONE 1805 +\definecolor{Red} {RGB}{255, 0, 0} % Red Approx PANTONE LUMINOUS VIVID RED +\definecolor{BrilliantRed} {RGB}{237, 41, 57} % Red VERY-Approx PANTONE RED +\definecolor{OrangeRed} {RGB}{231, 58, 0} % OrangeRed No PANTONE match (TRIED PANTONE VIVID ORANGE RED) +\definecolor{RubineRed} {RGB}{202, 0, 93} % RubineRed Approximate PANTONE RUBINE-RED +\definecolor{WildStrawberry} {RGB}{203, 0, 68} % WildStrawberry Approximate PANTONE 206 +\definecolor{Salmon} {RGB}{250, 147, 171} % Salmon Approximate PANTONE 183 +\definecolor{CarnationPink} {RGB}{226, 110, 178} % CarnationPink Approximate PANTONE 218 +\definecolor{Magenta} {RGB}{255, 0, 144} % Magenta 
Approximate PANTONE PROCESS-MAGENTA +\definecolor{VioletRed} {RGB}{215, 31, 133} % VioletRed Approximate PANTONE 219 +\definecolor{Rhodamine} {RGB}{224, 17, 157} % Rhodamine Approximate PANTONE RHODAMINE-RED +\definecolor{Mulberry} {RGB}{163, 26, 126} % Mulberry Approximate PANTONE 241 +\definecolor{RedViolet} {RGB}{161, 0, 107} % RedViolet Approximate PANTONE 234 +\definecolor{Fuchsia} {RGB}{155, 24, 137} % Fuchsia Approximate PANTONE 248 +\definecolor{Lavender} {RGB}{240, 146, 205} % Lavender Approximate PANTONE 223 +\definecolor{Thistle} {RGB}{222, 129, 211} % Thistle Approximate PANTONE 245 +\definecolor{Orchid} {RGB}{201, 102, 205} % Orchid Approximate PANTONE 252 +\definecolor{DarkOrchid} {RGB}{153, 50, 204} % DarkOrchid No PANTONE match +\definecolor{Purple} {RGB}{182, 52, 187} % Purple Approximate PANTONE PURPLE +\definecolor{Plum} {RGB}{79, 50, 76} % Plum VERY-Approx PANTONE 518 +\definecolor{Violet} {RGB}{75, 8, 161} % Violet Approximate PANTONE VIOLET +\definecolor{RoyalPurple} {RGB}{82, 35, 152} % RoyalPurple Approximate PANTONE 267 +\definecolor{BlueViolet} {RGB}{33, 7, 106} % BlueViolet Approximate PANTONE 2755 +\definecolor{Periwinkle} {RGB}{136, 132, 213} % Periwinkle Approximate PANTONE 2715 +\definecolor{CadetBlue} {RGB}{95, 158, 160} % CadetBlue Approximate PANTONE (534+535)/2, Could not find get on my own so used PANTONE-CADET BLUE +\definecolor{CornflowerBlue} {RGB}{99, 177, 229} % CornflowerBlue Approximate PANTONE 292 +\definecolor{MidnightBlue} {RGB}{0, 65, 101} % MidnightBlue Approximate PANTONE 302 +\definecolor{NavyBlue} {RGB}{0, 70, 173} % NavyBlue Approximate PANTONE 293 +\definecolor{RoyalBlue} {RGB}{0, 35, 102} % RoyalBlue No PANTONE match +\definecolor{Blue} {RGB}{0, 24, 168} % Blue Approximate PANTONE BLUE-072 +\definecolor{Cerulean} {RGB}{0, 122, 201} % Cerulean Approximate PANTONE 3005 +\definecolor{Cyan} {RGB}{0, 159, 218} % Cyan Approximate PANTONE PROCESS-CYAN +\definecolor{ProcessBlue} {RGB}{0, 136, 206} % ProcessBlue 
Approximate PANTONE PROCESS-BLUE +\definecolor{SkyBlue} {RGB}{91, 198, 232} % SkyBlue Approximate PANTONE 2985 + +\definecolor{Turquoise} {RGB}{0, 255, 239} % Turquoise Approximate PANTONE (312+313)/2, Could not find get on my own so used PANTONE-TURQUOISE + +\definecolor{TealBlue} {RGB}{0, 124, 146} % TealBlue Approximate PANTONE 3145 +\definecolor{Aquamarine} {RGB}{0, 148, 179} % Aquamarine Approximate PANTONE 3135 +\definecolor{BlueGreen} {RGB}{0, 154, 166} % BlueGreen Approximate PANTONE 320 +\definecolor{Emerald} {RGB}{80, 200, 120} % Emerald No PANTONE match +\definecolor{JungleGreen} {RGB}{0, 115, 99} % JungleGreen Approximate PANTONE 328 +\definecolor{SeaGreen} {RGB}{0, 176, 146} % SeaGreen Approximate PANTONE 3268 +\definecolor{Green} {RGB}{0, 173, 131} % Green VERY-Approx PANTONE GREEN +\definecolor{ForestGreen} {RGB}{0, 105, 60} % ForestGreen Approximate PANTONE 349 +\definecolor{PineGreen} {RGB}{0, 98, 101} % PineGreen Approximate PANTONE 323 +\definecolor{LimeGreen} {RGB}{50, 205, 50} % LimeGreen No PANTONE match +\definecolor{YellowGreen} {RGB}{146, 212, 0} % YellowGreen Approximate PANTONE 375 +\definecolor{SpringGreen} {RGB}{201, 221, 3} % SpringGreen Approximate PANTONE 381 +\definecolor{OliveGreen} {RGB}{135, 136, 0} % OliveGreen Approximate PANTONE 582 +\definecolor{RawSienna} {RGB}{149, 82, 20} % RawSienna Approximate PANTONE 154 +\definecolor{Sepia} {RGB}{98, 60, 27} % Sepia Approximate PANTONE 161 +\definecolor{Brown} {RGB}{134, 67, 30} % Brown Approximate PANTONE 1615 +\definecolor{Tan} {RGB}{210, 180, 140} % Tan No PANTONE match +\definecolor{Gray} {RGB}{139, 141, 142} % Gray Approximate PANTONE COOL-GRAY-8 + +\definecolor{Black} {RGB}{30, 30, 30} % Black Approximate PANTONE PROCESS-BLACK +\definecolor{White} {RGB}{255, 255, 255} % White No PANTONE match + + + + + + + + + + + + + + + + +% set the basic colors +\setbeamercolor{palette primary} {fg=black,bg=white} +\setbeamercolor{palette secondary} {fg=black,bg=white} +\setbeamercolor{palette 
tertiary} {bg=jblue,fg=white} +\setbeamercolor{palette quaternary}{fg=black,bg=white} +\setbeamercolor{structure}{fg=jblue} +\setbeamercolor{titlelike} {bg=jblue,fg=white} +\setbeamercolor{frametitle} {bg=jblue!10,fg=jblue} +\setbeamercolor{cboxb}{fg=black,bg=jblue} +\setbeamercolor{cboxr}{fg=black,bg=red} + +% set colors for itemize/enumerate +\setbeamercolor{item}{fg=ngreen} +\setbeamercolor{item projected}{fg=white,bg=ngreen} + +% set colors for blocks +\setbeamercolor{block title}{fg=ngreen,bg=white} +\setbeamercolor{block body}{fg=black,bg=white} + +% set colors for alerted blocks (blocks with frame) +\setbeamercolor{block alerted title}{fg=white,bg=jblue} +\setbeamercolor{block alerted body}{fg=black,bg=jblue!10} + +% set the fonts +\setbeamerfont{section in head/foot}{series=\bfseries} +\setbeamerfont{block title}{series=\bfseries} +\setbeamerfont{block alerted title}{series=\bfseries} +\setbeamerfont{frametitle}{series=\bfseries} +\setbeamerfont{frametitle}{size=\Large} +\setbeamerfont{block body}{series=\rmfamily} + +% set some beamer theme options +\setbeamertemplate{title page}[default][colsep=-4bp,rounded=true] +\setbeamertemplate{sections/subsections in toc}[square] +\setbeamertemplate{items}[circle] +\setbeamertemplate{blocks}[width=0.0] +\beamertemplatenavigationsymbolsempty + +% set bibliography style +\setbeamertemplate{bibliography item}[text] +\setbeamercolor{bibliography item}{fg=black,bg=white} +\setbeamercolor{bibliography entry author}{fg=black,bg=white} +\setbeamercolor{bibliography item}{fg=black,bg=white} + +% define some length variables that are used by the template +\newlength{\inboxwd} +\newlength{\iinboxwd} +\newlength{\inboxrule} +\makeatletter +\makeatother + +%============================================================================== +% build the poster title +%============================================================================== +\setbeamertemplate{headline}{ + \leavevmode + \begin{columns} + 
\begin{column}{\linewidth} + \vskip1cm + \centering + \usebeamercolor{title in headline}{\color{jblue}\Huge{\textbf{\inserttitle}}\\[0.5ex]} + \usebeamercolor{author in headline}{\color{fg}\Large{\insertauthor}\\[1ex]} + \usebeamercolor{institute in headline}{\color{fg}\large{\insertinstitute}\\[1ex]} + \vskip1cm + \end{column} + \vspace{1cm} + \end{columns} + \vspace{0.5in} + \hspace{0.5in}\begin{beamercolorbox}[wd=35in,colsep=0.15cm]{cboxb}\end{beamercolorbox} + \vspace{0.1in} +} + +% Block definition +\setbeamertemplate{block begin} +{ + \par\vskip\medskipamount + \begin{beamercolorbox}[colsep*=0ex,dp={2ex},center]{block title} + \vskip-0.25cm + \usebeamerfont{block title}\large\insertblocktitle + \begin{flushleft} + \vskip-1cm + \begin{tikzpicture}[remember picture,overlay] + \shade [inner color=gray,outer color=white] + (0,0) rectangle (\textwidth,0.3cm); + \end{tikzpicture} + \end{flushleft} + \end{beamercolorbox} + {\parskip0pt\par} + \ifbeamercolorempty[bg]{block title} + {} + {\ifbeamercolorempty[bg]{block body}{}{\nointerlineskip\vskip-0.5pt}} + \usebeamerfont{block body} + \vskip-0.5cm + \begin{beamercolorbox}[colsep*=0ex,vmode]{block body} + \justifying +} + +\setbeamertemplate{block end} +{ + \end{beamercolorbox} + \vskip\smallskipamount +} + +% Alert block definition (with frame) +\setbeamertemplate{block alerted begin} +{ + \par\vskip\medskipamount + \begin{beamercolorbox}[sep=0ex,rounded=true,center,dp={2ex}]{block alerted title} + \vskip0.01cm + \usebeamerfont{block title}\large\insertblocktitle + \end{beamercolorbox} + {\parskip0pt\par} + \usebeamerfont{block body} + \vskip-0.8cm + \begin{beamercolorbox}[sep=0.5cm, rounded=true,center]{block alerted title} + \setlength{\inboxwd}{\linewidth} + \addtolength{\inboxwd}{-1cm} + \begin{beamercolorbox}[rounded=true,wd={\inboxwd},center]{block alerted body} + \setlength{\iinboxwd}{\inboxwd} + \setlength{\inboxrule}{\inboxwd} + \addtolength{\iinboxwd}{-0.5cm} + \addtolength{\inboxrule}{0.5cm} + 
\begin{center} + \begin{minipage}{\iinboxwd} + \justifying +} + +\setbeamertemplate{block alerted end} +{ + \end{minipage} + \end{center} + \end{beamercolorbox} + \end{beamercolorbox} + \vskip\smallskipamount +} \ No newline at end of file diff --git a/prez/ctc_cost.png b/prez/ctc_cost.png new file mode 100644 index 0000000..5ac0561 Binary files /dev/null and b/prez/ctc_cost.png differ diff --git a/prez/ctc_cost_best.png b/prez/ctc_cost_best.png new file mode 100644 index 0000000..63bd584 Binary files /dev/null and b/prez/ctc_cost_best.png differ diff --git a/prez/logo.png b/prez/logo.png new file mode 100644 index 0000000..df92477 Binary files /dev/null and b/prez/logo.png differ diff --git a/prez/placeholder.jpg b/prez/placeholder.jpg new file mode 100644 index 0000000..d5c08e0 Binary files /dev/null and b/prez/placeholder.jpg differ diff --git a/prez/prez.tex b/prez/prez.tex new file mode 100644 index 0000000..3befdd0 --- /dev/null +++ b/prez/prez.tex @@ -0,0 +1,449 @@ +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Jacobs Portrait Poster +% LaTeX Template +% Version 1.0 (31/08/2015) +% (Based on Version 1.0 (29/03/13) of the landscape template +% +% Created by: +% Computational Physics and Biophysics Group, Jacobs University +% https://teamwork.jacobs-university.de:8443/confluence/display/CoPandBiG/LaTeX+Poster +% +% Further modified by: +% Nathaniel Johnston (nathaniel@njohnston.ca) +% +% Portrait version by: +% John Hammersley +% +% The landscape version of this template was downloaded from: +% http://www.LaTeXTemplates.com +% +% License: +% CC BY-NC-SA 3.0 (http://creativecommons.org/licenses/by-nc-sa/3.0/) +% +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% + +%---------------------------------------------------------------------------------------- +% PACKAGES AND OTHER DOCUMENT CONFIGURATIONS +%---------------------------------------------------------------------------------------- + +\documentclass[final]{beamer} + +\usepackage[scale=1.24]{beamerposter} % Use the 
beamerposter package for laying out the poster +\usepackage[utf8]{inputenc} + +\usepackage{relsize} + +\usetheme{confposter} % Use the confposter theme supplied with this template + +\setbeamercolor{block title}{fg=ngreen,bg=white} % Colors of the block titles +\setbeamercolor{block body}{fg=black,bg=white} % Colors of the body of blocks +\setbeamercolor{block alerted title}{fg=white,bg=dblue!70} % Colors of the highlighted block titles +\setbeamercolor{block alerted body}{fg=black,bg=dblue!10} % Colors of the body of highlighted blocks +% Many more colors are available for use in beamerthemeconfposter.sty + +%----------------------------------------------------------- +% Define the column widths and overall poster size +% To set effective sepwid, onecolwid and twocolwid values, first choose how many columns you want and how much separation you want between columns +% In this template, the separation width chosen is 0.024 of the paper width and a 4-column layout +% onecolwid should therefore be (1-(# of columns+1)*sepwid)/# of columns e.g. 
(1-(4+1)*0.024)/4 = 0.22 +% Set twocolwid to be (2*onecolwid)+sepwid = 0.464 +% Set threecolwid to be (3*onecolwid)+2*sepwid = 0.708 + +\newlength{\sepwid} +\newlength{\onecolwid} +\newlength{\twocolwid} +\newlength{\threecolwid} +\setlength{\paperwidth}{36in} % A0 width: 33.1in +\setlength{\paperheight}{48in} % A0 height: 46.8in +\setlength{\sepwid}{0.024\paperwidth} % Separation width (white space) between columns +\setlength{\onecolwid}{0.22\paperwidth} % Width of one column +\setlength{\twocolwid}{0.464\paperwidth} % Width of two columns +\setlength{\threecolwid}{0.708\paperwidth} % Width of three columns +\setlength{\topmargin}{-0.5in} % Reduce the top margin size +%----------------------------------------------------------- + +\usepackage{graphicx} % Required for including images + +\usepackage{booktabs} % Top and bottom rules for tables + + +\usepackage{lmodern} +\usepackage{amsmath} +\usepackage{amssymb} +\usepackage{graphicx} + +\usepackage[T1]{fontenc} + +\DeclareFontShape{OMX}{cmex}{m}{n}{ + <-7.5> cmex7 + <7.5-8.5> cmex8 + <8.5-9.5> cmex9 + <9.5-> cmex10 +}{} + +\SetSymbolFont{largesymbols}{normal}{OMX}{cmex}{m}{n} +\SetSymbolFont{largesymbols}{bold} {OMX}{cmex}{m}{n} + +%---------------------------------------------------------------------------------------- +% TITLE SECTION +%---------------------------------------------------------------------------------------- + +\title{Connectionist Temporal Classification: \\Labelling Unsegmented Sequences with \\Recurrent Neural Networks} % Poster title + +\author{Thomas Mesnard, Alex Auvolat} % Author(s) + +\institute{Probabilistic Graphical Models Project, MVA Master} % Institution(s) + +%---------------------------------------------------------------------------------------- + +\begin{document} + +\addtobeamertemplate{block end}{}{\vspace*{2ex}} % White space under blocks +\addtobeamertemplate{block alerted end}{}{\vspace*{2ex}} % White space under highlighted (alert) blocks + 
+\setlength{\belowcaptionskip}{2ex} % White space under figures +\setlength\belowdisplayshortskip{2ex} % White space under equations + +\begin{frame}[t] % The whole poster is enclosed in one beamer frame + +\begin{columns}[t] % The whole poster consists of three major columns, the second of which is split into two columns twice - the [t] option aligns each column's content to the top + +\begin{column}{\sepwid}\end{column} % Empty spacer column + +\begin{column}{\twocolwid} % Begin a column which is two columns wide (column 2) + +\begin{columns}[t,totalwidth=\twocolwid] % Split up the two columns wide column + +\begin{column}{\onecolwid}\vspace{-.6in} % The first column within column 2 (column 2.1) + +%---------------------------------------------------------------------------------------- +% MATERIALS +%---------------------------------------------------------------------------------------- + + +\begin{block}{Abstract} + +Many real-world sequence learning tasks require the prediction of sequences of +labels from noisy, unsegmented input data. Recurrent +neural networks (RNNs) are powerful sequence learners that would seem well +suited to such tasks. However, because they require pre-segmented training +data, and post-processing to transform their outputs into label sequences, +they cannot be applied directly. CTC is a method +for training RNNs to label unsegmented sequences directly, thereby solving both +problems. 
+ +\end{block} + + +%---------------------------------------------------------------------------------------- + +\end{column} % End of column 2.1 + +\begin{column}{\onecolwid}\vspace{-.6in} % The second column within column 2 (column 2.2) + +%---------------------------------------------------------------------------------------- +% METHODS +%---------------------------------------------------------------------------------------- + +\begin{block}{Main Idea} + +RNNs are powerful learners for sequences, but: + +\begin{itemize} +\item Standard methods need pre-segmented training data +\item Need for complex post-processing +\end{itemize} + +CTC solves this problem: + +\begin{itemize} +\item Able to train RNNs using unsegmented training data +\item Learns the segmentation automatically +\item Provides directly usable output +\end{itemize} + +This method is now widely used, even by Google! + +\end{block} + + +%---------------------------------------------------------------------------------------- + +\end{column} % End of column 2.2 + +\end{columns} % End of the split of column 2 - any content after this will now take up 2 columns width + +%---------------------------------------------------------------------------------------- +% IMPORTANT RESULT +%---------------------------------------------------------------------------------------- + +\begin{alertblock}{The problem and how CTC solves it} + +\begin{figure} +\includegraphics[width=0.9\linewidth]{azerty3.png} +\caption{\small Output of classic framewise phoneme classification and RNN trained with CTC} +\end{figure} + +\end{alertblock} + +%---------------------------------------------------------------------------------------- + + +\begin{block}{Model} +\begin{columns}[t,totalwidth=\twocolwid] % Split up the two columns wide column again + + +\begin{column}{\onecolwid} % The first column within column 2 (column 2.1) + +\begin{itemize} +\item Cost function for RNNs +\item RNN outputs probabilities for the 
different symbols, plus blank symbol +\item Many possible alignments for the correct label (shorter than input) +\item Dynamic programming: sums all the possible alignments +\item Provides gradients for the RNN to learn a good alignment +\end{itemize} + +\vspace{1em} +\begin{figure} +\includegraphics[width=0.8\linewidth]{azerty4.png} +\caption{Simple bidirectional RNN model with CTC cost layer} +\end{figure} + +%---------------------------------------------------------------------------------------- + +\end{column} % End of column 2.1 + +\begin{column}{\onecolwid} % The second column within column 2 (column 2.2) + + +CTC is a dynamic programming algorithm that calculates the following sum: +\[ +\alpha_t(s) = \sum_{\substack{\pi \in N^T :\\\mathcal{B}(\pi_{1:t}) = l_{1:s}}} + \prod_{t'=1}^t y_{\pi_{t'}}^{t'} +\] + +Where $\mathcal{B}$ is the transform that removes blanks and duplicates. + +\begin{figure} +\includegraphics[width=\linewidth]{azerty1.png} +\caption{Computation graph for $\alpha_t(s)$ (corresponds to an unrolled automaton)} +\end{figure} + +Tools used for our implementation: +\begin{itemize} +\item Theano (GPU computation library) +\item Blocks (deep learning framework) +\end{itemize} + +%---------------------------------------------------------------------------------------- + +\end{column} % End of column 2.2 + +\end{columns} % End of the split of column 2 + +\end{block} + +\end{column} % End of the second column + + + +\begin{column}{\sepwid}\end{column} % Empty spacer column + + + +%================================================================= + +\begin{column}{\twocolwid} % Begin a column which is two columns wide (column 2) + +\begin{block}{Recurrence equations} + +\begin{columns}[t,totalwidth=\twocolwid] % Split up the two columns wide column +\begin{column}{\onecolwid} % The first column + +We define the following notation: + +$y_k^t$: output at time $t$ for symbol $k$ + +$l$: label, $l'$: label with blanks + +Initialization: +\[ 
+\begin{tabular}{rcl} +$\alpha_1(1)$ &=& $y_b^1$\\ +$\alpha_1(2)$ &=& $y_{l_1}^1$\\ +$\alpha_1(s)$ &=& $0, \forall s > 2$ +\end{tabular} +\] + +Recurrence relation: +\[ +\alpha_t(s) = +\begin{cases} + \bar{\alpha}_t(s) y_{l'_s}^t \mbox{ \; if } l'_s = b\mbox{ or }l'_{s-2}=l'_s \\ + (\bar{\alpha}_t(s)+\alpha_{t-1}(s-2)) y_{l'_s}^t \\ + \hspace{3em} \mbox{ otherwise}\\ +\end{cases} +\] +\[ +\bar{\alpha}_t(s) = \alpha_{t-1}(s) + \alpha_{t-1}(s-1) +\] + +Finally, we have: +\[ +p(l|x) = \alpha_T(|l'|) + \alpha_T(|l'|-1) +\] + +\end{column} +\begin{column}{\sepwid}\end{column} % Empty spacer column +\begin{column}{\onecolwid} % The third column + +\begin{figure} +\includegraphics[width=\linewidth]{azerty2.png} +\caption{Evolution of the CTC error signal} +\end{figure} + +To avoid numerical underflow, at each step $t$: +\[ +C_t = \sum_s \alpha_t(s) +\hspace{1em} +\hat{\alpha}_t(s) = \frac{\alpha_t(s)}{C_t} +\] + +Alternative solution: perform the calculations in the logarithmic domain. + + +\end{column} % End of column 2.2 + +\end{columns} % End of the split of column 2 + + +\end{block} + +\begin{columns}[t,totalwidth=\twocolwid] % Split up the two columns wide column +\begin{column}{\onecolwid} % The first column + +\begin{block}{Toy dataset} + +We first tried our implementation on a simple task: + +{\centering +$1^*2^*3^*4^*5^* \to 1$ \\ +$1^*2^*3^*2^*1^* \to 2$ \\ +$5^*4^*3^*2^*1^* \to 3$ \\ +$5^*4^*3^*4^*5^* \to 4$ \\ +} + +\begin{itemize} +\item An RNN can easily solve this +\item It needs to read the full sequence before predicting a label +\item CTC provides satisfactory results +\end{itemize} + +\begin{table} +\vspace{2ex} +\begin{tabular}{l l l} +\toprule +\textbf{Results} & \textbf{train} & \textbf{valid}\\ +\midrule +Sequence length & 5 -- 20 & 5 -- 20 \\ +Error rate & 0.62 & 0.63 \\ +Mean edit distance & 1.0 & 1.1 \\ +Errors per character & 0.08 & 0.09 \\ +\bottomrule +\end{tabular} +\caption{Performance of CTC on our toy dataset} +\end{table} + +\begin{figure} 
+\includegraphics[width=\linewidth]{ctc_cost_best.png} +\caption{Training and validation cost of the CTC model (negative log likelihood)} +\end{figure} +\end{block} + +\begin{block}{Conclusion} +CTC is a very powerful model, and also has a nice mathematical formulation. It is also widely used in practice (most successful applications: speech recognition, handwriting recognition). +\end{block} + +%------------------------------------------------ + + +%---------------------------------------------------------------------------------------- + +\end{column} % End of the first column + +\begin{column}{\sepwid}\end{column} % Empty spacer column + + +\begin{column}{\onecolwid} % The third column + +\begin{block}{TIMIT} + +We then tried on the classical TIMIT dataset: + +\begin{itemize} +\item Raw speech signal dataset +\item Labelled by phonemes or by words +\item 4120 sentences +\item Average audio length: 50000 samples +\item Avg. sentence length: 38 phonemes +\end{itemize} + +Model: + +\begin{itemize} +\item Convolution layers on raw signal +\item Bidirectional LSTM layers +\item Dropout and noise for regularization +\item CTC cost function +\end{itemize} + +This model avoids hand-crafted feature extraction on the speech signal. However it is extremely complicated to train such models. Our model hasn't converged yet. 
+ +\end{block} + + + +%\setbeamercolor{block alerted title}{fg=black,bg=norange} % Change the alert block title colors +%\setbeamercolor{block alerted body}{fg=black,bg=white} % Change the alert block body colors + +\setbeamercolor{block title}{fg=red,bg=white} % Change the block title color +\begin{block}{Contact Information} + +\begin{itemize} +\item Web: \url{http://github.com/thomasmesnard/CTC-LSTM} +\item Email: \url{thomas.mesnard@ens.fr} + \url{alex.auvolat@ens.fr} +\end{itemize} + +\end{block} + +\setbeamercolor{block title}{fg=red,bg=white} % Change the block title color +\begin{block}{References} + +\nocite{*} % Insert publications even if they are not cited in the poster +\small{\bibliographystyle{unsrt} +\bibliography{sample}\vspace{0.75in}} + + +\end{block} + +% LOGOS +%\begin{center} +%\begin{tabular}{ccc} +%\includegraphics[width=0.4\linewidth]{logo.png} & \hfill & \includegraphics[width=0.4\linewidth]{logo.png} +%\end{tabular} +%\end{center} + +%---------------------------------------------------------------------------------------- + +\end{column} % End of the third column + +\end{columns} % End of all the columns in the poster + +\end{column} % End of the third column + +\end{columns} % End of all the columns in the poster + +\end{frame} % End of the enclosing frame + +\end{document} diff --git a/prez/sample.bib b/prez/sample.bib new file mode 100644 index 0000000..65c0e6c --- /dev/null +++ b/prez/sample.bib @@ -0,0 +1,8 @@ +@inproceedings{graves2006connectionist, + title={Connectionist temporal classification: labelling unsegmented sequence data with recurrent neural networks}, + author={Graves, Alex and Fern{\'a}ndez, Santiago and Gomez, Faustino and Schmidhuber, J{\"u}rgen}, + booktitle={Proceedings of the 23rd international conference on Machine learning}, + pages={369--376}, + year={2006}, + organization={ACM} +} -- cgit v1.2.3