]> www.fi.muni.cz Git - pan13-paper.git/blob - pan13-poster/poster.tex
1. nastrel
[pan13-paper.git] / pan13-poster / poster.tex
1 \documentclass[a0,portrait]{sciposter}\r
2 \r
3 \usepackage{epsfig}\r
4 \usepackage{amsmath}\r
5 \usepackage{amssymb}\r
6 \usepackage{multicol}\r
7 \usepackage{bera}\r
8 \usepackage[utf8]{inputenc}\r
9 %\usepackage{fancybullets}\r
10 \r
11 \definecolor{BoxCol}{rgb}{0.9,0.9,1}\r
12 % uncomment for light blue background to \section boxes \r
13 % for use with default option boxedsections\r
14 \r
15 \definecolor{SectionCol}{rgb}{0,0,0.5}\r
16 % uncomment for dark blue \section text \r
17 \r
18 \definecolor{ReallyEmph}{rgb}{0.7,0,0}\r
19 \r
20 \renewcommand{\titlesize}{\Huge}\r
21 \title{Diverse Queries and Feature Type Selection \\ for Plagiarism Discovery}\r
22 \r
23 % Note: only give author names, not institute\r
24 \author{Šimon Suchomel, Jan Kasprzak, and Michal Brandejs}\r
25  \r
26 % insert correct institute name\r
27 \institute{Faculty of Informatics, Masaryk University, Brno, Czech Republic}\r
28 \r
29 % \email{kas@fi.muni.cz}  % shows author email address below institute\r
30 \r
31 %\date is unused by the current \maketitle\r
32 \r
33 \font\logofont=fi-logo600 at .16\textwidth\r
34 \r
35 \renewcommand{\sectionsize}{\Large}\r
36 \r
% Inline emphasis helpers. Each takes one argument and prints it in the SectionCol colour.\r
% \cemph: sans-serif, bold, italic.\r
37 \newcommand{\cemph}[1]{{\sffamily\bfseries\itshape \textcolor{SectionCol}{#1}}}\r
% \lemph: roman, italic.\r
38 \newcommand{\lemph}[1]{{\rmfamily\itshape \textcolor{SectionCol}{#1}}}\r
% \eitem: starts a new list \item whose argument is typeset with \cemph.\r
39 \newcommand{\eitem}[1]{\item \cemph{#1}}\r
40 \r
% ytemize: a wrapper around itemize that sets \itemsep and \parskip to 0pt\r
% right after the list is opened, so the items are set without that extra\r
% vertical space.\r
41 \newenvironment{ytemize}\r
42   { \begin{itemize}\r
43         \setlength{\itemsep}{0pt}\r
44         \setlength{\parskip}{0pt}\r
45   }\r
46   { \end{itemize} }\r
47 \r
48 \conference{{\bf CLEF 2013}, 23--27 September 2013, Valencia, Spain}\r
49 \r
50 \setlength{\figbotskip}{\smallskipamount}\r
51 \r
52 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%\r
53 %%% Begin of Document\r
54 \r
55 \begin{document}\r
56 \r
57 \r
58 %\LEFTSIDEfootlogo  \r
59 % Uncomment to put footer logo on left side, and \r
60 % conference name on right side of footer\r
61 \r
62 % Some examples of caption control (remove % to check result)\r
63 \r
64 %\renewcommand{\algorithmname}{Algoritme} % for Dutch\r
65 \r
66 %\renewcommand{\mastercapstartstyle}[1]{\textit{\textbf{#1}}}\r
67 %\renewcommand{\algcapstartstyle}[1]{\textsc{\textbf{#1}}}\r
68 %\renewcommand{\algcapbodystyle}{\bfseries}\r
69 %\renewcommand{\thealgorithm}{\Roman{algorithm}}\r
70 \r
71 % \maketitle\r
72 \r
73 \vspace*{-.06\textwidth}\r
74 \r
75 \hbox to \hsize{\r
76 \begin{minipage}[c]{.11\textwidth}\r
77         \vspace{-.75\textwidth}\r
78         \hbox{\hskip -.83\textwidth\includegraphics[width=3\textwidth]{znak_MU_modry}\hskip -\textwidth}\r
79         \vspace{-\textwidth}\r
80 \end{minipage}\r
81 \hfil\r
82 \begin{minipage}[c]{.7\textwidth}\r
% Hand-rolled replacement for \maketitle: title, authors, institute and,\r
% when \printemail is non-empty, the e-mail address.\r
% \@title and \@author contain `@', which is not a letter in the document\r
% body; without \makeatletter TeX reads them as \@ followed by the literal\r
% words "title" and "author". The \makeatletter below is issued inside the\r
% center environment, so the catcode change ends with that group.\r
83 \begin{center}\r
84       \makeatletter\renewcommand{\baselinestretch}{2.0}\normalsize\r
85       {\titlesize \bf \@title}\par\r
86       \renewcommand{\baselinestretch}{1.0}\normalsize            \r
87       \vspace{0.4\titleskip}\r
88       {\authorsize {\bf\@author} \par}\r
89       {\instsize\r
90        \vspace{0.2\titleskip}\r
91        \theinstitute \par\r
92        \ifthenelse{\equal{\printemail}{}}{%nothing\r
93          }{%\r
94          \vspace{0.2\titleskip}\r
95          \texttt{\printemail}\r
96          }\r
97       }\r
98 \end{center}\r
99 \end{minipage}\r
100 \hfil\r
101 \begin{minipage}[c]{.15\textwidth}\r
102         \hbox to \hsize{\logofont SL\hss}\r
103 \end{minipage}\r
104 }\r
105 \r
106 \vspace{-.02\textwidth}\r
107 \r
108 %%% Begin of Multicols-Environment\r
109 %\begin{abstract}\r
110 %{\sffamily\itshape\r
111 %Nějaký abstrakt.\r
112 %}\r
113 %\end{abstract}\r
114 \r
115 \r
116 \begin{multicols}{2}\setlength{\columnseprule}{0pt}\r
117 \r
118 \r
119 \section{Introduction}\r
120 PAN 2013 Lorem ipsum Lorem ipsum Lorem ipsum Lorem ipsum Lorem ipsum Lorem ipsum Lorem ipsum \r
121 \r
122 \r
123 \r
% Figure showing the plagiarism discovery process.\r
% It is placed inside a two-column multicols block, so its width is given\r
% relative to the current column (\linewidth); \textwidth would still refer\r
% to the full poster width and make the image wider than its column.\r
124 \begin{figure}\r
125  \centering\r
126   \includegraphics[width=0.8\linewidth]{img/source_retrieval_process.pdf}\r
127   \caption{Plagiarism discovery process.}\r
128   \label{fig:process}\r
129 \end{figure} \r
130 \r
131 \r
132 \end{multicols}\r
133 \r
134 \r
135 \r
136 \begin{multicols}{2}\r
137 \r
138 %\rm\r
139 \r
140 %%% Introduction\r
141 \section{Querying}\r
142 Querying means effectively utilizing the search engine in order to retrieve as many relevant\r
143 documents as possible with the minimum number of queries.\r
144 %We consider the resulting document relevant if it shares some text characteristics with the suspicious document.\r
145 In real-world settings, queries represent an appreciable cost; therefore, their minimization should be one of the top priorities.\r
146 \subsection{Types of Queries}\r
147 Three diverse types of queries were extracted from the suspicious document.\r
148 \subsubsection{Keywords Based Queries}\r
149 \begin{ytemize}\r
150 \item TF--IDF based automated keyword extraction;\r
151 \item 5-token long; \r
152 \item Deterministic;\r
153 \item Non-positional;\r
154 \item Non-phrasal.\r
155 \end{ytemize}\r
156 \subsubsection{Intrinsic Plagiarism Based Queries}\r
157 \begin{ytemize}\r
158 \item Averaged Word Frequency Class based chunking~\cite{AWFC};\r
159 \item Random sentence selection from the chunk;\r
160 \item Non-deterministic;\r
161 \item Positional;\r
162 \item Phrasal.\r
163 \end{ytemize}\r
164 \subsubsection{Paragraph Based Queries}\r
165 \begin{ytemize}\r
166 \item Longest sentences from miscellaneous paragraphs;\r
167 \item Deterministic;\r
168 \item Positional;\r
169 \item Phrasal.\r
170 \end{ytemize}\r
171 \r
172 \section{Selecting}\r
% Figure showing downloads and similarities performance.\r
% It is placed inside a two-column multicols block, so its width is given\r
% relative to the current column (\linewidth); \textwidth would still refer\r
% to the full poster width and make the image wider than its column.\r
173 \begin{figure}\r
174   \centering\r
175   \includegraphics[width=0.8\linewidth]{img/snippets_graph.pdf}\r
176   \caption{Downloads and similarities performance.}\r
177   \label{fig:snippet_graph}\r
178 \end{figure}\r
179 \r
180 \section{Text Alignment}\r
181 \r
182 \section{Conclusion}\r
183 \r
184 Nějaký závěr\r
185 \r
186 %%% References\r
187 \r
188 %% Note: use of BibTeX also works!!\r
189 \r
190 \bibliographystyle{plain}\r
191 \begin{thebibliography}{1}\r
192 \r
193 \bibitem{ISMU}\r
194 \cemph{Masaryk University Information System}\\\r
195 {\tt http://is.muni.cz/}, contact: {\tt iscor@fi.muni.cz}.\r
196 \r
197 \bibitem{Theses}\r
198 \cemph{Czech National Archive of Graduate Theses}\\\r
199 {\tt http://theses.cz/}, contact: {\tt theses@fi.muni.cz}.\r
200 \r
201 \bibitem{AWFC}\r
202 \cemph{Sven Meyer zu Eissen and Benno Stein: Intrinsic Plagiarism Detection}\\\r
203 {\tt Proceedings of the European Conference on Information Retrieval (ECIR-06)}, {\tt 2006}.\r
204 \r
205 \end{thebibliography}\r
206 \r
207 \smallskip\r
208 \hrule height .1em\r
209 \medskip\r
210 \r
211 % \sffamily\r
212 \r
213 QR kód?\r
214 \r
215 \cemph{Contact information:}\\\r
216         Šimon Suchomel, {\tt suchomel@fi.muni.cz},\\\r
217         Jan Kasprzak, {\tt kas@fi.muni.cz}.\r
218 \r
219 \r
220 \end{multicols}\r
221 \r
222 \end{document}\r
223 \r