\relax 
\bibstyle{plainnat}
\citation{Joa}
\@writefile{toc}{\contentsline {section}{\numberline {1}Introduction}{419}}
\citation{CriSha-book}
\citation{Vapnik95}
\citation{BosGuyVap92}
\citation{CriSha-book}
\citation{Scholkopf97}
\citation{Watkins00}
\citation{Haussler99}
\citation{stker2000}
\citation{Joa}
\citation{Saltonetal75}
\citation{Joa}
\citation{Watkins00}
\citation{Haussler99}
\citation{crisetal}
\citation{BosGuyVap92}
\@writefile{toc}{\contentsline {section}{\numberline {2}Kernels and Support Vector Machines}{421}}
\citation{Mercer}
\@writefile{toc}{\contentsline {section}{\numberline {3}A Kernel for Text Sequences- A Step beyond Words}{422}}
\citation{Watkins00}
\citation{Haussler99}
\newlabel{string-ker}{{1}{423}}
\newlabel{recurdef}{{2}{424}}
\citation{cavnar95}
\citation{huffman96}
\newlabel{nglia}{{3}{425}}
\citation{KA-ICML}
\citation{CriSha-book}
\@writefile{toc}{\contentsline {section}{\numberline {4}Experimental Results}{426}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.1}Effectiveness of Varying Sequence length}{427}}
\@writefile{lot}{\contentsline {table}{\numberline {1}{\ignorespaces The performance (F1, precision, recall) of SVM with SSK, NGK and WK for Reuters categories earn and acq. Results illustrate the effect of the variability of subsequence length on performance. The results are averaged over 10 runs of the techniques. We also report standard deviation.}}{428}}
\newlabel{earnacqlen}{{1}{428}}
\@writefile{lot}{\contentsline {table}{\numberline {2}{\ignorespaces The performance (F1, precision, recall) of SVM with SSK, NGK and WK for Reuters categories crude and corn. Results illustrate the effect of the variability of subsequence length on performance. The results are averaged over 10 runs of the techniques. We also report standard deviation.}}{429}}
\newlabel{crudecornlen}{{2}{429}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2}Effectiveness of Varying Weight Decay Factor}{430}}
\@writefile{lot}{\contentsline {table}{\numberline {3}{\ignorespaces The performance (F1, precision, recall) of SVM with SSK, NGK and WK for Reuters categories earn and acq. Results illustrate the impact of varying $\lambda $ on performance of SSK. The results are averaged over 10 runs of the techniques. We also report standard deviation.}}{431}}
\newlabel{earnacqlam}{{3}{431}}
\@writefile{lot}{\contentsline {table}{\numberline {4}{\ignorespaces The performance (F1, precision, recall) of SVM with SSK, NGK and WK for Reuters categories crude and corn. Results illustrate the impact of varying $\lambda $ on performance of SSK. The results are averaged over 10 runs of the techniques. We also report standard deviation.}}{432}}
\newlabel{crudecornlam}{{4}{432}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3}Effectiveness of Combining Kernels}{433}}
\@writefile{lot}{\contentsline {table}{\numberline {5}{\ignorespaces The performance (F1, precision, recall) of SVM with combined kernels for Reuters categories earn, acq, corn and crude. The SSK for different lengths have been combined. The results are averaged and standard deviation is also given.}}{434}}
\newlabel{comblen}{{5}{434}}
\citation{Scholkopfetal}
\@writefile{toc}{\contentsline {section}{\numberline {5}Approximating Kernels}{435}}
\newlabel{sec:approximate}{{5}{435}}
\@writefile{lot}{\contentsline {table}{\numberline {6}{\ignorespaces The performance (F1, precision, recall) of SVM with combined kernels for Reuters categories earn, acq, corn and crude. The SSK and NGK are combined. The results are averaged and standard deviation is also given.}}{436}}
\newlabel{comsskngk}{{6}{436}}
\citation{willsee}
\citation{SmoSch}
\@writefile{lot}{\contentsline {table}{\numberline {7}{\ignorespaces The performance (F1, precision, recall) of SVM with combined kernels for Reuters categories earn, acq, corn and crude. The SSK for different $\lambda $'s have been combined. The results are averaged and standard deviation is also given.}}{437}}
\newlabel{comblam}{{7}{437}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.1}Choosing a subset of features}{437}}
\citation{crisetal}
\citation{crisetal}
\citation{crielishawe}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2}Similarity of Gram Matrices}{438}}
\@writefile{toc}{\contentsline {section}{\numberline {6}Approximating the string kernel}{438}}
\newlabel{string:approx}{{6}{438}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.1}Obtaining the approximation}{439}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.2}Selecting the subset}{439}}
\citation{joachims}
\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces Alignment scores (against the Gram matrix generated by the full string kernel) when using the most frequent, infrequent and random selection of features.}}{440}}
\newlabel{fig:alignment}{{1}{440}}
\@writefile{toc}{\contentsline {section}{\numberline {7}Experimental Results}{440}}
\newlabel{sec:experiments}{{7}{440}}
\citation{stker2000}
\@writefile{lot}{\contentsline {table}{\numberline {8}{\ignorespaces F1 numbers for 4 Reuters categories. Comparing different numbers of features in the approximation to the SSK on 4 categories of the Reuters dataset.}}{441}}
\newlabel{table:Reuters}{{8}{441}}
\@writefile{lot}{\contentsline {table}{\numberline {9}{\ignorespaces F1 numbers for SVM with WK, NGK and SSK for top-ten Reuters categories.}}{441}}
\newlabel{ngkapproxssk}{{9}{441}}
\@writefile{toc}{\contentsline {section}{\numberline {8}Conclusions}{441}}
\citation{Joa}
\bibdata{stringfinal}
\bibcite{BosGuyVap92}{{1}{1992}{{Boser et~al.}}{{Boser, Guyon, and Vapnik}}}
\bibcite{cavnar95}{{2}{1994}{{Cavnar}}{{}}}
\bibcite{crielishawe}{{3}{2001}{{Cristianini et~al.}}{{Cristianini, Elisseef, and Shawe-Taylor}}}
\bibcite{crisetal}{{4}{to appear}{{Cristianini et~al.}}{{Cristianini, Elisseef, and Shawe-Taylor}}}
\bibcite{CriSha-book}{{5}{2000}{{Cristianini and Shawe-Taylor}}{{}}}
\bibcite{KA-ICML}{{6}{1998}{{Friess et~al.}}{{Friess, Cristianini, and Campbell}}}
\bibcite{Haussler99}{{7}{1999}{{Haussler}}{{}}}
\bibcite{huffman96}{{8}{1995}{{Huffman}}{{}}}
\bibcite{Joa}{{9}{1998}{{Joachims}}{{}}}
\bibcite{joachims}{{10}{1999}{{Joachims}}{{}}}
\bibcite{stker2000}{{11}{2001}{{Lodhi et~al.}}{{Lodhi, Shawe-Taylor, Cristianini, and Watkins}}}
\bibcite{Mercer}{{12}{1909}{{Mercer}}{{}}}
\bibcite{Saltonetal75}{{13}{1975}{{Salton et~al.}}{{Salton, Wong, and Yang}}}
\bibcite{Scholkopf97}{{14}{1997}{{Sch\"olkopf}}{{}}}
\bibcite{Scholkopfetal}{{15}{1999}{{{Sch\"olkopf} et~al.}}{{{Sch\"olkopf}, Mika, Burges, Knirsch, K.-R.M{\"u}ller, R{\"a}tsch, and Smola}}}
\bibcite{SmoSch}{{16}{2000}{{Smola and Sch\"olkopf}}{{}}}
\bibcite{Vapnik95}{{17}{1995}{{Vapnik}}{{}}}
\bibcite{Watkins00}{{18}{2000}{{Watkins}}{{}}}
\bibcite{willsee}{{19}{2001}{{Williams and Seeger}}{{}}}
