\begin{thebibliography}{30}
% Fallback: if \natexlab is undefined (or \relax), define it to pass its
% argument through unchanged.
\expandafter\ifx\csname natexlab\endcsname\relax\def\natexlab#1{#1}\fi
% Fallback: if \url is undefined (or \relax), define it to set its argument in
% typewriter type; an existing definition of \url is left untouched.
\expandafter\ifx\csname url\endcsname\relax
  \def\url#1{{\tt #1}}\fi

\bibitem[Allwein et~al.(2000)Allwein, Schapire, and Singer]{AllweinScSi00}
E.L. Allwein, R.E. Schapire, and Y.~Singer.
\newblock Reducing multiclass to binary: A unifying approach for margin
  classifiers.
\newblock In {\em Machine Learning: Proceedings of the Seventeenth
  International Conference}, 2000.

\bibitem[Boser et~al.(1992)Boser, Guyon, and Vapnik]{BoserGuVa92}
Bernhard~E. Boser, Isabelle~M. Guyon, and Vladimir~N. Vapnik.
\newblock A training algorithm for optimal margin classifiers.
\newblock In {\em Proceedings of the Fifth Annual ACM Workshop on Computational
  Learning Theory}, pages 144--152, 1992.

\bibitem[Bredensteiner and Bennett(1999)]{BredensteinerBe99}
E.~J. Bredensteiner and K.~P. Bennett.
\newblock Multicategory classification by support vector machines.
\newblock {\em Computational Optimization and Applications}, 12:\penalty0
  53--79, 1999.

\bibitem[Bregman(1967)]{Bregman67}
L.~M. Bregman.
\newblock The relaxation method of finding the common point of convex sets and
  its application to the solution of problems in convex programming.
\newblock {\em {USSR} Computational Mathematics and Mathematical Physics},
  7:\penalty0 200--217, 1967.

\bibitem[Breiman et~al.(1984)Breiman, Friedman, Olshen, and
  Stone]{BreimanFrOlSt84}
Leo Breiman, Jerome~H. Friedman, Richard~A. Olshen, and Charles~J. Stone.
\newblock {\em Classification and Regression Trees}.
\newblock Wadsworth \& Brooks, 1984.

\bibitem[Burges(1998)]{Burges98}
C.J.C. Burges.
\newblock A tutorial on support vector machines for pattern recognition.
\newblock {\em Data Mining and Knowledge Discovery}, 2\penalty0 (2):\penalty0
  1--47, 1998.

\bibitem[Censor and Zenios(1997)]{CensorZe97}
Yair Censor and Stavros~A. Zenios.
\newblock {\em Parallel Optimization: Theory, Algorithms and Applications}.
\newblock Oxford University Press, 1997.

\bibitem[Collobert and Bengio(2001)]{CollobertBe01}
Ronan Collobert and Samy Bengio.
\newblock {SVM}torch: Support vector machines for large-scale regression
  problems.
\newblock {\em Journal of Machine Learning Research}, 1:\penalty0 143--160,
  2001.

\bibitem[Cortes and Vapnik(1995)]{CortesVa95}
Corinna Cortes and Vladimir Vapnik.
\newblock Support-vector networks.
\newblock {\em Machine Learning}, 20\penalty0 (3):\penalty0 273--297, September
  1995.

\bibitem[Crammer and Singer(2000)]{CrammerSi00}
Koby Crammer and Yoram Singer.
\newblock On the learnability and design of output codes for multiclass
  problems.
\newblock In {\em Proceedings of the Thirteenth Annual Conference on
  Computational Learning Theory}, 2000.

\bibitem[Crammer and Singer(2001)]{CrammerSi01}
Koby Crammer and Yoram Singer.
\newblock Ultraconservative online algorithms for multiclass problems.
\newblock In {\em Proceedings of the Fourteenth Annual Conference on
  Computational Learning Theory}, 2001.

\bibitem[Cristianini and Shawe-Taylor(2000)]{CristianiniSh00}
Nello Cristianini and John Shawe-Taylor.
\newblock {\em An Introduction to Support Vector Machines}.
\newblock Cambridge University Press, 2000.

\bibitem[DeCoste and Sch\"olkopf(2001)]{DeCosteSc01}
Dennis DeCoste and Bernhard Sch\"olkopf.
\newblock Training invariant support vector machines.
\newblock {\em Machine Learning}, 46\penalty0 (1--3):\penalty0 133--168, 2001.

\bibitem[Dietterich(2000)]{Dietterich00}
Thomas~G. Dietterich.
\newblock An experimental comparison of three methods for constructing
  ensembles of decision trees: Bagging, boosting, and randomization.
\newblock {\em Machine Learning}, 40\penalty0 (2):\penalty0 139--158, 2000.

\bibitem[Dietterich and Bakiri(1995)]{DietterichBa95}
Thomas~G. Dietterich and Ghulum Bakiri.
\newblock Solving multiclass learning problems via error-correcting output
  codes.
\newblock {\em Journal of Artificial Intelligence Research}, 2:\penalty0
  263--286, January 1995.

\bibitem[Freund and Schapire(1997)]{FreundSc97}
Yoav Freund and Robert~E. Schapire.
\newblock A decision-theoretic generalization of on-line learning and an
  application to boosting.
\newblock {\em Journal of Computer and System Sciences}, 55\penalty0
  (1):\penalty0 119--139, August 1997.

\bibitem[Guermeur et~al.(2000)Guermeur, Elisseeff, and
  Paugam-Moisy]{GuermeurElPa00}
Y.~Guermeur, A.~Elisseeff, and H.~Paugam-Moisy.
\newblock A new multi-class {SVM} based on a uniform convergence result.
\newblock In V.~Piuri et~al., editors, {\em Proceedings of IJCNN-2000}, 2000.

\bibitem[H\"offgen and Simon(1992)]{HoffgenSi92}
Klaus-U. H\"offgen and Hans-U. Simon.
\newblock Robust trainability of single neurons.
\newblock In {\em Proceedings of the Fifth Annual ACM Workshop on Computational
  Learning Theory}, pages 428--439, Pittsburgh, Pennsylvania, July 1992.

\bibitem[Joachims(1998)]{Joachims98}
Thorsten Joachims.
\newblock Making large-scale support vector machine learning practical.
\newblock In B.~Sch\"olkopf, C.~Burges, and A.~Smola, editors, {\em Advances in
  Kernel Methods---Support Vector Learning}. MIT Press, 1998.

\bibitem[Keerthi and Gilbert(2000)]{KeerthiGi00}
S.S. Keerthi and E.G. Gilbert.
\newblock Convergence of a generalized {SMO} algorithm for {SVM} classifier design.
\newblock Technical Report CD-00-01, Control Division, Dept. of Mechanical and
  Production Engineering, National University of Singapore, 2000.

\bibitem[Lin(2001)]{Lin01}
C.-J. Lin.
\newblock Stopping criteria of decomposition methods for support vector
  machines: a theoretical justification.
\newblock Technical report, Department of Computer Science and Information
  Engineering, National Taiwan University, May 2001.

\bibitem[Platt(1998)]{Platt98}
J.C. Platt.
\newblock Fast training of {Support Vector Machines} using sequential minimal
  optimization.
\newblock In B.~Sch\"olkopf, C.~Burges, and A.~Smola, editors, {\em Advances in
  Kernel Methods---Support Vector Learning}. MIT Press, 1998.

\bibitem[Platt et~al.(2000)Platt, Cristianini, and Shawe-Taylor]{PlattCrSh00}
J.C. Platt, N.~Cristianini, and J.~Shawe-Taylor.
\newblock Large margin {DAG}s for multiclass classification.
\newblock In {\em Advances in Neural Information Processing Systems 12}, pages
  547--553. MIT Press, 2000.

\bibitem[Quinlan(1993)]{Quinlan93}
J.~Ross Quinlan.
\newblock {\em C4.5: Programs for Machine Learning}.
\newblock Morgan Kaufmann, 1993.

\bibitem[Schapire and Singer(1999)]{SchapireSi99}
Robert~E. Schapire and Yoram Singer.
\newblock Improved boosting algorithms using confidence-rated predictions.
\newblock {\em Machine Learning}, 37\penalty0 (3):\penalty0 1--40, 1999.

\bibitem[{Sch\"olkopf}(1997)]{Scholkopf97}
B.~{Sch\"olkopf}.
\newblock {\em Support Vector Learning}.
\newblock PhD thesis, GMD First, 1997.

\bibitem[Sch\"olkopf et~al.(1998)Sch\"olkopf, Burges, and
  Smola]{ScholkopfBuSm98}
B.~Sch\"olkopf, C.~Burges, and A.~Smola, editors.
\newblock {\em Advances in Kernel Methods---Support Vector Learning}.
\newblock MIT Press, 1998.

\bibitem[{Sch\"olkopf} et~al.(1996){Sch\"olkopf}, Sung, Burges, Girosi, Niyogi,
  Poggio, and Vapnik]{ScholkopfSuBuGiNiPoVa97}
B.~{Sch\"olkopf}, K.~Sung, C.~Burges, F.~Girosi, P.~Niyogi, T.~Poggio, and
  V.~Vapnik.
\newblock Comparing support vector machines with {G}aussian kernels to radial
  basis function classifiers.
\newblock Technical Report A.I.~Memo No. 1599, Massachusetts Institute of
  Technology, 1996.

\bibitem[Vapnik(1998)]{Vapnik98}
Vladimir~N. Vapnik.
\newblock {\em Statistical Learning Theory}.
\newblock Wiley, 1998.

\bibitem[Weston and Watkins(1999)]{WestonWa99}
J.~Weston and C.~Watkins.
\newblock Support vector machines for multi-class pattern recognition.
\newblock In {\em Proceedings of the Seventh European Symposium on Artificial
  Neural Networks}, April 1999.

\end{thebibliography}
