\begin{thebibliography}{22}
% Fallback definitions: each macro below is defined only if it is currently
% undefined (\csname...\endcsname yields \relax for an undefined name).
% \natexlab{<text>}: passes its argument through unchanged.
\expandafter\ifx\csname natexlab\endcsname\relax\def\natexlab#1{#1}\fi
% \url{<text>}: typesets its argument in typewriter type. \texttt is used in
% place of the obsolete {\tt ...} switch, which some classes do not define.
\expandafter\ifx\csname url\endcsname\relax
  \def\url#1{\texttt{#1}}\fi

\bibitem[Ben-Hur et~al.(2002)Ben-Hur, Elisseeff, and Guyon]{psb02}
A.~Ben-Hur, A.~Elisseeff, and I.~Guyon.
\newblock A stability based method for discovering structure in clustered data.
\newblock in Pacific Symposium on Biocomputing, 2002.

\bibitem[Ben-Hur et~al.(2000)Ben-Hur, Horn, Siegelmann, and Vapnik]{vclust}
A.~Ben-Hur, D.~Horn, H.T. Siegelmann, and V.~Vapnik.
\newblock A support vector clustering method.
\newblock in International Conference on Pattern Recognition, 2000.

\bibitem[Ben-Hur et~al.(2001)Ben-Hur, Horn, Siegelmann, and Vapnik]{nips00}
A.~Ben-Hur, D.~Horn, H.T. Siegelmann, and V.~Vapnik.
\newblock A support vector clustering method.
\newblock in Advances in Neural Information Processing Systems 13: Proceedings
  of the 2000 Conference, Todd K. Leen, Thomas G. Dietterich and Volker Tresp
  eds., 2001.

\bibitem[Blake and Merz(1998)]{UCI}
C.L. Blake and C.J. Merz.
\newblock UCI repository of machine learning databases, 1998.

\bibitem[Blatt et~al.(1997)Blatt, Wiseman, and Domany]{blatt}
Marcelo Blatt, Shai Wiseman, and Eytan Domany.
\newblock Data clustering using a model granular magnet.
\newblock {\em Neural Computation}, 9\penalty0 (8):\penalty0 1805--1842, 1997.

\bibitem[Duda et~al.(2001)Duda, Hart, and Stork]{dhs}
R.O. Duda, P.E. Hart, and D.G. Stork.
\newblock {\em Pattern Classification}.
\newblock John Wiley \& Sons, New York, 2001.

\bibitem[Fisher(1936)]{iris}
R.A. Fisher.
\newblock The use of multiple measurements in taxonomic problems.
\newblock {\em Annals of Eugenics}, 7:\penalty0 179--188, 1936.

\bibitem[Fletcher(1987)]{fletcher}
R.~Fletcher.
\newblock {\em Practical Methods of Optimization}.
\newblock Wiley-Interscience, Chichester, 1987.

\bibitem[Fukunaga(1990)]{fukunaga}
K.~Fukunaga.
\newblock {\em Introduction to Statistical Pattern Recognition}.
\newblock Academic Press, San Diego, CA, 1990.

\bibitem[Jain and Dubes(1988)]{jain}
A.K. Jain and R.C. Dubes.
\newblock {\em Algorithms for clustering data}.
\newblock Prentice Hall, Englewood Cliffs, NJ, 1988.

\bibitem[Lipson and Siegelmann(2000)]{lipson}
H.~Lipson and H.T. Siegelmann.
\newblock Clustering irregular shapes using high-order neurons.
\newblock {\em Neural Computation}, 12:\penalty0 2331--2353, 2000.

\bibitem[MacQueen(1965)]{kmeans1}
J.~MacQueen.
\newblock Some methods for classification and analysis of multivariate
  observations.
\newblock in Proc. 5th Berkeley Symposium on Mathematical Statistics and
  Probability, Vol. 1, 1965.

\bibitem[Milligan and Cooper(1985)]{milligan}
G.W. Milligan and M.C. Cooper.
\newblock An examination of procedures for determining the number of clusters
  in a data set.
\newblock {\em Psychometrika}, 50:\penalty0 159--179, 1985.

\bibitem[Platt(1999)]{SMO}
J.~Platt.
\newblock Fast training of support vector machines using sequential minimal
  optimization.
\newblock in Advances in Kernel Methods --- Support Vector Learning,
  B.~Sch{\"o}lkopf, C.~J.~C. Burges, and A.~J. Smola, editors, 1999.

\bibitem[Ripley(1996)]{ripley}
B.D. Ripley.
\newblock {\em Pattern recognition and neural networks}.
\newblock Cambridge University Press, Cambridge, 1996.

\bibitem[Roberts(1997)]{roberts}
S.J. Roberts.
\newblock Non-parametric unsupervised cluster analysis.
\newblock {\em Pattern Recognition}, 30(2):\penalty0 261--272, 1997.

\bibitem[Sch{\"o}lkopf et~al.(2000)Sch{\"o}lkopf, Williamson, Smola,
  Shawe-Taylor, and Platt]{sch-sup}
B.~Sch{\"o}lkopf, R.C. Williamson, A.J. Smola, J.~Shawe-Taylor, and J.~Platt.
\newblock Support vector method for novelty detection.
\newblock in Advances in Neural Information Processing Systems 12: Proceedings
  of the 1999 Conference, Sara A. Solla, Todd K. Leen and Klaus-Robert M{\"u}ller
  eds., 2000.

\bibitem[Sch{\"o}lkopf et~al.(2001)Sch{\"o}lkopf, Platt, Shawe-Taylor, Smola,
  and Williamson]{sch-sup1}
Bernhard Sch{\"o}lkopf, John~C. Platt, John Shawe-Taylor, Alex~J. Smola, and
  Robert~C. Williamson.
\newblock Estimating the support of a high-dimensional distribution.
\newblock {\em Neural Computation}, 13:\penalty0 1443--1471, 2001.

\bibitem[Shamir and Sharan(2000)]{shamir-gen}
R.~Shamir and R.~Sharan.
\newblock Algorithmic approaches to clustering gene expression data.
\newblock in T.~Jiang, T.~Smith, Y.~Xu, and M.Q. Zhang, editors, Current Topics
  in Computational Biology, 2000.

\bibitem[Tax and Duin(1999)]{tax-duin}
D.M.J. Tax and R.P.W. Duin.
\newblock Support vector domain description.
\newblock {\em Pattern Recognition Letters}, 20:\penalty0 1991--1999, 1999.

\bibitem[Tishby and Slonim(2001)]{bottleneck-nips}
N.~Tishby and N.~Slonim.
\newblock Data clustering by {M}arkovian relaxation and the information
  bottleneck method.
\newblock in Advances in Neural Information Processing Systems 13: Proceedings
  of the 2000 Conference, Todd K. Leen, Thomas G. Dietterich and Volker Tresp
  eds., 2001.

\bibitem[Vapnik(1995)]{Vapnik95}
V.~Vapnik.
\newblock {\em The Nature of Statistical Learning Theory}.
\newblock Springer, New York, 1995.

\end{thebibliography}
