% This is the bibliography of
%
% `Pattern Recognition and Neural Networks' by B.D. Ripley
% Cambridge University Press 1996 0-521-46086-7.
%
%  This file is converted from the database used for the 1997
%  second printing
%
% Copyright 1996 B.D. Ripley.
% All uses must carry this notice.
%
%
% Reprint notes; entries attach these through their `note` field.
@string{NNset   = {[Reprinted in \cite{Dasarathy.91}]}}
@string{MLset   = {[Reprinted in \cite{Shavlik.Dietterich.90}]}}
@string{URset   = {[Reprinted in \cite{Shafer.Pearl.90}]}}
@string{rep-Lau = {[Reprinted in \cite{Lau.92}]}}

% Journal titles.
@string{AnnMathStat = {Annals of Mathematical Statistics}}
@string{AnnStat     = {Annals of Statistics}}
@string{ApplStat    = {Applied Statistics}}
@string{AI          = {Artificial Intelligence}}
@string{AuRC        = {Automation and Remote Control}}
@string{BioCyb      = {Biological Cybernetics}}
@string{Biom        = {Biometrics}}
@string{Bka         = {Biometrika}}
@string{CSDA        = {Computational Statistics and Data Analysis}}
@string{CSTM        = {Communications in Statistics---Theory and Methods}}
@string{CMwA        = {Computers and Mathematics with Applications}}
@string{ComSys      = {Complex Systems}}
@string{IEEC        = {IEEE Transactions on Electronic Computers}}
@string{IEC         = {IEEE Transactions on Computers}}
@string{IEIT        = {IEEE Transactions on Information Theory}}
@string{InfoComp    = {Information and Computation}}
@string{IJNS        = {International Journal of Neural Systems}}
@string{IJPRAI      = {International Journal of Pattern Recognition and Artificial Intelligence}}
@string{ISR         = {International Statistical Review}}
@string{JASA        = {Journal of the American Statistical Association}}
@string{JCGS        = {Journal of Computational and Graphical Statistics}}
@string{JRSSA       = {Journal of the Royal Statistical Society series A}}
@string{JRSSB       = {Journal of the Royal Statistical Society series B}}
@string{ML          = {Machine Learning}}
@string{MathProg    = {Mathematical Programming}}
@string{Nat         = {Nature}}
@string{Nks         = {Networks}}
@string{NC          = {Neural Computation}}
@string{NNks        = {Neural Networks}}
@string{PIEEE       = {Proceedings of the IEEE}}
@string{PNAS        = {Proceedings of the National Academy of Sciences of the USA}}
@string{PR          = {Pattern Recognition}}
@string{PRL         = {Pattern Recognition Letters}}
@string{Psym        = {Psychometrika}}
@string{SMC         = {IEEE Transactions on Systems, Man and Cybernetics}}
@string{PAMI        = {IEEE Transactions on Pattern Analysis and Machine Intelligence}}
@string{SIAMSSC     = {SIAM Journal on Scientific and Statistical Computing}}
@string{StatComp    = {Statistics and Computing}}
@string{StatSci     = {Statistical Science}}
@string{Techno      = {Technometrics}}
@string{TNN         = {IEEE Transactions on Neural Networks}}
@string{TOMS        = {ACM Transactions on Mathematical Software}}

% Values for the per-entry `comment` field.
@string{PRNNref   = {Reference from PRNN}}
@string{PRNNunref = {Unchecked reference from PRNN}}

% Publishers.
@string{MK       = {Morgan Kaufmann}}
@string{Wiley    = {Wiley}}
@string{Springer = {Springer}}


@book{Ripley.96,
  author    = {B. D. Ripley},
  title     = {Pattern Recognition and Neural Networks},
  year      = {1996},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  isbn      = {0-521-46086-7},
  comment   = PRNNref,
}

@book{Aarts.Korst.89,
  author    = {E. Aarts and J. Korst},
  title     = {Simulated Annealing and Boltzmann Machines},
  year      = {1989},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@book{Abramowitz.Stegun.65,
  author    = {M. Abramowitz and I. A. Stegun},
  title     = {Handbook of Mathematical Functions with Formulas, Graphs and
               Mathematical Tables},
  year      = {1965},
  publisher = {Dover},
  address   = {New York},
  comment   = PRNNref,
}

% Only the proper noun is brace-protected, so bibliography styles remain free
% to apply their own title casing (same treatment as Bartlett.93).
@Article{Abu-Mostafa.89,
  author =       "Y. S. Abu-Mostafa",
  title =        "The {Vapnik--Chervonenkis} dimension: information
                 versus complexity in learning",
  journal =      NC,
  volume =       "1",
  pages =        "312--317",
  year =         "1989",
  comment =      PRNNref,
}

@article{Abu-Mostafa.90,
  author  = {Y. S. Abu-Mostafa},
  title   = {Learning from hints in neural networks},
  year    = {1990},
  journal = {Journal of Complexity},
  volume  = {6},
  pages   = {192--198},
  comment = PRNNref,
}

@inproceedings{Abu-Mostafa.93,
  author   = {Y. S. Abu-Mostafa},
  title    = {A method for learning from hints},
  year     = {1993},
  pages    = {73--80},
  crossref = {NIPS5},
  comment  = PRNNref,
}

@inproceedings{Abu-Mostafa.95a,
  author    = {Y. S. Abu-Mostafa},
  title     = {Financial market applications of learning from hints},
  year      = {1995},
  editor    = {A.-P. Refenes},
  booktitle = {Neural Networks in the Capital Markets},
  pages     = {221--232},
  publisher = Wiley,
  address   = {Chichester},
  comment   = PRNNref,
}

@article{Abu-Mostafa.95b,
  author  = {Y. S. Abu-Mostafa},
  title   = {Machines that learn from hints},
  year    = {1995},
  journal = {Scientific American},
  volume  = {272},
  number  = {4},
  pages   = {64--69},
  comment = PRNNref,
}

@article{Abu-Mostafa.95c,
  author  = {Y. S. Abu-Mostafa},
  title   = {Hints},
  year    = {1995},
  journal = NC,
  volume  = {7},
  pages   = {639--671},
  comment = PRNNref,
}

@article{Ackley.ZZ.85,
  author  = {D. H. Ackley and G. E. Hinton and T. J. Sejnowski},
  title   = {A learning algorithm for {Boltzmann} machines},
  year    = {1985},
  journal = {Cognitive Science},
  volume  = {9},
  pages   = {147--169},
  note    = {[Reprinted in \cite{Anderson.Rosenfeld.88}]},
  comment = PRNNref,
}

@InProceedings{Agosta.90,
  author =       "J. M. Agosta",
  editor =       "R. D. Shachter and T. S. Levitt and L. N. Kanal and J.
                 F. Lemmer",
  booktitle =    "Uncertainty in Artificial Intelligence 4",
  title =        "The structure of {Bayes} networks for visual
                 recognition",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  pages =        "397--405",
  year =         "1990",
  comment =      PRNNref,
}

@book{Agrawala.77,
  editor    = {A. K. Agrawala},
  title     = {Machine Recognition of Patterns},
  year      = {1977},
  publisher = {IEEE Press},
  address   = {New York},
  comment   = PRNNunref,
}

@article{Aitchison.Aitken.76,
  author  = {J. Aitchison and C. G. G. Aitken},
  title   = {Multivariate binary discrimination by the kernel method},
  year    = {1976},
  journal = Bka,
  volume  = {63},
  pages   = {413--420},
  comment = PRNNref,
}

@book{Aitchison.Dunsmore.75,
  author    = {J. Aitchison and I. R. Dunsmore},
  title     = {Statistical Prediction Analysis},
  year      = {1975},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  comment   = PRNNref,
}

@article{Aitchison.ZZ.77,
  author  = {J. Aitchison and J. D. F. Habbema and J. W. Kay},
  title   = {A critical comparison of two methods of statistical discrimination},
  year    = {1977},
  journal = ApplStat,
  volume  = {26},
  pages   = {15--25},
  comment = PRNNref,
}

@InProceedings{Aitken.78,
  author =       "C. G. G. Aitken",
  editor =       "L. C. A. Corsten and J. Hermans",
  booktitle =    "Proceedings of COMPSTAT 1978",
  title =        "Methods of discrimination in multivariate binary
                 data",
  publisher =    "Physica-Verlag",
  address =      "Vienna",
  pages =        "155--161",
  year =         "1978",
  comment =      PRNNref,
}

@article{Aitken.83,
  author  = {C. G. G. Aitken},
  title   = {Kernel methods for the estimation of discrete distributions},
  year    = {1983},
  journal = {Journal of Statistical Computation and Simulation},
  volume  = {16},
  pages   = {189--200},
  comment = PRNNref,
}

@article{Aizerman.ZZ.64a,
  author  = {M. A. Aizerman and E. M. Braverman and L. I. Rozono\'er},
  title   = {Theoretical foundations of the potential function method in
             pattern recognition learning},
  year    = {1964},
  journal = AuRC,
  volume  = {25},
  pages   = {821--837},
  comment = PRNNref,
}

@article{Aizerman.ZZ.64b,
  author  = {M. A. Aizerman and E. M. Braverman and L. I. Rozono\'er},
  title   = {The probability problem of pattern recognition learning and the
             method of potential functions},
  year    = {1964},
  journal = AuRC,
  volume  = {25},
  pages   = {1175--1190},
  comment = PRNNref,
}

@Article{Aizerman.ZZ.65,
  author =       "M. A. Aizerman and E. M. Braverman and L. I.
                 Rozono\'er",
  title =        "The {Robbins--Monro} process and the method of
                 potential functions",
  journal =      AuRC,
  volume =       "26",
  pages =        "1882--1885",
  year =         "1965",
  comment =      PRNNref,
}

@InProceedings{Akaike.73,
  author =       "H. Akaike",
  editor =       "B. N. Petrov and F. Cs{\'a}ki",
  booktitle =    "Second International Symposium on Information Theory",
  title =        "Information theory and an extension of the maximum
                 likelihood principle",
  publisher =    "Akad{\'e}miai Kiad{\'o}",
  address =      "Budapest",
  pages =        "267--281",
  year =         "1973",
  note =         "Reprinted in \emph{Breakthroughs in Statistics}, eds
                 Kotz, S. \& Johnson, N. L. (1992), volume I,
                 pp.~599--624. New York: Springer.",
  comment =      PRNNunref,
}

@Article{Akaike.74,
  author =       "H. Akaike",
  title =        "A new look at the statistical model identification",
  journal =      "IEEE Transactions on Automatic Control",
  volume =       "19",
  pages =        "716--723",
  year =         "1974",
  comment =      PRNNref,
}

@inproceedings{Akaike.77,
  author    = {H. Akaike},
  title     = {On entropy maximization principle},
  year      = {1977},
  editor    = {P. R. Krishnaiah},
  booktitle = {Applications of Statistics},
  pages     = {27--42},
  publisher = {North-Holland},
  address   = {Amsterdam},
  comment   = PRNNref,
}

% Only the proper noun and the acronym are brace-protected, so bibliography
% styles remain free to apply their own title casing.
@Article{Akaike.78,
  author =       "H. Akaike",
  title =        "A {Bayesian} analysis of the minimum {AIC} procedure",
  journal =      "Annals of the Institute of Statistical Mathematics",
  volume =       "30A",
  pages =        "9--14",
  year =         "1978",
  comment =      PRNNunref,
}

@inproceedings{Akaike.85,
  author    = {H. Akaike},
  title     = {Prediction and entropy},
  year      = {1985},
  editor    = {A. C. Atkinson and S. E. Fienberg},
  booktitle = {A Celebration of Statistics. The ISI Centenary Volume},
  pages     = {1--24},
  publisher = Springer,
  address   = {New York},
  comment   = PRNNref,
}

@article{Albert.Anderson.84,
  author  = {A. Albert and J. A. Anderson},
  title   = {On the existence of maximum likelihood estimates in logistic
             regression models},
  year    = {1984},
  journal = Bka,
  volume  = {71},
  pages   = {1--10},
  comment = PRNNref,
}

@article{Albert.Lesaffre.86,
  author  = {A. Albert and E. Lesaffre},
  title   = {Multiple group logistic discrimination},
  year    = {1986},
  journal = CMwA,
  volume  = {12A},
  pages   = {209--224},
  comment = PRNNref,
}

@inproceedings{Albertini.ZZ.93,
  author   = {F. Albertini and E. D. Sontag and V. Maillot},
  title    = {Uniqueness of weights for neural networks},
  year     = {1993},
  pages    = {115--125},
  crossref = {Mammone.93},
  comment  = PRNNref,
}

@book{Aleksander.Morton.90,
  author    = {I. Aleksander and H. Morton},
  title     = {An Introduction to Neural Computing},
  year      = {1990},
  publisher = {Chapman \& Hall},
  address   = {London},
  comment   = PRNNref,
}

@article{Alexander.84,
  author  = {K. S. Alexander},
  title   = {Probability inequalities for empirical processes and a law of
             the iterated logarithm},
  year    = {1984},
  journal = {Annals of Probability},
  volume  = {12},
  pages   = {1041--1067},
  comment = PRNNref,
}

@book{Almond.95,
  author    = {R. G. Almond},
  title     = {Graphical Belief Modeling},
  year      = {1995},
  publisher = {Chapman \& Hall},
  address   = {London},
  isbn      = {0-412-06661-0},
  comment   = PRNNref,
}

@article{Amari.67,
  author  = {S.-I. Amari},
  title   = {A theory of adaptive pattern classifiers},
  year    = {1967},
  journal = IEEC,
  volume  = {16},
  pages   = {299--307},
  comment = PRNNref,
}

@inproceedings{Amari.93,
  author    = {S.-I. Amari},
  title     = {Mathematical methods of neurocomputing},
  year      = {1993},
  editor    = {O. E. Barndorff-Nielsen and J. L. Jensen and W. S. Kendall},
  booktitle = {Networks and Chaos---Statistical and Probabilistic Aspects},
  pages     = {1--39},
  publisher = {Chapman \& Hall},
  address   = {London},
  comment   = PRNNref,
}

@book{Amit.89,
  author    = {D. J. Amit},
  title     = {Modeling Brain Function. The World of Attractor Neural Networks},
  year      = {1989},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  comment   = PRNNref,
}

@book{Anderberg.73,
  author    = {M. R. Anderberg},
  title     = {Cluster Analysis for Applications},
  year      = {1973},
  publisher = {Academic Press},
  address   = {New York},
  comment   = PRNNunref,
}

@inproceedings{Andersen.ZZ.89,
  author    = {S. K. Andersen and K. G. Olesen and F. V. Jensen and F. Jensen},
  title     = {{HUGIN}---a shell for building {Bayesian} belief universes for
               expert systems},
  year      = {1989},
  editor    = {N. Sridharan},
  booktitle = {Proceedings of the 11th International Joint Conference on
               Artificial Intelligence (Detroit, MI, 1989)},
  pages     = {1080--1085},
  publisher = MK,
  address   = {San Mateo, CA},
  note      = URset,
  comment   = PRNNref,
}

@article{Anderson.72,
  author  = {J. A. Anderson},
  title   = {Separate sample logistic discrimination},
  year    = {1972},
  journal = Bka,
  volume  = {59},
  pages   = {19--35},
  comment = PRNNref,
}

@InProceedings{Anderson.82,
  author =       "J. A. Anderson",
  editor =       "P. R. Krishnaiah and L. N. Kanal",
  booktitle =    "Handbook of Statistics 2: Classification, Pattern
                 Recognition and Reduction of Dimensionality",
  title =        "Logistic discrimination",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  pages =        "169--191",
  year =         "1982",
  comment =      PRNNref,
}

@book{Anderson.84,
  author    = {T. W. Anderson},
  title     = {An Introduction to Multivariate Statistical Analysis},
  year      = {1984},
  edition   = {Second},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Anderson.Bahadur.62,
  author  = {T. W. Anderson and R. R. Bahadur},
  title   = {Classi\-fication into two multivariate normal distributions
             with different covariance matrices},
  year    = {1962},
  journal = AnnMathStat,
  volume  = {33},
  pages   = {420--431},
  comment = PRNNref,
}

@article{Anderson.Phillips.81,
  author  = {J. A. Anderson and P. R. Phillips},
  title   = {Regression, discrimination and measurement models for ordered
             categorical variables},
  year    = {1981},
  journal = ApplStat,
  volume  = {30},
  pages   = {22--31},
  comment = PRNNref,
}

@book{Anderson.Rosenfeld.88,
  editor    = {J. A. Anderson and E. Rosenfeld},
  title     = {Neurocomputing: Foundations of Research},
  year      = {1988},
  publisher = {The MIT Press},
  address   = {Cambridge, MA},
  isbn      = {0-262-01097-6},
  comment   = PRNNref,
}

@book{Anderson.ZZ.90,
  editor    = {J. A. Anderson and A. Pellionisz and E. Rosenfeld},
  title     = {Neurocomputing 2: Directions for Research},
  year      = {1990},
  publisher = {The MIT Press},
  address   = {Cambridge, MA},
  isbn      = {0-262-01119-0},
  comment   = PRNNref,
}

@article{Andreassen.ZZ.91,
  author  = {S. Andreassen and F. V. Jensen and K. G. Olesen},
  title   = {Medical expert systems based on causal probabilistic networks},
  year    = {1991},
  journal = {International Journal of Bio-medical Computing},
  volume  = {28},
  pages   = {1--30},
  comment = PRNNref,
}

@article{Angluin.88,
  author  = {D. Angluin},
  title   = {Queries and concept learning},
  year    = {1988},
  journal = ML,
  volume  = {2},
  pages   = {319--342},
  comment = PRNNref,
}

@inproceedings{Angluin.93,
  author    = {D. Angluin},
  title     = {Learning with queries},
  year      = {1993},
  editor    = {E. B. Baum},
  booktitle = {Computational Learning and Cognition},
  pages     = {1--28},
  publisher = {SIAM},
  address   = {Philadelphia},
  comment   = PRNNref,
}

% The citation key keeps its historical spelling so that existing \cite
% commands continue to resolve; the author field carries the correct surname.
@Article{Angulin.87,
  author =       "D. Angluin",
  title =        "Learning regular sets from queries and
                 counterexamples",
  journal =      InfoComp,
  volume =       "75",
  pages =        "87--106",
  year =         "1987",
  comment =      PRNNref,
}

@article{Angluin.Valiant.79,
  author  = {D. Angluin and L. G. Valiant},
  title   = {Fast probabilistic algorithms for {Hamiltonian} circuits and
             matchings},
  year    = {1979},
  journal = {Journal of Computer and System Sciences},
  volume  = {18},
  pages   = {155--193},
  comment = PRNNref,
}

@book{Anthony.Biggs.92,
  author    = {M. Anthony and N. Biggs},
  title     = {Computational Learning Theory: An Introduction},
  year      = {1992},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  comment   = PRNNref,
}

@article{Anthony.Shawe-Taylor.93,
  author  = {M. Anthony and J. Shawe-Taylor},
  title   = {A result of {Vapnik} with applications},
  year    = {1993},
  journal = {Discrete Applied Mathematics},
  volume  = {47},
  pages   = {207--217},
  note    = {[Erratum (1994) \textbf{52}, 211 (the proof of theorem 2.1 is
             corrected)]},
  comment = PRNNref,
}

@Article{Apolloni.Falco.91,
  author =       "B. Apolloni and D. de Falco",
  title =        "Learning by asymmetric parallel {Boltzmann} machines",
  journal =      NC,
  volume =       "3",
  pages =        "402--408",
  year =         "1991",
  comment =      PRNNref,
}

% `booktitle` duplicates `title`; presumably kept so that entries which
% crossref this book can inherit it -- confirm before removing.
@Book{Arbib.95,
  editor       = "M. A. Arbib",
  booktitle    = "The Handbook of Brain Theory and Neural Networks",
  title        = "The Handbook of Brain Theory and Neural Networks",
  publisher    = "The MIT Press",
  address      = "Cambridge, MA",
  year         = "1995",
  ISBN         = "0-262-01148-4",
  comment =      PRNNref,
}

@article{Argentiero.ZZ.82,
  author  = {P. Argentiero and R. Chin and P. Beaudet},
  title   = {An automated approach to the design of decision tree classifiers},
  year    = {1982},
  journal = PAMI,
  volume  = {4},
  pages   = {51--57},
  comment = PRNNref,
}

% The citation key keeps its historical spelling so that existing \cite
% commands continue to resolve; the author field carries the usual
% transliteration of the surname.
@Book{Arkedev.Braverman.66,
  author =       "A. G. Arkadev and E. M. Braverman",
  title =        "Computers and Pattern Recognition",
  publisher =    "Thompson",
  address =      "Washington, DC",
  year =         "1966",
  comment =      PRNNunref,
}

@Article{Ash.89,
  author =       "T. Ash",
  title =        "Dynamic node creation in backpropagation neural
                 networks",
  journal =      "Connection Science: Journal of Neural Computing,
                 Artificial Intelligence and Cognitive Research",
  volume =       "1",
  pages =        "365--375",
  year =         "1989",
  comment =      PRNNref,
}

@article{Asimov.85,
  author  = {D. Asimov},
  title   = {The grand tour: {A} tool for viewing multidimensional data},
  year    = {1985},
  journal = SIAMSSC,
  volume  = {6},
  pages   = {128--143},
  comment = PRNNref,
}

@article{Assouad.83,
  author  = {P. Assouad},
  title   = {Densit\'e et dimension},
  year    = {1983},
  journal = {Annales de l'Institut Fourier Grenoble},
  volume  = {33},
  pages   = {233--282},
  comment = PRNNref,
}

@article{Averintsev.75,
  author  = {M. V. Averintsev},
  title   = {{Gibbs} description of random fields whose conditional
             probabilities may vanish},
  year    = {1975},
  journal = {Problemy Peredaci Informatsii},
  volume  = {11},
  pages   = {86--96},
  comment = PRNNunref,
}

@article{Baba.ZZ.94,
  author  = {N. Baba and Y. Mogami and M. Kohzaki and Y. Shiraishi and
             Y. Yoshida},
  title   = {A hybrid algorithm for finding the global minimum of error
             function of neural networks and its applications},
  year    = {1994},
  journal = NNks,
  volume  = {7},
  pages   = {1253--1265},
  comment = PRNNref,
}

@inproceedings{Bahadur.61a,
  author    = {R. R. Bahadur},
  title     = {A representation of the joint distribution of responses to
               $n$ dichotomous items},
  year      = {1961},
  editor    = {H. Solomon},
  booktitle = {Studies in Item Analysis and Prediction},
  pages     = {158--167},
  publisher = {Stanford University Press},
  address   = {Palo Alto, CA},
  comment   = PRNNunref,
}

@inproceedings{Bahadur.61b,
  author    = {R. R. Bahadur},
  title     = {On classification based on responses to $n$ dichotomous items},
  year      = {1961},
  editor    = {H. Solomon},
  booktitle = {Studies in Item Analysis and Prediction},
  pages     = {169--176},
  publisher = {Stanford University Press},
  address   = {Palo Alto, CA},
  comment   = PRNNunref,
}

@article{Bahl.ZZ.89,
  author  = {L. R. Bahl and P. F. Brown and P. V. de Souza and R. L. Mercer},
  title   = {A tree-based statistical language model for natural language
             speech recognition},
  year    = {1989},
  journal = {IEEE Transactions on Acoustics, Speech and Signal Processing},
  volume  = {37},
  pages   = {1001--1008},
  comment = PRNNref,
}

@article{Bailey.Jain.78,
  author  = {T. Bailey and A. K. Jain},
  title   = {A note on distance-weighted $k$-nearest neighbor rules},
  year    = {1978},
  journal = SMC,
  volume  = {8},
  pages   = {311--313},
  comment = PRNNref,
}

@article{Baird.93,
  author  = {H. S. Baird},
  title   = {Recognition technology frontiers},
  year    = {1993},
  journal = PRL,
  volume  = {14},
  pages   = {327--334},
  comment = PRNNref,
}

@article{Baldi.Hornik.89,
  author  = {P. Baldi and K. Hornik},
  title   = {Neural networks and principal components analysis: learning
             from examples without local minima},
  year    = {1989},
  journal = NNks,
  volume  = {2},
  pages   = {53--58},
  note    = {[Reprinted in \cite{Anderson.ZZ.90}]},
  comment = PRNNref,
}

@InProceedings{Ball.65,
  author =       "G. H. Ball",
  booktitle =    "Proceedings of the Fall Joint Computer Conference",
  title =        "Data analysis in the social sciences: What about the
                 details?",
  publisher =    "Spartan Books",
  address =      "Washington, DC",
  pages =        "533--559",
  year =         "1965",
  comment =      PRNNunref,
}

@article{Banfield.Raftery.93,
  author  = {J. D. Banfield and A. E. Raftery},
  title   = {Model-based {Gaussian} and non-{Gaussian} clustering},
  year    = {1993},
  journal = Biom,
  volume  = {49},
  pages   = {803--821},
  comment = PRNNref,
}

@Book{Barlow.ZZ.72,
  author =       "R. E. Barlow and D. J. Bartholomew and J. M. Bremner and
                 H. D. Brunk",
  title =        "Statistical Inference under Order Restrictions. The
                 Theory and Application of Isotonic Regression",
  publisher =    Wiley,
  address =      "London",
  year =         "1972",
  comment =      PRNNref,
}

@inproceedings{Barron.90,
  author    = {A. R. Barron},
  title     = {Complexity regularization with application to artificial
               neural networks},
  year      = {1990},
  editor    = {G. Roussas},
  booktitle = {Nonparametric Functional Estimation and Related Topics},
  pages     = {561--576},
  publisher = {Kluwer Academic Publishers},
  address   = {Dordrecht},
  comment   = PRNNref,
}

@article{Barron.93,
  author  = {A. R. Barron},
  title   = {Universal approximation bounds for superpositions of a sigmoid
             function},
  year    = {1993},
  journal = IEIT,
  volume  = {39},
  pages   = {930--945},
  comment = PRNNref,
}

@article{Barron.94,
  author  = {A. R. Barron},
  title   = {Approximation and estimation bounds for artificial neural
             networks},
  year    = {1994},
  journal = ML,
  volume  = {14},
  pages   = {115--133},
  comment = PRNNref,
}

@article{Barron.Cover.91,
  author  = {A. R. Barron and T. M. Cover},
  title   = {Minimum complexity density estimation},
  year    = {1991},
  journal = IEIT,
  volume  = {37},
  pages   = {1034--1054},
  comment = PRNNref,
}

@article{Barry.86,
  author  = {D. Barry},
  title   = {Nonparametric {Bayesian} regression},
  year    = {1986},
  journal = AnnStat,
  volume  = {14},
  pages   = {934--953},
  comment = PRNNref,
}

@article{Bartlett.93,
  author  = {P. L. Bartlett},
  title   = {{Vapnik--Chervonenkis} dimension bounds for two- and
             three-layer networks},
  year    = {1993},
  journal = NC,
  volume  = {5},
  pages   = {371--373},
  comment = PRNNref,
}

@article{Bartlett.Williamson.96,
  author  = {P. L. Bartlett and R. C. Williamson},
  title   = {The {VC} dimension and pseudodimension of two-layer neural
             networks with discrete inputs},
  year    = {1996},
  journal = NC,
  volume  = {8},
  number  = {3},
  pages   = {625--628},
  comment = PRNNref,
}

@article{Basford.McLachlan.85,
  author  = {K. E. Basford and G. J. McLachlan},
  title   = {Estimation of allocation rates in a cluster analysis context},
  year    = {1985},
  journal = JASA,
  volume  = {80},
  pages   = {286--293},
  comment = PRNNref,
}

@article{Bashkirov.ZZ.64,
  author  = {O. A. Bashkirov and E. M. Braverman and I. B. Muchnik},
  title   = {Potential function algorithms for pattern recognition learning
             machines},
  year    = {1964},
  journal = AuRC,
  volume  = {25},
  pages   = {629--631},
  comment = PRNNref,
}

@book{Bates.Watts.88,
  author    = {D. M. Bates and D. G. Watts},
  title     = {Nonlinear Regression Analysis and its Applications},
  year      = {1988},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

% The ".86" suffix in the key is historical and is kept so that existing
% \cite commands continue to resolve; the year field below is 1996.
@Article{Bather.86,
  author =       "J. Bather",
  title =        "A conversation with {Herman Chernoff}",
  journal =      StatSci,
  volume =       "11",
  number =       "4",
  pages =        "335--350",
  year =         "1996",
  comment =      PRNNref,
}

@article{Battiti.89,
  author  = {R. Battiti},
  title   = {Accelerated backpropagation learning: two optimization methods},
  year    = {1989},
  month   = aug,
  journal = ComSys,
  volume  = {3},
  number  = {4},
  pages   = {331--342},
  comment = PRNNref,
}

@article{Battiti.92,
  author  = {R. Battiti},
  title   = {First- and second-order methods for learning: between steepest
             descent and {Newton}'s method},
  year    = {1992},
  journal = NC,
  volume  = {4},
  pages   = {141--166},
  comment = PRNNref,
}

% The citation key keeps its historical spelling so that existing \cite
% commands continue to resolve; the author field carries the correct surname.
@InProceedings{Battiti.Massuli.90,
  author =       "R. Battiti and F. Masulli",
  booktitle =    "Proceedings of the International Neural Network
                 Conference (Paris, 1990)",
  title =        "{BFGS} optimization for faster and automated
                 supervised learning",
  volume =       "2",
  pages =        "757--760",
  year =         "1990",
  comment =      PRNNunref,
}

@Article{Baum.88,
  author =       "E. B. Baum",
  title =        "On the capabilities of multilayer perceptrons",
  journal =      "Journal of Complexity",
  volume =       "4",
  pages =        "193--215",
  year =         "1988",
  comment =      PRNNref,
}

@article{Baum.Haussler.89,
  author  = {E. B. Baum and D. Haussler},
  title   = {What size net gives valid generalization?},
  year    = {1989},
  journal = NC,
  volume  = {1},
  pages   = {151--160},
  note    = MLset,
  comment = PRNNref,
}

@article{Baum.ZZ.70,
  author  = {L. E. Baum and T. Petrie and G. Soules and N. Weiss},
  title   = {A maximization technique occurring in the statistical analysis
             of probabilistic functions of {Markov} chains},
  year    = {1970},
  journal = AnnMathStat,
  volume  = {41},
  pages   = {164--171},
  comment = PRNNref,
}

@article{Baxt.92,
  author  = {W. G. Baxt},
  title   = {Improving the accuracy of an artificial neural network using
             multiple differently trained networks},
  year    = {1992},
  journal = NC,
  volume  = {4},
  pages   = {772--780},
  comment = PRNNref,
}

@article{Beaulieu.Goldberg.89,
  author  = {J.-M. Beaulieu and M. Goldberg},
  title   = {Hierarchy in picture segmentation: a stepwise optimization
             approach},
  year    = {1989},
  journal = PAMI,
  volume  = {11},
  pages   = {150--163},
  comment = PRNNref,
}

@article{Beeri.ZZ.83,
  author  = {C. Beeri and R. Fagin and D. Maier and M. Yannakakis},
  title   = {On the desirability of acyclic database schemes},
  year    = {1983},
  journal = {Journal of the Association for Computing Machinery},
  volume  = {30},
  pages   = {479--513},
  comment = PRNNref,
}

@article{Begg.Gray.84,
  author  = {C. B. Begg and R. Gray},
  title   = {Calculation of polychotomous logistic regression parameters
             using individualized regressions},
  year    = {1984},
  journal = Bka,
  volume  = {71},
  pages   = {11--18},
  comment = PRNNref,
}

@article{Beigi.Li.90,
  author  = {H. S. M. Beigi and C. J. Li},
  title   = {Learning algorithms for neural networks based on
             quasi-{Newton} with self-scaling},
  year    = {1990},
  journal = {Intelligent Control Systems},
  volume  = {23},
  pages   = {23--28},
  comment = PRNNunref,
}

@Article{Beigi.Li.93,
  author =       "H. S. M. Beigi and C. J. Li",
  title =        "Learning algorithms for neural networks based on
                 quasi-{Newton} with self-scaling",
  journal =      "Journal of Dynamical Systems, Measurement, and Control
                 -- Transactions of the ASME",
  volume =       "115",
  pages =        "38--43",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Benediktsson.Swain.92,
  author =       "J. A. Benediktsson and P. H. Swain",
  title =        "Consensus theoretic classification methods",
  journal =      SMC,
  volume =       "22",
  pages =        "688--704",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Berge.73,
  author =       "C. Berge",
  title =        "Graphs and Hypergraphs",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  year =         "1973",
  comment =      PRNNref,
}

@Book{Berger.85,
  author =       "J. O. Berger",
  title =        "Statistical Decision Theory and Bayesian Analysis",
  publisher =    Springer,
  address =      "New York",
  year =         "1985",
  comment =      PRNNref,
}

@Article{Berger.Delampady.87,
  author =       "J. O. Berger and M. Delampady",
  title =        "Testing precise hypotheses (with discussion)",
  journal =      StatSci,
  volume =       "2",
  pages =        "317--352",
  year =         "1987",
  comment =      PRNNref,
}

@Book{Bernardo.Smith.94,
  author =       "J. M. Bernardo and A. F. M. Smith",
  title =        "Bayesian Theory",
  publisher =    Wiley,
  address =      "Chichester",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Besag.Green.93,
  author =       "J. Besag and P. J. Green",
  title =        "Spatial statistics and {Bayesian} computation (with
                 discussion)",
  journal =      JRSSB,
  volume =       "55",
  pages =        "25--37",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Besag.ZZ.95,
  author =       "J. Besag and P. Green and D. Higdon and K. Mengersen",
  title =        "{Bayesian} computation and stochastic systems (with
                 discussion)",
  journal =      StatSci,
  volume =       "10",
  pages =        "3--66",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Best.Rayner.88,
  author =       "D. J. Best and J. C. W. Rayner",
  title =        "A test for bivariate normality",
  journal =      "Statistics and Probability Letters",
  volume =       "6",
  pages =        "407--412",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Bezdek.74,
  author =       "J. C. Bezdek",
  title =        "Cluster validity with fuzzy sets",
  journal =      "Journal of Cybernetics",
  volume =       "3",
  pages =        "58--72",
  year =         "1974",
  comment =      PRNNunref,
}

@Article{Bhattacharyya.43,
  author =       "A. Bhattacharyya",
  title =        "On a measure of divergence between two statistical
                 populations defined by their probability
                 distributions",
  journal =      "Bulletin of the Calcutta Mathematical Society",
  volume =       "35",
  pages =        "99--110",
  year =         "1943",
  comment =      PRNNunref,
}

@Article{Bichsel.Seitz.89,
  author =       "M. Bichsel and P. Seitz",
  title =        "Minimum class entropy: a maximum information approach
                 to layered networks",
  journal =      NNks,
  volume =       "2",
  pages =        "133--141",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Bienenstock.ZZ.82,
  author =       "E. Bienenstock and L. N. Cooper and W. Munro",
  title =        "Theory for the development of neuron selectivity:
                 orientation specificity and binocular interaction in
                 the visual cortex",
  journal =      "Journal of Neuroscience",
  volume =       "2",
  pages =        "32--48",
  year =         "1982",
  note =         "[Reprinted in \cite{Anderson.Rosenfeld.88}]",
  comment =      PRNNref,
}

@InProceedings{Binford.ZZ.89,
  author =       "T. O. Binford and T. S. Levitt and W. B. Mann",
  editor =       "L. N. Kanal and T. S. Levitt and J. F. Lemmer",
  booktitle =    "Uncertainty in Artificial Intelligence 3",
  title =        "{Bayesian} inference in model-based machine vision",
  publisher =    "Elsevier",
  address =      "Amsterdam",
  year =         "1989",
  comment =      PRNNunref,
}

@Article{Bishop.91,
  author =       "C. Bishop",
  title =        "Improving the generalization properties of radial
                 basis function neural networks",
  journal =      NC,
  volume =       "3",
  pages =        "579--588",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Bishop.92,
  author =       "C. Bishop",
  title =        "Exact calculation of the {Hessian} matrix for the
                 multilayer perceptron",
  journal =      NC,
  volume =       "4",
  pages =        "494--501",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Bishop.93,
  author =       "C. M. Bishop",
  title =        "Curvature-driven smoothing: a learning algorithm for
                 feedforward networks",
  journal =      TNN,
  volume =       "4",
  pages =        "882--884",
  year =         "1993",
  comment =      PRNNref,
}

@Book{Bishop.95a,
  author =       "C. M. Bishop",
  title =        "Neural Networks for Pattern Recognition",
  publisher =    "Clarendon Press",
  address =      "Oxford",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Bishop.95b,
  author =       "C. M. Bishop",
  title =        "Training with noise is equivalent to {Tikhonov}
                 regularization",
  journal =      NC,
  volume =       "7",
  pages =        "108--116",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Blair.Peyton.93,
  author =       "J. R. S. Blair and B. Peyton",
  editor =       "A. George and J. R. Gilbert and J. H. U. Liu",
  booktitle =    "Graph Theory and Sparse Matrix Computations",
  title =        "An introduction to chordal graphs and clique trees",
  publisher =    Springer,
  address =      "New York",
  pages =        "1--29",
  year =         "1993",
  comment =      PRNNunref,
}

@Article{Block.62,
  author =       "H. D. Block",
  title =        "The perceptron: a model for brain functioning {I}",
  journal =      "Reviews of Modern Physics",
  volume =       "34",
  pages =        "123--135",
  year =         "1962",
  note =         "[Reprinted in \cite{Anderson.Rosenfeld.88}]",
  comment =      PRNNref,
}

@Article{Block.Levin.70,
  author =       "H. D. Block and S. A. Levin",
  title =        "On the boundedness of an iterative procedure for
                 solving a system of linear inequalities",
  journal =      "Proceedings of the American Mathematical Society",
  volume =       "26",
  pages =        "229--235",
  year =         "1970",
  comment =      PRNNref,
}

@Article{Block.ZZ.62,
  author =       "H. D. Block and Knight, Jr., B. W. and F. Rosenblatt",
  title =        "Analysis of a four-layer series-coupled perceptron
                 {II}",
  journal =      "Reviews of Modern Physics",
  volume =       "34",
  pages =        "135--142",
  year =         "1962",
  comment =      PRNNref,
}

@Article{Blue.ZZ.94,
  author =       "J. L. Blue and G. T. Candela and P. J. Grother and C.
                 L. Wilson",
  title =        "Evaluation of pattern classifiers for fingerprint and
                 {OCR} applications",
  journal =      PR,
  volume =       "27",
  pages =        "485--501",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Blumer.ZZ.87,
  author =       "A. Blumer and A. Ehrenfeucht and D. Haussler and M. K.
                 Warmuth",
  title =        "Occam's Razor",
  journal =      "Information Processing Letters",
  volume =       "24",
  pages =        "377--380",
  year =         "1987",
  note =         MLset,
  comment =      PRNNref,
}

@Article{Blumer.ZZ.89,
  author =       "A. Blumer and A. Ehrenfeucht and D. Haussler and M. K.
                 Warmuth",
  title =        "Learnability and the {Vapnik--Chervonenkis}
                 dimension",
  journal =      "Journal of the Association for Computing Machinery",
  volume =       "36",
  pages =        "929--965",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Boor.78,
  author =       "C. de Boor",
  title =        "A Practical Guide to Splines",
  publisher =    Springer,
  address =      "New York",
  year =         "1978",
  comment =      PRNNref,
}

@Article{Bourlard.Kamp.88,
  author =       "H. Bourlard and Y. Kamp",
  title =        "Auto-association by multilayer perceptrons and
                 singular value decomposition",
  journal =      BioCyb,
  volume =       "59",
  pages =        "291--294",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Bouton.Pages.93,
  author =       "C. Bouton and G. Pag\`es",
  title =        "Self-organization of the one-dimensional {Kohonen}
                 algorithm with non-uniformly distributed stimuli",
  journal =      "Stochastic Processes and their Applications",
  volume =       "47",
  pages =        "249--274",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Bouton.Pages.94,
  author =       "C. Bouton and G. Pag\`es",
  title =        "Convergence in distribution of the one-dimensional
                 {Kohonen} algorithms when the stimuli are not uniform",
  journal =      "Advances in Applied Probability",
  volume =       "26",
  pages =        "80--103",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Box.Tiao.62,
  author =       "G. E. P. Box and G. C. Tiao",
  title =        "A further look at robustness via {Bayes's} theorem",
  journal =      Bka,
  volume =       "49",
  pages =        "419--432",
  year =         "1962",
  comment =      PRNNref,
}

@Book{Box.Tiao.73,
  author =       "G. E. P. Box and G. C. Tiao",
  title =        "{Bayesian} Inference in Statistical Analysis",
  publisher =    Wiley,
  address =      "New York",
  year =         "1973",
  note =         "[Formerly Reading, MA: Addison-Wesley]",
  comment =      PRNNref,
}

@Book{Box.ZZ.78,
  author =       "G. E. P. Box and W. G. Hunter and J. S. Hunter",
  title =        "Statistics for Experimenters: An Introduction to
                 Design, Data Analysis and Model Building",
  publisher =    Wiley,
  address =      "New York",
  year =         "1978",
  comment =      PRNNref,
}

@Article{Boyles.83,
  author =       "R. A. Boyles",
  title =        "On the convergence of the {EM} algorithm",
  journal =      JRSSB,
  volume =       "45",
  pages =        "47--50",
  year =         "1983",
  comment =      PRNNref,
}

@InProceedings{Bratko.Kononenko.87,
  author =       "I. Bratko and I. Kononenko",
  editor =       "B. Phelps",
  booktitle =    "Interactions in Artificial Intelligence and
                 Statistical Methods",
  title =        "Learning diagnostic rules from incomplete and noisy
                 data",
  publisher =    "Gower Technical Press",
  address =      "Aldershot",
  pages =        "142--153",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Bratko.Muggleton.95,
  author =       "I. Bratko and S. Muggleton",
  title =        "Applications of inductive logic programming",
  journal =      "Communications of the Association for Computing
                 Machinery",
  volume =       "38",
  number =       "11",
  pages =        "65--70",
  year =         "1995",
}

@Article{Braverman.65,
  author =       "E. M. Braverman",
  title =        "On the method of potential functions",
  journal =      AuRC,
  volume =       "26",
  pages =        "2130--2138",
  year =         "1965",
  comment =      PRNNref,
}

@Article{Breiman.91,
  author =       "L. Breiman",
  title =        "The {$\Pi$}-method for estimating multivariate
                 functions from noisy data (with discussion)",
  journal =      Techno,
  volume =       "33",
  pages =        "125--160",
  year =         "1991",
  comment =      PRNNref,
}

@TechReport{Breiman.92,
  author =       "L. Breiman",
  title =        "Stacked regressions",
  number =       "367",
  institution =  "Dept of Statistics, University of California,
                 Berkeley",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Breiman.93,
  author =       "L. Breiman",
  title =        "Hinging hyperplanes for regression, classification and
                 function approximation",
  journal =      IEIT,
  volume =       "39",
  pages =        "999--1013",
  year =         "1993",
  comment =      PRNNref,
}

@TechReport{Breiman.Ihaka.84,
  author =       "L. Breiman and R. Ihaka",
  title =        "Nonlinear discriminant analysis via {ACE} and
                 scaling",
  number =       "40",
  institution =  "Dept of Statistics, University of California,
                 Berkeley",
  year =         "1984",
  comment =      PRNNref,
}

@Book{Breiman.ZZ.84,
  author =       "L. Breiman and J. H. Friedman and R. A. Olshen and C.
                 J. Stone",
  title =        "Classification and Regression Trees",
  publisher =    "Wadsworth and Brooks/Cole",
  address =      "Monterey, CA",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Brent.91,
  author =       "R. P. Brent",
  title =        "Fast training algorithms for multi\-layer neural
                 nets",
  journal =      TNN,
  volume =       "2",
  pages =        "346--354",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Bridle.90a,
  author =       "J. S. Bridle",
  editor =       "F. {Fogelman Souli\'e} and J. H\'erault",
  booktitle =    "Neuro-computing: Algorithms, Architectures and
                 Applications",
  title =        "Probabilistic interpretation of feedforward
                 classification network outputs, with relationships to
                 statistical pattern recognition",
  publisher =    Springer,
  address =      "Berlin",
  pages =        "227--236",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Bridle.90b,
  author =       "J. S. Bridle",
  title =        "Training stochastic model recognition algorithms as
                 networks can lead to maximum mutual information
                 estimation of parameters",
  crossref =     "NIPS2",
  pages =        "211--217",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Bridle.Cox.91,
  author =       "J. S. Bridle and S. J. Cox",
  title =        "{RecNorm}: simultaneous normalisation and classification
                 applied to speech recognition",
  crossref =     "NIPS3",
  pages =        "234--240",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Brier.50,
  author =       "G. W. Brier",
  title =        "Verification of forecasts expressed in terms of
                 probabilities",
  journal =      "Monthly Weather Review",
  volume =       "78",
  pages =        "1--3",
  year =         "1950",
  comment =      PRNNunref,
}

@Article{Brockett.91,
  author =       "R. W. Brockett",
  title =        "Dynamical systems that sort lists, diagonalize
                 matrices and solve linear programming problems",
  journal =      "Linear Algebra and its Applications",
  volume =       "146",
  pages =        "79--91",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Broffit.ZZ.80,
  author =       "B. Broffit and W. R. Clarke and P. A. Lachenbruch",
  title =        "The effect of {Huberizing} and trimming on the
                 quadratic discriminant function",
  journal =      CSTM,
  volume =       "A9",
  pages =        "13--25",
  year =         "1980",
  comment =      PRNNref,
}

@Article{Bronowski.Long.51,
  author =       "J. Bronowski and W. M. Long",
  title =        "Statistical methods in anthropology",
  journal =      Nat,
  volume =       "168",
  pages =        "794",
  year =         "1951",
  comment =      PRNNref,
}

@Article{Broomhead.Lowe.88,
  author =       "D. S. Broomhead and D. Lowe",
  title =        "Multivariable functional interpolation and adaptive
                 networks",
  journal =      ComSys,
  volume =       "2",
  pages =        "321--355",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Brown.Koplowitz.79,
  author =       "T. A. Brown and J. Koplowitz",
  title =        "The weighted nearest neighbor rule for class dependent
                 sample sizes",
  journal =      IEIT,
  volume =       "25",
  pages =        "617--619",
  year =         "1979",
  comment =      PRNNref,
}

@Article{Brown.Rundell.85,
  author =       "P. J. Brown and P. W. K. Rundell",
  title =        "Kernel estimates for categorical data",
  journal =      Techno,
  volume =       "27",
  pages =        "293--299",
  year =         "1985",
  comment =      PRNNref,
}

@Article{Bryan.51,
  author =       "J. G. Bryan",
  title =        "The generalized discriminant function: mathematical
                 foundations and computational routine",
  journal =      "Harvard Educational Review",
  volume =       "21",
  pages =        "90--95",
  year =         "1951",
  comment =      PRNNunref,
}

@Article{Bryant.89,
  author =       "J. Bryant",
  title =        "A fast classifier for image data",
  journal =      PR,
  volume =       "22",
  pages =        "45--48",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Bryson.Ho.69,
  author =       "A. E. Bryson and Y.-C. Ho",
  title =        "Applied Optimal Control",
  publisher =    "Blaisdell",
  address =      "New York",
  year =         "1969",
  note =         "[Revised printing New York: Hemisphere, 1975]",
  comment =      PRNNref,
}

@Article{Buckland.92a,
  author =       "S. T. Buckland",
  title =        "Fitting density functions with polynomials",
  journal =      ApplStat,
  volume =       "41",
  pages =        "63--76",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Buckland.92b,
  author =       "S. T. Buckland",
  title =        "Algorithm {AS270}. Maximum likelihood fitting of
                 {Hermite} and simple polynomial densities",
  journal =      ApplStat,
  volume =       "41",
  pages =        "241--266",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Buckley.94,
  author =       "A. G. Buckley",
  title =        "Algorithm 734: {A} {Fortran} 90 code for
                 unconstrained nonlinear minimization",
  journal =      TOMS,
  volume =       "20",
  pages =        "354--372",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Buntine.92,
  author =       "W. L. Buntine",
  title =        "Learning classification trees",
  journal =      StatComp,
  volume =       "2",
  pages =        "63--73",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Buntine.Weigend.91,
  author =       "W. L. Buntine and A. S. Weigend",
  title =        "{Bayesian} back-propagation",
  journal =      ComSys,
  volume =       "5",
  pages =        "603--643",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Buntine.Weigend.94,
  author =       "W. L. Buntine and A. S. Weigend",
  title =        "Calculating second derivatives on feed-forward
                 networks: a review",
  journal =      TNN,
  volume =       "5",
  pages =        "480--488",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Burrascano.91,
  author =       "P. Burrascano",
  title =        "Learning vector quantization for the probabilistic
                 neural network",
  journal =      TNN,
  volume =       "2",
  pages =        "458--461",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Byrd.ZZ.94,
  author =       "R. H. Byrd and J. Nocedal and R. B. Schnabel",
  title =        "Representations of quasi-{Newton} matrices and their
                 use in limited memory methods",
  journal =      MathProg,
  volume =       "63",
  pages =        "129--156",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Byth.McLachlan.78,
  author =       "K. Byth and G. J. McLachlan",
  title =        "The biases associated with maximum likelihood methods
                 of estimation of the multivariate logistic risk
                 function",
  journal =      CSTM,
  volume =       "A7",
  pages =        "877--890",
  year =         "1978",
  comment =      PRNNref,
}

@Article{Cacoullos.66,
  author =       "T. Cacoullos",
  title =        "Estimation of a multivariate density",
  journal =      "Annals of the Institute of Statistical Mathematics",
  volume =       "18",
  pages =        "179--189",
  year =         "1966",
  comment =      PRNNunref,
}

@Article{Campbell.80a,
  author =       "N. A. Campbell",
  title =        "Shrunken estimators in discriminant and canonical
                 variate analysis",
  journal =      ApplStat,
  volume =       "29",
  pages =        "5--14",
  year =         "1980",
  comment =      PRNNref,
}

@Article{Campbell.80b,
  author =       "N. A. Campbell",
  title =        "Robust procedures in multivariate analysis {I}\@.
                 Robust covariance estimation",
  journal =      ApplStat,
  volume =       "29",
  pages =        "231--237",
  year =         "1980",
  comment =      PRNNref,
}

@Article{Campbell.82,
  author =       "N. A. Campbell",
  title =        "Robust procedures in multivariate analysis {II}\@.
                 Robust canonical variate analysis",
  journal =      ApplStat,
  volume =       "31",
  pages =        "1--8",
  year =         "1982",
  comment =      PRNNref,
}

@Article{Campbell.Mahon.74,
  author =       "N. A. Campbell and R. J. Mahon",
  title =        "A multivariate study of variation in two species of
                 rock crab of genus \emph{Leptograpsus}",
  journal =      "Australian Journal of Zoology",
  volume =       "22",
  pages =        "417--425",
  year =         "1974",
  comment =      PRNNref,
}

@TechReport{Candela.Chellappa.93,
  author =       "G. T. Candela and R. Chellappa",
  title =        "Comparative performance of classification methods for
                 fingerprints",
  number =       "NISTIR 5163",
  institution =  "US National Institute of Standards and Technology",
  year =         "1993",
  comment =      PRNNref,
}

@Book{Cannings.Thompson.81,
  author =       "C. Cannings and E. A. Thompson",
  title =        "Genealogical and Genetic Structure",
  publisher =    "Cambridge University Press",
  address =      "Cambridge",
  year =         "1981",
  comment =      PRNNref,
}

@Article{Cannings.ZZ.78,
  author =       "C. Cannings and E. A. Thompson and M. H. Skolnick",
  title =        "Probability functions on complex pedigrees",
  journal =      "Advances in Applied Probability",
  volume =       "10",
  pages =        "26--61",
  year =         "1978",
  comment =      PRNNref,
}

@Book{Carbonell.90,
  editor =       "J. G. Carbonell",
  title =        "Machine Learning: Paradigms and Methods",
  publisher =    "The MIT Press",
  address =      "Cambridge, MA",
  year =         "1990",
  ISBN =         "0-262-53088-0",
  comment =      PRNNref,
}

@Article{Carpenter.Grossberg.87a,
  author =       "G. A. Carpenter and S. Grossberg",
  title =        "A massively parallel architecture for a
                 self-organizing neural pattern recognition machine",
  journal =      "Computer Vision, Graphics, and Image Processing",
  volume =       "37",
  pages =        "54--115",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Carpenter.Grossberg.87b,
  author =       "G. A. Carpenter and S. Grossberg",
  title =        "{ART} 2: self-organization of stable category
                 recognition codes for analog input patterns",
  journal =      "Applied Optics",
  volume =       "26",
  pages =        "4919--4930",
  year =         "1987",
  note =         "[Reprinted in \cite{Anderson.ZZ.90}]",
  comment =      PRNNref,
}

@Article{Carpenter.Grossberg.90,
  author =       "G. A. Carpenter and S. Grossberg",
  title =        "{ART} 3: hierarchical search using chemical
                 transmitters in self-organizing pattern recognition
                 architectures",
  journal =      NNks,
  volume =       "3",
  pages =        "129--152",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Carpenter.Grossberg.94,
  author =       "G. A. Carpenter and S. Grossberg",
  title =        "Self-organizing neural networks for supervised and
                 unsupervised learning and prediction",
  crossref =     "Cherkassky.ZZ.94",
  pages =        "319--348",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Carpenter.ZZ.91a,
  author =       "G. A. Carpenter and S. Grossberg and J. H. Reynolds",
  title =        "{ARTMAP}: supervised real-time learning and
                 classification of nonstationary data by a
                 self-organizing neural network",
  journal =      NNks,
  volume =       "4",
  pages =        "565--588",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Carpenter.ZZ.91b,
  author =       "G. A. Carpenter and S. Grossberg and D. B. Rosen",
  title =        "Fuzzy {ART}: fast stable learning and categorization
                 of analog patterns by an adaptive resonance system",
  journal =      NNks,
  volume =       "4",
  pages =        "759--771",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Carpenter.ZZ.92,
  author =       "G. A. Carpenter and S. Grossberg and N. Markuzon and
                 J. H. Reynolds and D. B. Rosen",
  title =        "Fuzzy {ARTMAP}: a neural network architecture for
                 incremental supervised learning of analog
                 multi\-dimensional maps",
  journal =      TNN,
  volume =       "3",
  pages =        "698--713",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Carroll.Dickinson.89,
  author =       "S. M. Carroll and B. W. Dickinson",
  booktitle =    "Proceedings of the International Joint Conference on
                 Neural Networks (Washington, DC, 1989)",
  title =        "Construction of neural nets using the {Radon}
                 transform",
  volume =       "I",
  publisher =    "IEEE Press",
  address =      "New York",
  pages =        "607--611",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Carter.Catlett.87,
  author =       "C. Carter and J. Catlett",
  title =        "Assessing credit card applications using machine
                 learning",
  journal =      "IEEE Expert",
  volume =       "2",
  number =       "3",
  pages =        "71--79",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Casey.Nagy.84,
  author =       "R. G. Casey and G. Nagy",
  title =        "Decision tree design using a probabilistic model",
  journal =      IEIT,
  volume =       "30",
  pages =        "93--99",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Celeux.Diebolt.92,
  author =       "G. Celeux and J. Diebolt",
  title =        "A stochastic approximation type {EM} algorithm for the
                 mixture problem",
  journal =      "Stochastics and Stochastics Reports",
  volume =       "41",
  pages =        "119--134",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Cestnik.ZZ.87,
  author =       "B. Cestnik and I. Kononenko and I. Bratko",
  editor =       "I. Bratko and N. Lavra{\v c}",
  booktitle =    "Progress in Machine Learning",
  title =        "\hbox{ASSISTANT} 86: a knowledge-elicitation tool for
                 sophisticated users",
  publisher =    "Sigma Press",
  address =      "Wilmslow",
  pages =        "31--45",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Chan.93,
  author =       "K. S. Chan",
  title =        "Asymptotic behaviour of the {Gibbs} sampler",
  journal =      JASA,
  volume =       "88",
  pages =        "320--326",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Chan.Bao.91,
  author =       "C. Chan and J. Bao",
  title =        "On the design of a tree classifier and its application
                 to speech recognition",
  journal =      IJPRAI,
  volume =       "5",
  pages =        "677--692",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Chandran.94,
  author =       "P. S. Chandran",
  title =        "Comments on ``{Comparative} analysis of
                 backpropagation and the extended {Kalman} filter for
                 training multilayer perceptrons''",
  journal =      PAMI,
  volume =       "16",
  pages =        "862--863",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Chang.74,
  author =       "C. L. Chang",
  title =        "Finding prototypes for nearest neighbor classifiers",
  journal =      IEC,
  volume =       "23",
  pages =        "1179--1184",
  year =         "1974",
  note =         NNset,
  comment =      PRNNref,
}

@Article{Charniak.91,
  author =       "E. Charniak",
  title =        "{Bayesian} networks without tears",
  journal =      "AI Magazine",
  volume =       "12",
  number =       "4",
  pages =        "50--63",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Chauvin.89,
  author =       "Y. Chauvin",
  title =        "A back-propagation algorithm with optimal use of
                 hidden units",
  crossref =     "NIPS1",
  pages =        "519--526",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Chavez.Cooper.90,
  author =       "R. M. Chavez and G. F. Cooper",
  title =        "A randomized approximation algorithm for probabilistic
                 inference on {Bayesian} belief networks",
  journal =      Nks,
  volume =       "20",
  pages =        "661--685",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Cheeseman.95,
  author =       "P. Cheeseman",
  title =        "On {Bayesian} model selection",
  crossref =     "Wolpert.95",
  pages =        "315--330",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Cheeseman.ZZ.88a,
  author =       "P. Cheeseman and J. Kelly and M. Self and J. Stutz and
                 W. Taylor and D. Freeman",
  booktitle =    "Proceedings of the Fifth International Workshop on
                 Machine Learning, Ann Arbor",
  title =        "{AutoClass}: a {Bayesian} classification system",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "54--64",
  year =         "1988",
  comment =      PRNNunref,
}

@InProceedings{Cheeseman.ZZ.88b,
  author =       "P. Cheeseman and M. Self and J. Kelly and W. Taylor
                 and D. Freeman and J. Stutz",
  editor =       "R. G. Smith and T. M. Mitchell",
  booktitle =    "Proceedings of the Seventh AAAI National Conference on
                 Artificial Intelligence, St Paul, MN",
  title =        "{Bayesian} classification",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "607--611",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Chen.Jain.94,
  author =       "D. S. Chen and R. C. Jain",
  title =        "A robust back propagation learning algorithm for
                 function approximation",
  journal =      TNN,
  volume =       "5",
  pages =        "467--479",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Chen.ZZ.91,
  author =       "S. Chen and C. F. N. Cowan and P. M. Grant",
  title =        "Orthogonal least squares learning algorithm for radial
                 basis function networks",
  journal =      TNN,
  volume =       "2",
  pages =        "302--309",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Cheng.ZZ.92,
  author =       "Y.-Q. Cheng and Y.-M. Zhuang and J.-Y. Yang",
  title =        "Optimal {Fisher} discriminant analysis using the rank
                 decomposition",
  journal =      PR,
  volume =       "25",
  pages =        "101--111",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Cherkassky.Mulier.94,
  author =       "V. Cherkassky and F. Mulier",
  title =        "Self-organizing networks for nonparametric
                 regression",
  crossref =     "Cherkassky.ZZ.94",
  pages =        "188--212",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Chernick.ZZ.85,
  author =       "M. R. Chernick and V. K. Murthy and C. D. Nealy",
  title =        "Application of bootstrap and other re\-sampling
                 techniques: evaluation of classifier performance",
  journal =      PRL,
  volume =       "3",
  pages =        "167--178",
  year =         "1985",
  comment =      PRNNref,
}

@Article{Chernoff.52,
  author =       "H. Chernoff",
  title =        "A measure of asymptotic efficiency for tests of a
                 hypothesis based on the sum of observations",
  journal =      AnnMathStat,
  volume =       "23",
  pages =        "493--507",
  year =         "1952",
  comment =      PRNNref,
}

@InProceedings{Chernoff.73,
  author =       "H. Chernoff",
  editor =       "P. R. Krishnaiah",
  booktitle =    "Multivariate Analysis III",
  title =        "Some measures for discriminating between normal
                 multivariate distributions with unequal covariance
                 matrices",
  publisher =    "Academic Press",
  address =      "New York",
  pages =        "337--344",
  year =         "1973",
  comment =      PRNNunref,
}

@Article{ChidanandaGowda.Krishna.79,
  author =       "K. Chidananda Gowda and G. Krishna",
  title =        "The condensed nearest neighbor rule using the concept
                 of mutual nearest neighborhood",
  journal =      IEIT,
  volume =       "25",
  pages =        "488--490",
  year =         "1979",
  note =         NNset,
  comment =      PRNNref,
}

@InProceedings{Chou.89,
  author =       "P. A. Chou",
  editor =       "W. A. Pearlman",
  booktitle =    "Visual Communications and Image Processing IV",
  title =        "Recognition of equations using a two-dimensional
                 stochastic context-free grammar",
  volume =       "1199",
  pages =        "852--863",
  year =         "1989",
  series =       "SPIE Proceedings Series",
  comment =      PRNNref,
}

@Article{Chou.91,
  author =       "P. A. Chou",
  title =        "Optimal partitioning for classification and regression
                 trees",
  journal =      PAMI,
  volume =       "13",
  pages =        "340--354",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Chou.Chen.92,
  author =       "W.-S. Chou and Y.-C. Chen",
  title =        "A new fast algorithm for the effective training of
                 neural classifiers",
  journal =      PR,
  volume =       "25",
  pages =        "423--429",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Chow.70,
  author =       "C. K. Chow",
  title =        "On optimum recognition error and reject tradeoff",
  journal =      IEIT,
  volume =       "16",
  pages =        "41--46",
  year =         "1970",
  comment =      PRNNref,
}

@Article{Chow.Liu.68,
  author =       "C. K. Chow and C. N. Liu",
  title =        "Approximating discrete probability distributions with
                 dependence trees",
  journal =      IEIT,
  volume =       "14",
  pages =        "462--467",
  year =         "1968",
  comment =      PRNNref,
}

@InProceedings{Ciampi.ZZ.87,
  author =       "A. Ciampi and C.-H. Chang and S. Hogg and S. McKinney",
  editor =       "I. B. MacNeill and G. J. Umphrey",
  booktitle =    "Biostatistics",
  title =        "Recursive partition: a versatile method for
                 exploratory data analysis in biostatistics",
  publisher =    "Reidel",
  address =      "Dordrecht",
  pages =        "23--50",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Clark.Niblett.89,
  author =       "P. Clark and T. Niblett",
  title =        "The {CN2} induction algorithm",
  journal =      ML,
  volume =       "3",
  pages =        "261--283",
  year =         "1989",
  comment =      PRNNref,
}

@InCollection{Clark.Pregibon.92,
  author =       "L. A. Clark and D. Pregibon",
  title =        "Tree-based models",
  crossref =     "Chambers.Hastie.92",
  chapter =      "9",
  year =         "1992",
  comment =      PRNNref,
}

@InCollection{Cleveland.ZZ.92,
  author =       "W. S. Cleveland and E. Grosse and W. M. Shyu",
  title =        "Local regression models",
  crossref =     "Chambers.Hastie.92",
  chapter =      "8",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Clifford.90,
  author =       "P. Clifford",
  editor =       "G. R. Grimmett and D. J. A. Welsh",
  booktitle =    "Disorder in Physical Systems. A Volume in Honour of
                 John M. Hammersley",
  title =        "{Markov} random fields in statistics",
  publisher =    "Clarendon Press",
  address =      "Oxford",
  pages =        "19--32",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Clunies-Ross.Riffenburgh.60,
  author =       "C. W. Clunies-Ross and R. H. Riffenburgh",
  title =        "Geometry and linear discrimination",
  journal =      Bka,
  volume =       "47",
  pages =        "185--189",
  year =         "1960",
  comment =      PRNNref,
}

@Article{Cohen.ZZ.91,
  author =       "E. Cohen and J. J. Hull and S. N. Srihari",
  title =        "\hbox{Understanding} handwritten text in a structured
                 environment: determining {ZIP} codes from addresses",
  journal =      IJPRAI,
  volume =       "5",
  pages =        "221--264",
  year =         "1991",
  comment =      PRNNunref,
}

@Article{Cohn.Tesauro.92,
  author =       "D. Cohn and G. Tesauro",
  title =        "How tight are the {Vapnik--Chervonenkis} bounds?",
  journal =      NC,
  volume =       "4",
  pages =        "249--269",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Cook.ZZ.93,
  author =       "D. Cook and A. Buja and J. Cabrera",
  title =        "Projection pursuit indices based on orthonormal
                 function expansions",
  journal =      JCGS,
  volume =       "2",
  pages =        "225--250",
  year =         "1993",
  comment =      PRNNref,
}

@Book{Coomans.Broeckaert.86,
  author =       "D. Coomans and I. Broeckaert",
  title =        "Potential Pattern Recognition in Chemical and Medical
                 Decision Making",
  publisher =    "Research Studies Press",
  address =      "Letchworth",
  year =         "1986",
  comment =      PRNNref,
}

@PhdThesis{Cooper.84,
  author =       "G. F. Cooper",
  title =        "{NESTOR}: {A} Computer-based Medical Diagnostic Aid
                 that Integrates Causal and Probabilistic Knowledge",
  school =       "Dept of Computer Science, Stanford University",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Cooper.89,
  author =       "G. F. Cooper",
  title =        "Current research directions in the development of
                 expert systems based on belief networks",
  journal =      "Applied Stochastic Models and Data Analysis",
  volume =       "5",
  pages =        "39--52",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Cooper.90,
  author =       "G. F. Cooper",
  title =        "The computational complexity of probabilistic
                 inference using {Bayesian} belief networks",
  journal =      AI,
  volume =       "42",
  pages =        "393--405",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Cooper.Herskovits.92,
  author =       "G. F. Cooper and E. Herskovits",
  title =        "A {Bayesian} method for the induction of probabilistic
                 networks from data",
  journal =      ML,
  volume =       "9",
  pages =        "309--347",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Cormen.ZZ.90,
  author =       "T. H. Cormen and C. E. Leiserson and R. L. Rivest",
  title =        "Introduction to Algorithms",
  publisher =    "The MIT Press and New York: McGraw-Hill",
  address =      "Cambridge MA",
  year =         "1990",
  ISBN =         "0-262-03141-8",
  comment =      PRNNref,
}

@Article{Cortes.Vapnik.95,
  author       = "C. Cortes and V. Vapnik",
  title        = "Support-vector networks",
  journal      = ML,
  volume       = "20",
  pages        = "273--297",
  year         = "1995",
  comment =      PRNNunref,
}

@Article{Cosslett.81,
  author =       "S. R. Cosslett",
  title =        "Maximum likelihood estimators for choice-based
                 samples",
  journal =      "Econometrica",
  volume =       "49",
  pages =        "1289--1316",
  year =         "1981",
  comment =      PRNNref,
}

@Article{Cottrell.Fort.87,
  author =       "M. Cottrell and J. C. Fort",
  title =        "Etude d'un algorithme d'auto-organisation",
  journal =      "Annales de l'Institut Henri Poincar\'e",
  volume =       "23",
  pages =        "1--20",
  year =         "1987",
  comment =      PRNNunref,
}

@InProceedings{Cottrell.Metcalfe.91,
  author =       "G. W. Cottrell and J. Metcalfe",
  title =        "{EMPATH}: face, emotion and gender recognition using
                 holons",
  crossref =     "NIPS3",
  pages =        "564--571",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Cover.65,
  author =       "T. M. Cover",
  title =        "Geometrical and statistical properties of systems of
                 linear inequalities with applications in pattern
                 recognition",
  journal =      IEEC,
  volume =       "14",
  pages =        "326--334",
  year =         "1965",
  comment =      PRNNref,
}

@InProceedings{Cover.68,
  author =       "T. M. Cover",
  booktitle =    "Proceedings of the First Annual Hawaii Conference on
                 Systems Theory, Honolulu",
  title =        "Rates of convergence of nearest neighbor procedures",
  pages =        "413--418",
  year =         "1968",
  comment =      PRNNunref,
}

@InProceedings{Cover.69,
  author =       "T. M. Cover",
  editor =       "S. Watanabe",
  booktitle =    "Methodologies of Pattern Recognition",
  title =        "Learning in pattern recognition",
  publisher =    "Academic Press",
  address =      "New York",
  pages =        "111--132",
  year =         "1969",
  comment =      PRNNref,
}

@Article{Cover.Hart.67,
  author =       "T. M. Cover and P. E. Hart",
  title =        "Nearest neighbor pattern classification",
  journal =      IEIT,
  volume =       "13",
  pages =        "21--27",
  year =         "1967",
  note =         "[Reprinted in \cite{Anderson.ZZ.90}, \cite{Dasarathy.91} and
                 \cite{Lau.92}]",
  comment =      PRNNref,
}

@InProceedings{Cowell.92,
  author =       "R. G. Cowell",
  editor =       "J. M. Bernardo and J. O. Berger and A. P. Dawid and A.
                 F. M. Smith",
  booktitle =    "Bayesian Statistics 4",
  title =        "{BAIES}---a probabilistic expert reasoning shell with
                 qualitative and quantitative learning",
  publisher =    "Clarendon Press",
  address =      "Oxford",
  pages =        "595--600",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Cowell.95,
  author =       "R. G. Cowell",
  title =        "A {C}++ class library for building {Bayesian} belief
                 networks",
  crossref =     "Gammerman.95",
  pages =        "159--165",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Cowell.Dawid.92,
  author =       "R. G. Cowell and A. P. Dawid",
  title =        "Fast retraction of evidence in a probabilistic expert
                 system",
  journal =      StatComp,
  volume =       "2",
  pages =        "37--40",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Cox.58,
  author =       "D. R. Cox",
  title =        "Two further applications of a model for binary
                 regression",
  journal =      Bka,
  volume =       "45",
  pages =        "562--565",
  year =         "1958",
  comment =      PRNNref,
}

@Book{Cox.Cox.94,
  author =       "T. F. Cox and M. A. A. Cox",
  title =        "Multidimensional Scaling",
  publisher =    "Chapman \& Hall",
  address =      "London",
  year =         "1994",
  comment =      PRNNref,
}

@Book{Cox.Hinkley.74,
  author =       "D. R. Cox and D. V. Hinkley",
  title =        "Theoretical Statistics",
  publisher =    "Chapman \& Hall",
  address =      "London",
  year =         "1974",
  comment =      PRNNref,
}

@Book{Cox.Snell.89,
  author =       "D. R. Cox and E. J. Snell",
  title =        "Analysis of Binary Data",
  publisher =    "Chapman \& Hall",
  address =      "London",
  edition =      "Second",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Craven.Wahba.79,
  author =       "P. Craven and G. Wahba",
  title =        "Smoothing noisy data with spline functions: estimating
                 the correct degree of smoothing by the method of
                 generalized cross-validation",
  journal =      "Numerische Mathematik",
  volume =       "31",
  pages =        "377--403",
  year =         "1979",
  comment =      PRNNunref,
}

@Article{Crawford.89,
  author =       "S. L. Crawford",
  title =        "Extensions to the {CART} algorithm",
  journal =      "International Journal of Man--Machine Studies",
  volume =       "31",
  pages =        "197--217",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Crevier.93,
  author =       "D. Crevier",
  title =        "{AI}\@. The Tumultuous History of the Search for
                 Artificial Intelligence",
  publisher =    "Basic Books",
  address =      "New York",
  year =         "1993",
  comment =      PRNNref,
}

@TechReport{Cybenko.88,
  author =       "G. Cybenko",
  title =        "Continuous valued neural networks with two hidden
                 layers are sufficient",
  institution =  "Dept of Computer Science, Tufts University",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Cybenko.89,
  author =       "G. Cybenko",
  title =        "Approximation by superpositions of a sigmoidal
                 function",
  journal =      "Mathematics of Control, Signals, and Systems",
  volume =       "2",
  pages =        "303--314",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Darken.Moody.91,
  author =       "C. Darken and J. Moody",
  title =        "Note on learning rate schedules for stochastic
                 optimization",
  crossref =     "NIPS3",
  pages =        "832--838",
  year =         "1991",
  comment =      PRNNref,
}

@Book{Dasarathy.91,
  editor =       "B. V. Dasarathy",
  title =        "Nearest Neighbor ({NN}) Norms: {NN} Pattern
                 Classification Techniques",
  publisher =    "IEEE Computer Society Press",
  address =      "Los Alamitos, CA",
  year =         "1991",
  comment =      PRNNunref,
}

@Article{Dattatreya.Sarma.81,
  author =       "G. R. Dattatreya and V. V. S. Sarma",
  title =        "{Bayesian} and decision tree approaches for pattern
                 recognition including feature measurement costs",
  journal =      PAMI,
  volume =       "3",
  pages =        "293--298",
  year =         "1981",
  comment =      PRNNref,
}

@InProceedings{Dattatreya.Sarma.85,
  author =       "G. R. Dattatreya and V. V. S. Sarma",
  editor =       "L. N. Kanal and A. Rosenfeld",
  booktitle =    "Progress in Pattern Recognition 2",
  title =        "Decision trees in pattern recognition",
  publisher =    "Elsevier",
  address =      "Amsterdam",
  year =         "1985",
  comment =      PRNNunref,
}

@Article{Dawid.76,
  author =       "A. P. Dawid",
  title =        "Properties of diagnostic data distributions",
  journal =      Biom,
  volume =       "32",
  pages =        "647--658",
  year =         "1976",
  comment =      PRNNref,
}

@Article{Dawid.79,
  author =       "A. P. Dawid",
  title =        "Conditional independence in statistical theory (with
                 discussion)",
  journal =      JRSSB,
  volume =       "41",
  pages =        "1--31",
  year =         "1979",
  comment =      PRNNref,
}

@Article{Dawid.80,
  author =       "A. P. Dawid",
  title =        "Conditional independence for statistical operations",
  journal =      AnnStat,
  volume =       "8",
  pages =        "598--617",
  year =         "1980",
  comment =      PRNNref,
}

@Article{Dawid.82,
  author =       "A. P. Dawid",
  title =        "The well-calibrated {Bayesian} (with discussion)",
  journal =      JASA,
  volume =       "77",
  pages =        "605--613",
  year =         "1982",
  comment =      PRNNref,
}

@InProceedings{Dawid.86,
  author =       "A. P. Dawid",
  editor =       "S. Kotz and N. L. Johnson and C. B. Read",
  booktitle =    "Encyclopedia of Statistical Sciences",
  title =        "Probability forecasting",
  publisher =    Wiley,
  address =      "New York",
  pages =        "210--218",
  year =         "1986",
  volume =       "7",
  comment =      PRNNref,
}

@Article{Dawid.92,
  author =       "A. P. Dawid",
  title =        "Applications of a general propagation algorithm for
                 probabilistic expert systems",
  journal =      StatComp,
  volume =       "2",
  pages =        "25--36",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Dawid.Lauritzen.93,
  author =       "A. P. Dawid and S. L. Lauritzen",
  title =        "Hyper {Markov} laws in the statistical analysis of
                 decomposable graphical models",
  journal =      AnnStat,
  volume =       "21",
  pages =        "1272--1317",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Deely.Lindley.81,
  author =       "J. J. Deely and D. V. Lindley",
  title =        "Bayes empirical {Bayes}",
  journal =      JASA,
  volume =       "76",
  pages =        "833--841",
  year =         "1981",
  comment =      PRNNref,
}

@InProceedings{DeMers.Cottrell.93,
  author =       "D. DeMers and G. Cottrell",
  title =        "Non-linear dimensionality reduction",
  crossref =     "NIPS5",
  pages =        "580--587",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Dempster.Kong.88,
  author =       "A. P. Dempster and A. Kong",
  title =        "Uncertain evidence and artificial analysis",
  journal =      "Journal of Statistical Planning and Inference",
  volume =       "20",
  pages =        "355--368",
  year =         "1988",
  note =         URset,
  comment =      PRNNref,
}

@Article{Dempster.ZZ.77,
  author =       "A. P. Dempster and N. M. Laird and D. B. Rubin",
  title =        "Maximum likelihood from incomplete data via the {EM}
                 algorithm (with discussion)",
  journal =      JRSSB,
  volume =       "39",
  pages =        "1--38",
  year =         "1977",
  comment =      PRNNref,
}

@Book{Dennis.Schnabel.83,
  author =       "J. E. Dennis and R. B. Schnabel",
  title =        "Numerical Methods for Unconstrained Optimization and
                 Nonlinear Equations",
  publisher =    "Prentice-Hall",
  address =      "Englewood Cliffs, NJ",
  year =         "1983",
  comment =      PRNNunref,
}

@Book{Devijver.Kittler.82,
  author =       "P. A. Devijver and J. V. Kittler",
  title =        "Pattern Recognition. {A} Statistical Approach",
  publisher =    "Prentice-Hall",
  address =      "Englewood Cliffs, NJ",
  year =         "1982",
  comment =      PRNNref,
}

@Book{Devijver.Kittler.87,
  editor =       "P. A. Devijver and J. V. Kittler",
  title =        "Pattern Recognition Theory and Applications",
  publisher =    Springer,
  address =      "Berlin",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Devlin.ZZ.81,
  author =       "S. J. Devlin and R. Gnanadesikan and J. R.
                 Kettenring",
  title =        "Robust estimation of dispersion matrices and principal
                 components",
  journal =      JASA,
  volume =       "76",
  pages =        "354--362",
  year =         "1981",
  comment =      PRNNref,
}

@Article{DeVore.ZZ.89,
  author =       "R. A. DeVore and R. Howard and C. A. Micchelli",
  title =        "Optimal nonlinear approximation",
  journal =      "Manuscripta Mathematica",
  volume =       "63",
  pages =        "469--478",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Devroye.81a,
  author =       "L. Devroye",
  title =        "On the inequality of {Cover} and {Hart} in nearest
                 neighbor discrimination",
  journal =      PAMI,
  volume =       "3",
  pages =        "75--78",
  year =         "1981",
  comment =      PRNNref,
}

@Article{Devroye.81b,
  author =       "L. Devroye",
  title =        "On the almost everywhere convergence of nonparametric
                 regression function estimates",
  journal =      AnnStat,
  volume =       "9",
  pages =        "1310--1319",
  year =         "1981",
  comment =      PRNNref,
}

@Article{Devroye.82,
  author =       "L. Devroye",
  title =        "Bounds for the uniform deviation of empirical
                 measures",
  journal =      "Journal of Multivariate Analysis",
  volume =       "12",
  pages =        "72--79",
  year =         "1982",
  comment =      PRNNunref,
}

@Article{Devroye.88,
  author =       "L. Devroye",
  title =        "Automatic pattern recognition: a study of the
                 probability of error",
  journal =      PAMI,
  volume =       "10",
  pages =        "530--543",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Diaconis.Freedman.84,
  author =       "P. Diaconis and D. Freedman",
  title =        "Asymptotics of graphical projection pursuit",
  journal =      AnnStat,
  volume =       "12",
  pages =        "793--815",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Diaconis.Shahshahani.84,
  author =       "P. Diaconis and M. Shahshahani",
  title =        "On non-linear functions of linear combinations",
  journal =      SIAMSSC,
  volume =       "5",
  pages =        "175--191",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Diebolt.Robert.94,
  author =       "J. Diebolt and C. P. Robert",
  title =        "Estimation of finite mixture distributions through
                 {Bayesian} sampling",
  journal =      JRSSB,
  volume =       "56",
  pages =        "363--375",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Dietterich.90,
  author =       "T. G. Dietterich",
  title =        "Machine learning",
  journal =      "Annual Review of Computer Science",
  volume =       "4",
  pages =        "255--306",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Dietterich.Bakiri.91,
  author =       "T. G. Dietterich and G. Bakiri",
  editor =       "Dean, T. L. and McKeown, K.",
  booktitle =    "Proceedings of the Ninth AAAI National Conference on
                 Artificial Intelligence",
  title =        "Error-correcting output codes: a general method for
                 improving multiclass inductive learning programs",
  publisher =    "AAAI Press",
  address =      "Menlo Park, CA",
  pages =        "572--577",
  year =         "1991",
  note =         "[An identical paper appears as pp.~395--407 of
                 \cite{Wolpert.95}]",
  comment =      PRNNref,
}

@Article{Dietterich.Bakiri.95,
  author =       "T. G. Dietterich and G. Bakiri",
  title =        "Solving multiclass learning problems via
                 error-correcting output codes",
  journal =      "Journal of Artificial Intelligence Research",
  volume =       "2",
  pages =        "263--286",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Diggle.Hall.86,
  author =       "P. J. Diggle and P. Hall",
  title =        "The selection of terms in an orthogonal series density
                 estimator",
  journal =      JASA,
  volume =       "81",
  pages =        "230--233",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Donoho.Johnstone.89,
  author =       "D. L. Donoho and I. M. Johnstone",
  title =        "Projection-based approximation and a duality with
                 kernel methods",
  journal =      AnnStat,
  volume =       "17",
  pages =        "58--106",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Doyle.73,
  author =       "P. Doyle",
  title =        "The use of automatic interaction detector and similar
                 search procedures",
  journal =      "Operational Research Quarterly",
  volume =       "24",
  pages =        "465--467",
  year =         "1973",
  comment =      PRNNunref,
}

@Article{Doyle.Fenwick.75,
  author =       "P. Doyle and I. Fenwick",
  title =        "The pitfalls of {AID} analysis",
  journal =      "Journal of Marketing Research",
  volume =       "12",
  pages =        "408--413",
  year =         "1975",
  comment =      PRNNunref,
}

@Article{Draper.95,
  author =       "D. Draper",
  title =        "Assessment and propagation of model uncertainty (with
                 discussion)",
  journal =      JRSSB,
  volume =       "57",
  pages =        "45--97",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Duchon.77,
  author =       "J. Duchon",
  editor =       "W. Schempp and K. Zeller",
  booktitle =    "Constructive Theory of Functions of Several
                 Variables",
  title =        "Splines minimizing rotation-invariant semi-norms in
                 {Sobolev} spaces",
  volume =       "571",
  pages =        "85--100",
  year =         "1977",
  series =       "Lecture Notes in Mathematics",
  comment =      PRNNref,
}

@Book{Duda.Hart.73,
  author =       "R. O. Duda and P. E. Hart",
  title =        "Pattern Classification and Scene Analysis",
  publisher =    Wiley,
  address =      "New York",
  year =         "1973",
  comment =      PRNNref,
}

@Article{Dudani.76,
  author =       "S. A. Dudani",
  title =        "The distance-weighted $k$-nearest-neighbor rule",
  journal =      SMC,
  volume =       "6",
  pages =        "325--327",
  year =         "1976",
  note =         NNset,
  comment =      PRNNref,
}

@Article{Dunn.74,
  author =       "J. C. Dunn",
  title =        "A fuzzy relative of the {ISODATA} process and its use
                 in detecting compact well-separated clusters",
  journal =      "Journal of Cybernetics",
  volume =       "3",
  pages =        "32--57",
  year =         "1974",
  comment =      PRNNunref,
}

@InProceedings{Dyn.87,
  author =       "N. Dyn",
  editor =       "C. K. Chui and L. L. Schumaker and F. I. Utreras",
  booktitle =    "Topics in Multivariate Approximation",
  title =        "Interpolation of scattered data by radial functions",
  publisher =    "Academic Press",
  address =      "New York",
  year =         "1987",
  comment =      PRNNunref,
}

@Article{Eaton.Oliver.92,
  author =       "H. A. C. Eaton and T. L. Oliver",
  title =        "Learning coefficient dependence on training set size",
  journal =      NNks,
  volume =       "5",
  pages =        "283--288",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Edwards.90,
  author =       "D. Edwards",
  title =        "Hierarchical interaction models (with discussion)",
  journal =      JRSSB,
  volume =       "52",
  pages =        "3--20",
  year =         "1990",
  comment =      PRNNref,
}

@Book{Edwards.95,
  author       = "Edwards, D.",
  title        = "Introduction to Graphical Modelling",
  publisher    = "Springer",
  year         = "1995",
  comment =      PRNNref,
}

@Article{Edwards.Havarnek.85,
  author =       "D. Edwards and T. Havr{\'a}nek",
  title =        "A fast procedure for model-search in multidimensional
                 contingency tables",
  journal =      Bka,
  volume =       "72",
  pages =        "339--351",
  year =         "1985",
  comment =      PRNNref,
}

@Article{Efron.75,
  author =       "B. Efron",
  title =        "The efficiency of logistic regression compared to
                 normal discriminant analysis",
  journal =      JASA,
  volume =       "70",
  pages =        "892--898",
  year =         "1975",
  comment =      PRNNref,
}

@Article{Efron.79,
  author =       "B. Efron",
  title =        "Bootstrap methods: another look at the jackknife",
  journal =      AnnStat,
  volume =       "7",
  pages =        "1--26",
  year =         "1979",
  comment =      PRNNref,
}

@Book{Efron.82,
  author =       "B. Efron",
  title =        "The Jackknife, the Bootstrap and Other Resampling
                 Plans",
  publisher =    "SIAM",
  address =      "Philadelphia",
  year =         "1982",
  comment =      PRNNref,
}

@Article{Efron.83,
  author =       "B. Efron",
  title =        "Estimating the error rate of a prediction rule.
                 Improvements on cross-validation",
  journal =      JASA,
  volume =       "78",
  pages =        "316--331",
  year =         "1983",
  comment =      PRNNref,
}

@Article{Efron.86,
  author =       "B. Efron",
  title =        "How biased is the apparent error rate of a prediction
                 rule?",
  journal =      JASA,
  volume =       "81",
  pages =        "461--470",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Efron.Gong.83,
  author =       "B. Efron and G. Gong",
  title =        "A leisurely look at the bootstrap, the jackknife, and
                 cross-validation",
  journal =      "American Statistician",
  volume =       "37",
  pages =        "36--48",
  year =         "1983",
  comment =      PRNNref,
}

@Book{Efron.Tibshirani.93,
  author =       "B. Efron and R. J. Tibshirani",
  title =        "An Introduction to the Bootstrap",
  publisher =    "Chapman \& Hall",
  address =      "New York",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Ehrenfeucht.ZZ.89,
  author =       "A. Ehrenfeucht and D. Haussler and M. Kearns and L.
                 Valiant",
  title =        "A general lower bound on the number of examples needed
                 for learning",
  journal =      InfoComp,
  volume =       "82",
  pages =        "247--261",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Eisenberger.64,
  author =       "I. Eisenberger",
  title =        "Genesis of bimodal distributions",
  journal =      Techno,
  volume =       "6",
  pages =        "357--363",
  year =         "1964",
  comment =      PRNNref,
}

@Article{Eriksen.87,
  author =       "P. S. Eriksen",
  title =        "Proportionality of covariances",
  journal =      AnnStat,
  volume =       "15",
  pages =        "732--748",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Erwin.ZZ.92,
  author =       "E. Erwin and K. Obermayer and K. Schulten",
  title =        "Self-organizing maps: ordering, convergence properties
                 and energy functions",
  journal =      BioCyb,
  volume =       "67",
  pages =        "47--55",
  year =         "1992",
  comment =      PRNNref,
}

@PhdThesis{Eslava.89,
  author =       "G. Eslava-G\'omez",
  title =        "Projection Pursuit and Other Graphical Methods for
                 Multivariate Data",
  type =         "{D.~Phil.} thesis",
  school =       "University of Oxford",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Eslava.Marriott.94,
  author =       "G. Eslava and F. H. C. Marriott",
  title =        "Some criteria for projection pursuit",
  journal =      StatComp,
  volume =       "4",
  pages =        "13--20",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Evans.Swartz.95,
  author =       "M. Evans and T. Swartz",
  title =        "Methods for approximating integrals in statistics with
                 special emphasis on {Bayesian} integration problems",
  journal =      StatSci,
  volume =       "10",
  pages =        "254--272",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Fagin.77,
  author =       "R. Fagin",
  title =        "Multivalued dependencies and a new normal form for relational
                 databases",
  journal =      "ACM Transactions on Database Systems",
  volume =       "2",
  pages =        "262--278",
  year =         "1977",
  comment =      PRNNref,
}

% Paper in the proceedings of the 1988 Connectionist Models Summer School
% (city name in the booktitle spelt "Pittsburgh").
@InProceedings{Fahlman.89,
  author =       "S. E. Fahlman",
  editor =       "D. Touretzky and G. Hinton and T. Sejnowski",
  booktitle =    "Proceedings of the 1988 Connectionist Models Summer
                 School, Pittsburgh",
  title =        "Faster-learning variations on back-propagation: an
                 empirical study",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "38--51",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Fahlman.Lebiere.90,
  author = {S. E. Fahlman and C. Lebiere},
  title = {The cascade-correlation learning architecture},
  pages = {524--532},
  year = {1990},
  crossref = {NIPS2},
  comment = PRNNref,
}

@InProceedings{Fauquet.ZZ.88,
  author = {C. Fauquet and D. Desbois and D. Fargette and G. Vidal},
  title = {Classification of furoviruses based on the amino acid composition of their coat proteins},
  editor = {J. I. Cooper and M. J. C. Asher},
  booktitle = {Viruses with Fungal Vectors},
  publisher = {Association of Applied Biologists},
  address = {Edinburgh},
  pages = {19--38},
  year = {1988},
  comment = PRNNref,
}

@Article{Fayyad.Irani.92,
  author = {U. M. Fayyad and K. B. Irani},
  title = {On the handling of continuous-valued attributes in decision tree generation},
  journal = ML,
  volume = {8},
  pages = {87--102},
  year = {1992},
  comment = PRNNref,
}

@InProceedings{Fefferman.Markel.94,
  author = {C. Fefferman and S. Markel},
  title = {Recovering a feed-forward network from its output},
  pages = {335--342},
  year = {1994},
  crossref = {NIPS6},
  comment = PRNNref,
}

@Article{Feldman.85,
  author = {J. A. Feldman},
  title = {Connectionist models and their applications: introduction},
  journal = {Cognitive Science},
  volume = {9},
  pages = {1--2},
  year = {1985},
  comment = PRNNunref,
}

@Article{Fienberg.Holland.73,
  author = {S. E. Fienberg and P. W. Holland},
  title = {Simultaneous estimation of multinomial cell probabilities},
  journal = JASA,
  volume = {68},
  pages = {683--691},
  year = {1973},
  comment = PRNNref,
}

% Third author's surname is spelt with a double "n" (Zimmermann).
@Article{Finnoff.ZZ.93,
  author =       "W. Finnoff and F. Hergert and H. G. Zimmermann",
  title =        "Improving model selection by nonconvergent methods",
  journal =      NNks,
  volume =       "6",
  pages =        "771--783",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Fisher.36,
  author = {R. A. Fisher},
  title = {The use of multiple measurements in taxonomic problems},
  journal = {Annals of Eugenics},
  volume = {7},
  pages = {179--188},
  year = {1936},
  comment = PRNNref,
}

% Technical report; the note field lists where it was later published.
% The issuing school was located at Randolph Field, Texas.
@TechReport{Fix.Hodges.51,
  author =       "E. Fix and J. L. Hodges",
  title =        "Discriminatory analysis---nonparametric
                 discrimination: consistency properties",
  type =         "Report no.{}",
  number =       "4",
  institution =  "US Air Force School of Aviation Medicine, Randolph
                 Field, Texas",
  year =         "1951",
  note =         "[Published in Agrawala (1977), Silverman and Jones
                 (1989) and Dasarathy (1991)]",
  comment =      PRNNref,
}

@InProceedings{Flanagan.ZZ.89,
  author = {J. K. Flanagan and D. R. Morrell and R. L. Frost and C. J. Read and B. E. Nelson},
  title = {Vector quantization codebook generation using simulated annealing},
  booktitle = {Proceedings of the International Conference on Acoustics, Speech and Signal Processing (Glasgow, May 1989)},
  year = {1989},
  comment = PRNNunref,
}

@Book{Fleiss.81,
  author = {J. L. Fleiss},
  title = {Statistical Methods for Rates and Proportions},
  edition = {Second},
  publisher = Wiley,
  address = {New York},
  year = {1981},
  comment = PRNNref,
}

@Book{Fletcher.87,
  author = {R. Fletcher},
  title = {Practical Methods of Optimization},
  publisher = Wiley,
  address = {Chichester},
  year = {1987},
  comment = PRNNref,
}

@Article{Flocchini.ZZ.92,
  author = {P. Flocchini and F. Gardin and G. Mauri and M. P. Pensini and P. Stofella},
  title = {Combining image processing operators and neural networks in a face recognition system},
  journal = IJPRAI,
  volume = {6},
  pages = {447--467},
  year = {1992},
  comment = PRNNref,
}

@Article{Flury.86,
  author = {B. Flury},
  title = {Proportionality of $k$ covariance matrices},
  journal = {Statistics and Probability Letters},
  volume = {4},
  pages = {29--33},
  year = {1986},
  comment = PRNNref,
}

% Third author's surname is Narayanan.
@Article{Flury.ZZ.94,
  author =       "B. Flury and M. J. Schmid and A. Narayanan",
  title =        "Error rates in quadratic discrimination with
                 constraints on the covariance matrices",
  journal =      "Journal of Classification",
  volume =       "11",
  pages =        "101--120",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Forgy.65,
  author = {E. W. Forgy},
  title = {Cluster analysis of multivariate data: efficiency vs interpretability of classifications},
  journal = Biom,
  volume = {21},
  pages = {768--769},
  year = {1965},
  comment = PRNNref,
}

% French-language note. Accented letters are written as braced BibTeX special
% characters; the journal name uses the plural "Comptes Rendus".
% NOTE(review): first author's initials changed to J.-C. -- confirm against the paper.
@Article{Fort.Pages.93,
  author =       "J.-C. Fort and G. Pag{\`e}s",
  title =        "Sur la convergence \emph{p.s.} de l'algorithme de
                 {Kohonen} g{\'e}n{\'e}ralis{\'e}",
  journal =      "Note aux Comptes Rendus de l'Acad{\'e}mie des Sciences de
                 Paris",
  volume =       "317",
  number =       "S{\'e}rie I",
  pages =        "389--394",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Frank.Friedman.93,
  author = {I. E. Frank and J. H. Friedman},
  title = {A statistical view of some chemometrics regression tools (with discussion)},
  journal = Techno,
  volume = {35},
  pages = {109--148},
  year = {1993},
  comment = PRNNref,
}

@Book{Fraser.68,
  author = {D. A. S. Fraser},
  title = {The Structure of Inference},
  publisher = Wiley,
  address = {New York},
  year = {1968},
  comment = PRNNunref,
}

@Article{Frean.90,
  author = {M. Frean},
  title = {The upstart algorithm: {A} method for constructing and training feedforward neural networks},
  journal = NC,
  volume = {2},
  number = {2},
  pages = {198--209},
  year = {1990},
  comment = PRNNref,
}

@Book{Freedman.71,
  author = {D. Freedman},
  title = {{Markov} Chains},
  publisher = {Holden-Day},
  address = {San Francisco},
  year = {1971},
  comment = PRNNref,
}

@Article{Friedman.77,
  author = {J. H. Friedman},
  title = {A recursive partitioning decision rule for nonparametric classification},
  journal = IEC,
  volume = {26},
  pages = {404--408},
  year = {1977},
  comment = PRNNref,
}

@TechReport{Friedman.84,
  author = {J. H. Friedman},
  title = {{SMART} users' guide},
  institution = {Laboratory for Computational Statistics, Dept of Statistics, Stanford University},
  number = {1},
  year = {1984},
  comment = PRNNref,
}

@Article{Friedman.87,
  author = {J. H. Friedman},
  title = {Exploratory projection pursuit},
  journal = JASA,
  volume = {82},
  pages = {249--266},
  year = {1987},
  comment = PRNNref,
}

@Article{Friedman.89,
  author = {J. H. Friedman},
  title = {Regularized discriminant analysis},
  journal = JASA,
  volume = {84},
  pages = {165--175},
  year = {1989},
  comment = PRNNref,
}

@Article{Friedman.91,
  author = {J. H. Friedman},
  title = {Multivariate adaptive regression splines (with discussion)},
  journal = AnnStat,
  volume = {19},
  pages = {1--141},
  year = {1991},
  comment = PRNNref,
}

@Article{Friedman.Rubin.67,
  author = {H. P. Friedman and J. Rubin},
  title = {Some invariant criteria for grouping data},
  journal = JASA,
  volume = {62},
  pages = {1159--1178},
  year = {1967},
  comment = PRNNref,
}

@Article{Friedman.Silverman.89,
  author = {J. H. Friedman and B. W. Silverman},
  title = {Flexible parsimonious smoothing and additive modeling (with discussion)},
  journal = Techno,
  volume = {31},
  pages = {3--39},
  year = {1989},
  comment = PRNNref,
}

@Article{Friedman.Stuetzle.81,
  author = {J. H. Friedman and W. Stuetzle},
  title = {Projection pursuit regression},
  journal = JASA,
  volume = {76},
  pages = {817--823},
  year = {1981},
  comment = PRNNref,
}

@Article{Friedman.Tukey.74,
  author = {J. H. Friedman and J. W. Tukey},
  title = {A projection pursuit algorithm for exploratory data analysis},
  journal = IEC,
  volume = {23},
  pages = {881--890},
  year = {1974},
  comment = PRNNref,
}

@Article{Friedman.ZZ.75,
  author = {J. H. Friedman and F. Baskett and L. J. Shustek},
  title = {An algorithm for finding nearest neighbors},
  journal = IEC,
  volume = {24},
  pages = {1000--1006},
  year = {1975},
  comment = PRNNref,
}

@Article{Friedman.ZZ.77,
  author = {J. H. Friedman and J. L. Bentley and R. A. Finkel},
  title = {An algorithm for finding best matches in logarithmic expected time},
  journal = TOMS,
  volume = {3},
  pages = {209--226},
  year = {1977},
  comment = PRNNref,
}

@Article{Friedman.ZZ.84,
  author = {J. H. Friedman and W. Stuetzle and A. Schroeder},
  title = {Projection pursuit density estimation},
  journal = JASA,
  volume = {79},
  pages = {599--608},
  year = {1984},
  comment = PRNNref,
}

% Publisher's city is Englewood Cliffs, NJ.
@Book{Fu.82,
  author =       "K.-S. Fu",
  title =        "Syntactic Pattern Recognition and Applications",
  publisher =    "Prentice Hall",
  address =      "Englewood Cliffs, NJ",
  year =         "1982",
  comment =      PRNNunref,
}

@Book{Fukunaga.90,
  author = {K. Fukunaga},
  title = {Introduction to Statistical Pattern Recognition},
  edition = {Second},
  publisher = {Academic Press},
  address = {Boston},
  year = {1990},
  note = {[First edition, 1972]},
  comment = PRNNref,
}

@Article{Fukunaga.Flick.84,
  author = {K. Fukunaga and T. E. Flick},
  title = {An optimal global nearest neighbor metric},
  journal = PAMI,
  volume = {6},
  pages = {314--318},
  year = {1984},
  note = NNset,
  comment = PRNNref,
}

@Article{Fukunaga.Flick.85,
  author = {K. Fukunaga and T. E. Flick},
  title = {The $2$-{NN} rule for more accurate {NN} risk estimation},
  journal = PAMI,
  volume = {7},
  pages = {107--112},
  year = {1985},
  comment = PRNNref,
}

@Article{Fukunaga.Hummels.87a,
  author = {K. Fukunaga and D. M. Hummels},
  title = {Bias of nearest neighbor error estimates},
  journal = PAMI,
  volume = {9},
  pages = {103--112},
  year = {1987},
  note = NNset,
  comment = PRNNref,
}

% "Parzen" is a proper noun and is brace-protected, like "Bayes", so that
% sentence-casing bibliography styles do not lowercase it.
@Article{Fukunaga.Hummels.87b,
  author =       "K. Fukunaga and D. M. Hummels",
  title =        "{Bayes} error estimation using {Parzen} and $k$-{NN}
                 procedures",
  journal =      PAMI,
  volume =       "9",
  pages =        "634--643",
  year =         "1987",
  note =         NNset,
  comment =      PRNNref,
}

@Article{Fukunaga.Kessell.71,
  author = {K. Fukunaga and D. L. Kessell},
  title = {Estimation of classification error},
  journal = IEC,
  volume = {20},
  pages = {1521--1527},
  year = {1971},
  comment = PRNNref,
}

@Article{Fukunaga.Mantock.84,
  author = {K. Fukunaga and J. M. Mantock},
  title = {Nonparametric data reduction},
  journal = PAMI,
  volume = {6},
  pages = {115--118},
  year = {1984},
  comment = PRNNref,
}

@Article{Fukunaga.Narendra.75,
  author = {K. Fukunaga and P. M. Narendra},
  title = {A branch and bound algorithm for computing $k$-nearest neighbors},
  journal = IEC,
  volume = {24},
  pages = {750--753},
  year = {1975},
  comment = PRNNref,
}

@Article{Funahashi.89,
  author = {K. Funahashi},
  title = {On the approximate realization of continuous mappings by neural networks},
  journal = NNks,
  volume = {2},
  pages = {183--192},
  year = {1989},
  comment = PRNNref,
}

@InProceedings{Fung.Crawford.90,
  author = {R. M. Fung and S. L. Crawford},
  title = {Constructor: a system for induction of probabilistic models},
  editor = {Dietterich, T. and Swartout, W.},
  booktitle = {Proceedings, Eighth AAAI National Conference on Artificial Intelligence (Boston, 1990)},
  publisher = {AAAI Press},
  address = {Menlo Park, CA},
  pages = {762--769},
  year = {1990},
  comment = PRNNref,
}

@Article{Furman.Lindsay.94,
  author = {W. Furman and B. Lindsay},
  title = {Testing for the number of components in a mixture of normal distributions using moment estimators},
  journal = CSDA,
  volume = {17},
  pages = {473--492},
  year = {1994},
  comment = PRNNunref,
}

@Article{Furnival.Wilson.74,
  author = {G. M. Furnival and Wilson, Jr., R. W.},
  title = {Regressions by leaps and bounds},
  journal = Techno,
  volume = {16},
  pages = {499--511},
  year = {1974},
  comment = PRNNref,
}

@Article{Gader.ZZ.91,
  author = {P. Gader and B. Forester and M. Ganzberger and A. Gillies and B. Mitchell and M. Whalen and T. Yocum},
  title = {Recognition of handwritten digits using template and model matching},
  journal = PR,
  volume = {24},
  pages = {421--431},
  year = {1991},
  comment = PRNNref,
}

@Article{Gallant.90,
  author = {S. I. Gallant},
  title = {Perceptron-based learning algorithms},
  journal = TNN,
  volume = {1},
  pages = {179--191},
  year = {1990},
  comment = PRNNref,
}

@Book{Gallant.93,
  author = {S. I. Gallant},
  title = {Neural Network Learning and Expert Systems},
  publisher = {The MIT Press},
  address = {Cambridge, MA},
  year = {1993},
  ISBN = {0-262-07145-2},
  comment = PRNNref,
}

@InProceedings{Gammerman.ZZ.95,
  author = {A. Gammerman and Z. Luo and C. G. G. Aitken and M. J. Brewer},
  title = {Exact and approximate algorithms and their implementations in mixed graphical models},
  pages = {33--53},
  year = {1995},
  crossref = {Gammerman.95},
  comment = PRNNref,
}

@Book{Garey.Johnson.79,
  author = {M. R. Garey and D. S. Johnson},
  title = {Computers and Intractability: {A} Guide to the Theory of {NP}-completeness},
  publisher = {Freeman},
  address = {New York},
  year = {1979},
  comment = PRNNref,
}

@Article{Gates.72,
  author = {G. W. Gates},
  title = {The reduced nearest neighbor rule},
  journal = IEIT,
  volume = {18},
  pages = {431--433},
  year = {1972},
  comment = PRNNref,
}

@InProceedings{Geiger.Pearl.90,
  author = {D. Geiger and J. Pearl},
  title = {On the logic of causal models},
  editor = {R. D. Shachter and T. S. Levitt and L. N. Kanal and J. F. Lemmer},
  booktitle = {Uncertainty in Artificial Intelligence 4},
  publisher = {North-Holland},
  address = {Amsterdam},
  pages = {3--14},
  year = {1990},
  comment = PRNNref,
}

@Article{Geiger.Pearl.93,
  author = {D. Geiger and J. Pearl},
  title = {Logical and algorithmic properties of conditional independence and graphical models},
  journal = AnnStat,
  volume = {21},
  pages = {2001--2021},
  year = {1993},
  comment = PRNNref,
}

@Article{Geiger.ZZ.90,
  author = {D. Geiger and T. Verma and J. Pearl},
  title = {Recognizing independence in {Bayesian} networks},
  journal = Nks,
  volume = {20},
  pages = {507--534},
  year = {1990},
  comment = PRNNref,
}

@Article{Geisser.64,
  author = {S. Geisser},
  title = {Posterior odds for multivariate normal classifications},
  journal = JRSSB,
  volume = {26},
  pages = {69--76},
  year = {1964},
  comment = PRNNref,
}

@InProceedings{Geisser.66,
  author = {S. Geisser},
  title = {Predictive discrimination},
  editor = {P. R. Krishnaiah},
  booktitle = {Multivariate Analysis},
  publisher = {Academic Press},
  address = {New York},
  pages = {149--163},
  year = {1966},
  comment = PRNNunref,
}

@Article{Geisser.75,
  author = {S. Geisser},
  title = {The predictive sample reuse method with applications},
  journal = JASA,
  volume = {70},
  pages = {320--328},
  year = {1975},
  comment = PRNNref,
}

@Article{Geisser.84,
  author = {S. Geisser},
  title = {On prior distributions for binary trials (with discussion)},
  journal = {American Statistician},
  volume = {38},
  pages = {244--251},
  year = {1984},
  comment = PRNNref,
}

@Article{Geisser.87,
  author = {S. Geisser},
  title = {Comment on \cite{Hodges.87}},
  journal = StatSci,
  volume = {2},
  pages = {277--279},
  year = {1987},
  comment = PRNNref,
}

@Book{Geisser.93,
  author = {S. Geisser},
  title = {Predictive Inference: An Introduction},
  publisher = {Chapman \& Hall},
  address = {New York},
  year = {1993},
  comment = PRNNref,
}

@Article{Geisser.Cornfield.63,
  author = {S. Geisser and J. Cornfield},
  title = {Posterior distributions for multivariate normal parameters},
  journal = JRSSB,
  volume = {25},
  pages = {368--376},
  year = {1963},
  comment = PRNNref,
}

@InProceedings{Gelfand.Delp.91,
  author = {S. B. Gelfand and E. J. Delp},
  title = {On tree structured classifiers},
  pages = {51--70},
  year = {1991},
  crossref = {Sethi.Jain.91},
  comment = PRNNref,
}

@Article{Gelfand.Dey.94,
  author = {A. E. Gelfand and D. K. Dey},
  title = {{Bayes} model choice: asymptotics and exact calculations},
  journal = JRSSB,
  volume = {56},
  pages = {501--514},
  year = {1994},
  comment = PRNNref,
}

@Article{Gelfand.Mitter.91,
  author = {S. B. Gelfand and S. K. Mitter},
  title = {Recursive stochastic algorithms for global optimization in $\mathbb{R}^d$},
  journal = {SIAM Journal on Control and Optimization},
  volume = {29},
  pages = {999--1018},
  year = {1991},
  comment = PRNNref,
}

@Article{Gelfand.Smith.90,
  author = {A. E. Gelfand and A. F. M. Smith},
  title = {Sampling-based approaches to calculating marginal densities},
  journal = JASA,
  volume = {85},
  pages = {398--409},
  year = {1990},
  comment = PRNNref,
}

@Article{Gelfand.ZZ.90,
  author = {A. E. Gelfand and S. E. Hills and A. Racine-Poon and A. F. M. Smith},
  title = {Illustration of {Bayesian} inference in normal data models using {Gibbs} sampling},
  journal = JASA,
  volume = {85},
  pages = {972--985},
  year = {1990},
  comment = PRNNref,
}

@Article{Gelfand.ZZ.91,
  author = {S. B. Gelfand and C. S. Ravishankar and E. J. Delp},
  title = {An iterative growing and pruning algorithm for classification tree design},
  journal = PAMI,
  volume = {13},
  pages = {163--174},
  year = {1991},
  comment = PRNNref,
}

@Book{Gelman.ZZ.95,
  author = {A. Gelman and J. B. Carlin and H. S. Stern and D. B. Rubin},
  title = {{Bayesian} Data Analysis},
  publisher = {Chapman \& Hall},
  address = {New York},
  year = {1995},
  comment = PRNNref,
}

@InProceedings{Geman.90,
  author = {D. Geman},
  title = {Random fields and inverse problems in imaging},
  editor = {P. L. Hennequin},
  booktitle = {\'Ecole d'\'Et\'e de Probabilit\'es de Saint-Flour XVIII -- 1988},
  series = {Lecture Notes in Mathematics},
  volume = {1427},
  pages = {113--193},
  year = {1990},
  comment = PRNNref,
}

@Article{Geman.Geman.84,
  author = {S. Geman and D. Geman},
  title = {Stochastic relaxation, {Gibbs} distributions and the {Bayesian} restoration of images},
  journal = PAMI,
  volume = {6},
  pages = {721--741},
  year = {1984},
  note = URset,
  comment = PRNNref,
}

@Article{Geman.Hwang.82,
  author = {S. Geman and C.-R. Hwang},
  title = {Nonparametric maximum likelihood estimation by the method of sieves},
  journal = AnnStat,
  volume = {10},
  pages = {401--414},
  year = {1982},
  comment = PRNNref,
}

@Article{Geman.ZZ.92,
  author = {S. Geman and E. Bienenstock and R. Doursat},
  title = {Neural networks and the bias/variance dilemma},
  journal = NC,
  volume = {4},
  pages = {1--58},
  year = {1992},
  comment = PRNNref,
}

% Title is stored as plain data: the hard-coded \hbox around "selection"
% was a line-breaking hack and belongs in the document, not the database.
@Article{George.McCulloch.93,
  author =       "E. I. George and R. E. McCulloch",
  title =        "Variable selection via {Gibbs} sampling",
  journal =      JASA,
  volume =       "88",
  pages =        "881--889",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Georgiopoulos.ZZ.90,
  author = {M. Georgiopoulos and G. L. Heileman and J. Huang},
  title = {Convergence properties of learning in {ART1}},
  journal = NC,
  volume = {2},
  pages = {502--509},
  year = {1990},
  comment = PRNNref,
}

@Article{Georgiopoulos.ZZ.91,
  author = {M. Georgiopoulos and G. L. Heileman and J. Huang},
  title = {Properties of learning related to pattern diversity in {ART1}},
  journal = NNks,
  volume = {4},
  pages = {751--757},
  year = {1991},
  comment = PRNNref,
}

@Book{Gersho.Gray.92,
  author = {A. Gersho and R. M. Gray},
  title = {Vector Quantization and Signal Compression},
  publisher = {Kluwer Academic Publishers},
  address = {Boston},
  year = {1992},
  comment = PRNNref,
}

@Article{Geyer.92,
  author = {C. Geyer},
  title = {Practical {Markov} chain {Monte Carlo} (with discussion)},
  journal = StatSci,
  volume = {7},
  pages = {473--511},
  year = {1992},
  comment = PRNNref,
}

@Article{Ghurye.Olkin.69,
  author = {S. G. Ghurye and I. Olkin},
  title = {Unbiased estimation of some multivariate probability densities and related functions},
  journal = AnnMathStat,
  volume = {40},
  pages = {1261--1271},
  year = {1969},
  comment = PRNNref,
}

% The accented letter in the second author's surname is written as a braced
% BibTeX special character so that sorting and labels treat it as one letter.
@Article{Gilbert.Lemarechal.89,
  author =       "J. C. Gilbert and C. Lemar{\'e}chal",
  title =        "Some numerical experiments with variable storage
                 quasi-{Newton} methods",
  journal =      MathProg,
  volume =       "45",
  pages =        "407--436",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Gill.ZZ.81,
  author = {P. E. Gill and W. Murray and M. H. Wright},
  title = {Practical Optimization},
  publisher = {Academic Press},
  address = {London},
  year = {1981},
  comment = PRNNref,
}

@InProceedings{Girosi.Anzellotti.93,
  author = {F. Girosi and G. Anzellotti},
  title = {Rates of convergence for radial basis functions and neural networks},
  pages = {97--114},
  year = {1993},
  crossref = {Mammone.93},
  comment = PRNNref,
}

@Article{Girosi.Poggio.90,
  author = {F. Girosi and T. Poggio},
  title = {Networks and the best approximation property},
  journal = BioCyb,
  volume = {63},
  pages = {169--176},
  year = {1990},
  comment = PRNNref,
}

@Article{Girosi.ZZ.95,
  author = {F. Girosi and M. Jones and T. Poggio},
  title = {Regularization theory and neural networks architectures},
  journal = NC,
  volume = {7},
  pages = {219--269},
  year = {1995},
  comment = PRNNref,
}

@Article{Glick.72,
  author = {N. Glick},
  title = {Sample-based classification procedures derived from density estimators},
  journal = JASA,
  volume = {67},
  pages = {116--122},
  year = {1972},
  comment = PRNNref,
}

@Article{Glick.76,
  author = {N. Glick},
  title = {Sample-based classification procedures related to empiric distributions},
  journal = IEIT,
  volume = {22},
  pages = {454--461},
  year = {1976},
  comment = PRNNref,
}

@Book{Glymour.ZZ.87,
  author = {C. Glymour and R. Scheines and P. Spirtes and K. Kelly},
  title = {Discovering Causal Structure: Artificial Intelligence, Philosophy of Science, and Statistical Modeling},
  publisher = {Academic Press},
  address = {San Diego},
  year = {1987},
  comment = PRNNref,
}

@Book{Goldstein.Dillon.78,
  author = {M. Goldstein and W. R. Dillon},
  title = {Discrete Discriminant Analysis},
  publisher = Wiley,
  address = {New York},
  year = {1978},
  comment = PRNNref,
}

@InProceedings{Golomb.ZZ.91,
  author = {B. A. Golomb and D. T. Lawrence and T. J. Sejnowski},
  title = {{SEXNET}: {A} neural network identifies sex from human faces},
  pages = {572--577},
  year = {1991},
  crossref = {NIPS3},
  comment = PRNNref,
}

% The citation key keeps its historical spelling so that existing \cite
% commands still resolve; the author field carries the corrected surname.
@Book{Golombic.80,
  author =       "M. C. Golumbic",
  title =        "Algorithmic Graph Theory and Perfect Graphs",
  publisher =    "Academic Press",
  address =      "New York",
  year =         "1980",
  comment =      PRNNref,
}

@Book{Golub.VanLoan.89,
  author = {G. H. Golub and C. F. {Van Loan}},
  title = {Matrix Computations},
  edition = {Second},
  publisher = {Johns Hopkins University Press},
  address = {Baltimore},
  year = {1989},
  comment = PRNNref,
}

@Book{Gonzalez.Thomason.78,
  author = {R. C. Gonzalez and M. G. Thomason},
  title = {Syntactic Pattern Recognition: An Introduction},
  publisher = {Addison-Wesley},
  address = {Reading, MA},
  year = {1978},
  comment = PRNNunref,
}

@Book{Good.65,
  author = {I. J. Good},
  title = {The Estimation of Probabilities},
  publisher = {The MIT Press},
  address = {Cambridge, MA},
  year = {1965},
  comment = PRNNref,
}

@Book{Good.83,
  author = {I. J. Good},
  title = {Good Thinking: The Foundations of Probability and its Applications},
  publisher = {University of Minnesota Press},
  address = {Minneapolis},
  year = {1983},
  comment = PRNNunref,
}

@Article{Goodman.Smyth.88,
  author = {R. M. Goodman and P. Smyth},
  title = {Decision tree design from a communication theory standpoint},
  journal = IEIT,
  volume = {34},
  pages = {979--994},
  year = {1988},
  comment = PRNNref,
}

@Book{Gordon.81,
  author = {A. D. Gordon},
  title = {Classification. Methods for Exploratory Analysis of Multivariate Data},
  publisher = {Chapman \& Hall},
  address = {London},
  year = {1981},
  comment = PRNNref,
}

@Article{Gori.Tesi.92,
  author = {M. Gori and A. Tesi},
  title = {On the problem of local minima in backpropagation},
  journal = PAMI,
  volume = {14},
  pages = {76--86},
  year = {1992},
  comment = PRNNref,
}

% Title is stored as plain data: the hard-coded \hbox around "latent" was a
% line-breaking hack and belongs in the document, not the database.
@Article{Gower.66,
  author =       "J. C. Gower",
  title =        "Some distance properties of latent root and
                 vector methods used in multivariate analysis",
  journal =      Bka,
  volume =       "53",
  pages =        "325--328",
  year =         "1966",
  comment =      PRNNref,
}

@Article{Gower.71,
  author = {J. C. Gower},
  title = {A general coefficient of similarity and some of its properties},
  journal = Biom,
  volume = {27},
  pages = {857--871},
  year = {1971},
  comment = PRNNref,
}

% "Euclidean" keeps its capital through plain brace protection; the former
% \hbox wrapper was a hard-coded line-breaking hack.
@Article{Gower.Legendre.86,
  author =       "J. C. Gower and P. Legendre",
  title =        "Metric and {Euclidean} properties of
                 dissimilarity coefficients",
  journal =      "Journal of Classification",
  volume =       "3",
  pages =        "5--48",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Gray.84,
  author = {R. M. Gray},
  title = {Vector quantization},
  journal = {IEEE ASSP Magazine},
  volume = {1},
  number = {2},
  pages = {4--29},
  year = {1984},
  comment = PRNNref,
}

@Book{Green.Silverman.94,
  author = {P. J. Green and B. W. Silverman},
  title = {Nonparametric Regression and Generalized Linear Models. {A} Roughness Penalty Approach},
  publisher = {Chapman \& Hall},
  address = {London},
  year = {1994},
  comment = PRNNref,
}

@Book{Grenander.81,
  author = {U. Grenander},
  title = {Abstract Inference},
  publisher = Wiley,
  address = {New York},
  year = {1981},
  comment = PRNNunref,
}

@Book{Grenander.ZZ.91,
  author = {U. Grenander and Y. Chow and D. M. Keenan},
  title = {Hands. {A} Pattern Theoretic Study of Biological Shapes},
  publisher = Springer,
  address = {New York},
  year = {1991},
  comment = PRNNref,
}

@Article{Grinold.69,
  author = {R. C. Grinold},
  title = {Comment on `{Pattern} classification design by linear programming'},
  journal = IEC,
  volume = {18},
  pages = {378--379},
  year = {1969},
  comment = PRNNref,
}

@techreport{Grother.Candela.93,
  author      = {P. J. Grother and G. T. Candela},
  title       = {Comparison of handprinted digit classifiers},
  institution = {US National Institute of Standards and Technology},
  number      = {NISTIR 5209},
  year        = {1993},
  comment     = PRNNref,
}

@article{Gu.90,
  author  = {C. Gu},
  title   = {Adaptive spline smoothing in non-{Gaussian} regression models},
  journal = JASA,
  year    = {1990},
  volume  = {85},
  pages   = {801--807},
  comment = PRNNref,
}

@article{Gu.Wahba.91,
  author  = {C. Gu and G. Wahba},
  title   = {Minimizing {GCV}/{GML} scores with multiple smoothing parameters via the {Newton} method},
  journal = SIAMSSC,
  year    = {1991},
  volume  = {12},
  pages   = {383--398},
  comment = PRNNref,
}

@article{Gu.ZZ.89,
  author  = {C. Gu and D. M. Bates and Z. Chen and G. Wahba},
  title   = {The computation of generalized cross-validation functions
             through {Householder} tridiagonalization with applications to
             the fitting of interaction spline models},
  journal = {SIAM Journal on Matrix Analysis and Applications},
  year    = {1989},
  volume  = {10},
  pages   = {459--480},
  comment = PRNNref,
}

@article{Guo.Gelfand.92,
  author  = {H. Guo and S. B. Gelfand},
  title   = {Classification trees with neural network feature extraction},
  journal = TNN,
  year    = {1992},
  volume  = {3},
  pages   = {923--933},
  comment = PRNNref,
}

@inproceedings{Guyon.ZZ.92,
  author   = {I. Guyon and V. Vapnik and B. Boser and L. Bottou and S. A. Solla},
  title    = {Structural risk minimization for character recognition},
  crossref = {NIPS4},
  year     = {1992},
  pages    = {471--479},
  comment  = PRNNref,
}

@article{Hall.81,
  author  = {P. Hall},
  title   = {On nonparametric multivariate binary discrimination},
  journal = Bka,
  year    = {1981},
  volume  = {68},
  pages   = {287--294},
  comment = PRNNref,
}

@article{Hall.89,
  author  = {P. Hall},
  title   = {On polynomial-based projection indices for exploratory projection pursuit},
  journal = AnnStat,
  year    = {1989},
  volume  = {17},
  pages   = {589--605},
  comment = PRNNref,
}

@techreport{Hall.Ball.65,
  author      = {D. J. Hall and G. B. Ball},
  title       = {{ISODATA}: a novel method of data analysis and pattern classification},
  institution = {Stanford Research Institute, Menlo Park CA},
  year        = {1965},
  comment     = PRNNref,
}

% Hall & Khanna (1977): chapter in volume 3 of the edited collection
% "Statistical Methods for Digital Computers". The title ends in "data";
% the former ending "computers" appears to have been a slip from the
% booktitle -- NOTE(review): confirm against the printed volume.
@InProceedings{Hall.Khanna.77,
  author =       "D. J. Hall and D. Khanna",
  editor =       "K. Enslein and A. Ralston and H. S. Wilf",
  booktitle =    "Statistical Methods for Digital Computers",
  title =        "The {ISODATA} method of computation for relative
                 perception of similarities and differences in complex
                 and real data",
  volume =       "3",
  publisher =    Wiley,
  address =      "New York",
  pages =        "340--373",
  year =         "1977",
  comment =      PRNNunref,
}

@article{Hall.Wand.88,
  author  = {P. Hall and M. P. Wand},
  title   = {On nonparametric discrimination using density differences},
  journal = Bka,
  year    = {1988},
  volume  = {75},
  pages   = {541--547},
  comment = PRNNref,
}

@book{Hampel.ZZ.86,
  author    = {F. R. Hampel and E. M. Ronchetti and P. J. Rousseeuw and W. A. Stahel},
  title     = {Robust Statistics: The Approach Based on Influence Functions},
  year      = {1986},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

% Hampson & Volper (1986), journal article. The journal name is taken from
% the BioCyb string macro ("Biological Cybernetics") defined at the top of
% this file, so the spelling is maintained in one place.
@Article{Hampson.Volper.86,
  author =       "S. E. Hampson and D. J. Volper",
  title =        "Linear function neurons: structure and training",
  journal =      BioCyb,
  volume =       "53",
  pages =        "203--217",
  year =         "1986",
  comment =      PRNNref,
}

@book{Hand.81,
  author    = {D. J. Hand},
  title     = {Discrimination and Classification},
  year      = {1981},
  publisher = Wiley,
  address   = {Chichester},
  comment   = PRNNref,
}

@book{Hand.82,
  author    = {D. J. Hand},
  title     = {Kernel Discriminant Analysis},
  year      = {1982},
  publisher = {Research Studies Press},
  address   = {Chichester},
  comment   = PRNNunref,
}

@article{Hand.Batchelor.78,
  author  = {D. J. Hand and B. G. Batchelor},
  title   = {An edited condensed nearest neighbor rule},
  journal = {Information Sciences},
  year    = {1978},
  volume  = {14},
  pages   = {171--180},
  comment = PRNNunref,
}

@article{Hannan.Quinn.79,
  author  = {E. J. Hannan and B. G. Quinn},
  title   = {The determination of the order of an autoregression},
  journal = JRSSB,
  year    = {1979},
  volume  = {41},
  pages   = {190--195},
  comment = PRNNref,
}

@article{Hansen.Salamon.90,
  author  = {L. K. Hansen and P. Salamon},
  title   = {Neural network ensembles},
  journal = PAMI,
  year    = {1990},
  volume  = {12},
  pages   = {993--1001},
  comment = PRNNref,
}

@inproceedings{Hanson.Pratt.89,
  author   = {S. J. Hanson and L. Y. Pratt},
  title    = {Comparing biases for minimal network construction with back-propagation},
  crossref = {NIPS1},
  year     = {1989},
  pages    = {177--185},
  comment  = PRNNref,
}

@book{Hardle.90,
  author    = {W. H{\"a}rdle},
  title     = {Applied Nonparametric Regression},
  year      = {1990},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  comment   = PRNNref,
}

@book{Hardle.91,
  author    = {W. H{\"a}rdle},
  title     = {Smoothing Techniques with Implementation in {S}},
  year      = {1991},
  publisher = Springer,
  address   = {New York},
  comment   = PRNNref,
}

@article{Hardy.71,
  author  = {R. L. Hardy},
  title   = {Multiquadric equations of topography and other irregular surfaces},
  journal = {Journal of Geophysical Research},
  year    = {1971},
  volume  = {76},
  pages   = {1906--1915},
  comment = PRNNunref,
}

@article{Hardy.90,
  author  = {R. L. Hardy},
  title   = {Theory and applications of the multiquadric-biharmonic method: 20 years of discovery 1968--1988},
  journal = CMwA,
  year    = {1990},
  volume  = {19},
  pages   = {163--208},
  comment = PRNNref,
}

@article{Hart.68,
  author  = {P. E. Hart},
  title   = {The condensed nearest neighbor rule},
  journal = IEIT,
  year    = {1968},
  volume  = {14},
  pages   = {515--516},
  comment = PRNNref,
}

@book{Hartigan.75,
  author    = {J. A. Hartigan},
  title     = {Clustering Algorithms},
  year      = {1975},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNunref,
}

@article{Hartigan.Wong.79,
  author  = {J. A. Hartigan and M. A. Wong},
  title   = {Algorithm {AS136}. {A} ${K}$-means clustering algorithm},
  journal = ApplStat,
  year    = {1979},
  volume  = {28},
  pages   = {100--108},
  comment = PRNNref,
}

@article{Hartman.ZZ.90,
  author  = {E. J. Hartman and J. D. Keeler and J. M. Kowalski},
  title   = {Layered neural networks with {Gaussian} hidden units as universal approximations},
  journal = NC,
  year    = {1990},
  volume  = {2},
  pages   = {210--215},
  comment = PRNNref,
}

@inproceedings{Hassibi.Stork.93,
  author   = {B. Hassibi and D. G. Stork},
  title    = {Second derivatives for network pruning: Optimal {Brain} {Surgeon}},
  crossref = {NIPS5},
  year     = {1993},
  pages    = {164--171},
  comment  = PRNNref,
}

@inproceedings{Hassibi.ZZ.94,
  author   = {B. Hassibi and D. G. Stork and G. Wolff and T. Watanabe},
  title    = {{Optimal} {Brain} {Surgeon}: extensions and performance comparisons},
  crossref = {NIPS6},
  year     = {1994},
  pages    = {263--270},
  comment  = PRNNref,
}

@article{Hastie.Mallows.93,
  author  = {T. Hastie and C. Mallows},
  title   = {Discussion of {Frank} and {Friedman} (1993)},
  journal = Techno,
  year    = {1993},
  volume  = {35},
  pages   = {140--143},
  comment = PRNNref,
}

@article{Hastie.Stuetzle.89,
  author  = {T. Hastie and W. Stuetzle},
  title   = {Principal curves},
  journal = JASA,
  year    = {1989},
  volume  = {84},
  pages   = {502--516},
  comment = PRNNref,
}

@book{Hastie.Tibshirani.90,
  author    = {T. J. Hastie and R. J. Tibshirani},
  title     = {Generalized Additive Models},
  year      = {1990},
  publisher = {Chapman \& Hall},
  address   = {London},
  comment   = PRNNref,
}

@article{Hastie.Tibshirani.96,
  author  = {T. Hastie and R. Tibshirani},
  title   = {Discriminant analysis by {Gaussian} mixtures},
  journal = JRSSB,
  year    = {1996},
  volume  = {58},
  pages   = {158--176},
  comment = PRNNref,
}

@article{Hastie.ZZ.94,
  author  = {T. Hastie and R. Tibshirani and A. Buja},
  title   = {Flexible discriminant analysis by optimal scoring},
  journal = JASA,
  year    = {1994},
  volume  = {89},
  pages   = {1255--1270},
  comment = PRNNref,
}

@article{Hastie.ZZ.95,
  author  = {T. Hastie and A. Buja and R. Tibshirani},
  title   = {Penalized discriminant analysis},
  journal = AnnStat,
  year    = {1995},
  volume  = {23},
  pages   = {73--102},
  comment = PRNNref,
}

@article{Hastings.70,
  author  = {W. K. Hastings},
  title   = {{Monte Carlo} sampling methods using {Markov} chains and their applications},
  journal = Bka,
  year    = {1970},
  volume  = {57},
  pages   = {97--109},
  comment = PRNNref,
}

@article{Hathaway.85,
  author  = {R. J. Hathaway},
  title   = {A constrained formulation of maximum-likelihood estimation for normal mixture distributions},
  journal = AnnStat,
  year    = {1985},
  volume  = {13},
  pages   = {795--800},
  comment = PRNNref,
}

@article{Hauck.Donner.77,
  author  = {Hauck, Jr., W. W. and A. Donner},
  title   = {Wald's test as applied to hypotheses in logit analysis},
  journal = JASA,
  year    = {1977},
  volume  = {72},
  pages   = {851--853},
  comment = PRNNref,
}

@article{Haussler.92,
  author  = {D. Haussler},
  title   = {Decision theoretic generalizations of the {PAC} model for
             neural net and other learning applications},
  journal = InfoComp,
  year    = {1992},
  volume  = {100},
  pages   = {78--150},
  note    = {[Reprinted as pp.~37--116 of \cite{Wolpert.95}]},
  comment = PRNNref,
}

@book{Haykin.94,
  author    = {S. Haykin},
  title     = {Neural Networks. {A} Comprehensive Foundation},
  year      = {1994},
  publisher = {Macmillan College Publishing},
  address   = {New York},
  comment   = PRNNref,
}

@book{Hebb.49,
  author    = {D. O. Hebb},
  title     = {The Organization of Behavior},
  year      = {1949},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Hellman.70,
  author  = {M. E. Hellman},
  title   = {The nearest neighbor classification rule with a reject option},
  journal = {IEEE Transactions on Systems Science and Cybernetics},
  year    = {1970},
  volume  = {6},
  pages   = {179--185},
  note    = NNset,
  comment = PRNNref,
}

@inproceedings{Henrichon.Fu.68,
  author    = {Henrichon, Jr., E. G. and K.-S. Fu},
  title     = {On mode estimation in pattern recognition},
  booktitle = {Proceedings of the Seventh Symposium on Adaptive Processes, UCLA},
  year      = {1968},
  comment   = PRNNunref,
}

@article{Henrichon.Fu.69,
  author  = {Henrichon, Jr., E. G. and K.-S. Fu},
  title   = {A nonparametric partitioning procedure for pattern classification},
  journal = IEC,
  year    = {1969},
  volume  = {18},
  pages   = {614--624},
  comment = PRNNref,
}

@inproceedings{Henrion.88,
  author    = {M. Henrion},
  title     = {Propagating uncertainty in {Bayesian} networks by probabilistic logic sampling},
  editor    = {J. Lemmer and L. N. Kanal},
  booktitle = {Uncertainty in Artificial Intelligence 2},
  year      = {1988},
  pages     = {149--163},
  publisher = {North-Holland},
  address   = {Amsterdam},
  comment   = PRNNref,
}

@article{Henrion.ZZ.91,
  author  = {M. Henrion and J. S. Breese and E. J. Horvitz},
  title   = {Decision analysis and expert systems},
  journal = {AI Magazine},
  year    = {1991},
  volume  = {12},
  number  = {4},
  pages   = {64--91},
  comment = PRNNref,
}

@article{Hermans.ZZ.82,
  author  = {J. Hermans and J. D. F. Habbema and J. R. Schaefer},
  title   = {The {ALLOC80} package for discriminant analysis},
  journal = {Statistical Software Newsletter},
  year    = {1982},
  volume  = {8},
  pages   = {15--20},
  comment = PRNNref,
}

@book{Hertz.ZZ.91,
  author    = {J. Hertz and A. Krogh and R. G. Palmer},
  title     = {Introduction to the Theory of Neural Computation},
  year      = {1991},
  publisher = {Addison-Wesley},
  address   = {Redwood City, CA},
  comment   = PRNNref,
}

% Heskes & Kappen (1991), journal article. The journal is "Physical Review A"
% (singular "Review").
@Article{Heskes.Kappen.91,
  author =       "T. M. Heskes and B. Kappen",
  title =        "Learning processes in neural networks",
  journal =      "Physical Review A",
  volume =       "44",
  pages =        "2718--2726",
  year =         "1991",
  comment =      PRNNref,
}

% Highleyman (1962a), journal article. The journal is the "Bell System
% Technical Journal" (singular "System").
@Article{Highleyman.62a,
  author =       "W. H. Highleyman",
  title =        "The design and analysis of pattern recognition
                 experiments",
  journal =      "Bell System Technical Journal",
  volume =       "41",
  pages =        "723--744",
  year =         "1962",
  comment =      PRNNunref,
}

@article{Highleyman.62b,
  author  = {W. H. Highleyman},
  title   = {Linear decision functions, with application to pattern recognition},
  journal = {Proceedings of the IRE},
  year    = {1962},
  volume  = {50},
  pages   = {1501--1514},
  comment = PRNNref,
}

@article{Hills.66,
  author  = {M. Hills},
  title   = {Allocation rules and their error rates (with discussion)},
  journal = JRSSB,
  year    = {1966},
  volume  = {28},
  pages   = {1--31},
  comment = PRNNref,
}

@inproceedings{Hinton.86,
  author    = {G. E. Hinton},
  title     = {Learning distributed representations of concepts},
  booktitle = {Proceedings of the Eighth Annual Conference of the Cognitive Science Society (Amherst, 1986)},
  year      = {1986},
  pages     = {1--12},
  publisher = {Erlbaum},
  address   = {Hillsdale},
  comment   = PRNNref,
}

@article{Hinton.89a,
  author  = {G. E. Hinton},
  title   = {Connectionist learning procedures},
  journal = AI,
  year    = {1989},
  volume  = {40},
  pages   = {185--234},
  note    = {[Reprinted in \cite{Carbonell.90}]},
  comment = PRNNref,
}

@article{Hinton.89b,
  author  = {G. E. Hinton},
  title   = {Deterministic {Boltzmann} machine learning performs steepest descent in weight space},
  journal = NC,
  year    = {1989},
  volume  = {1},
  pages   = {143--150},
  comment = PRNNref,
}

@inproceedings{Hinton.Sejnowski.83,
  author    = {G. E. Hinton and T. J. Sejnowski},
  title     = {Optimal perceptual inference},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (Washington, 1983)},
  year      = {1983},
  pages     = {448--453},
  publisher = {IEEE Press},
  address   = {New York},
  comment   = PRNNref,
}

@unpublished{Hjort.86,
  author  = {N. L. Hjort},
  title   = {Notes on the Theory of Statistical Symbol Recognition},
  note    = {Norwegian Computing Center Report \textbf{778}},
  year    = {1986},
  comment = PRNNref,
}

@article{Hjort.Glad.95,
  author  = {N. L. Hjort and I. K. Glad},
  title   = {Nonparametric density estimation with a parametric start},
  journal = AnnStat,
  year    = {1995},
  volume  = {23},
  pages   = {882--904},
  comment = PRNNref,
}

@article{Hjort.Jones.96,
  author  = {N. L. Hjort and M. C. Jones},
  title   = {Locally parametric nonparametric density estimation},
  journal = AnnStat,
  year    = {1996},
  volume  = {24},
  pages   = {1619--1647},
  comment = PRNNref,
}

@article{Ho.Kashyap.65,
  author  = {Y.-C. Ho and R. L. Kashyap},
  title   = {An algorithm for linear inequalities and its applications},
  journal = IEEC,
  year    = {1965},
  volume  = {14},
  pages   = {683--688},
  comment = PRNNref,
}

@article{Hodges.87,
  author  = {J. S. Hodges},
  title   = {Uncertainty, policy analysis and statistics (with discussion)},
  journal = StatSci,
  year    = {1987},
  volume  = {2},
  pages   = {259--291},
  comment = PRNNref,
}

@article{Hoeffding.63,
  author  = {W. Hoeffding},
  title   = {Probability inequalities for sums of bounded random variables},
  journal = JASA,
  year    = {1963},
  volume  = {58},
  pages   = {13--30},
  comment = PRNNref,
}

@article{Hoerl.Kennard.70a,
  author  = {A. E. Hoerl and R. W. Kennard},
  title   = {Ridge \hbox{regression:} biased estimation for nonorthogonal problems},
  journal = Techno,
  year    = {1970},
  volume  = {12},
  pages   = {55--67},
  comment = PRNNref,
}

@article{Hoerl.Kennard.70b,
  author  = {A. E. Hoerl and R. W. Kennard},
  title   = {Ridge \hbox{regression:} applications to nonorthogonal problems},
  journal = Techno,
  year    = {1970},
  volume  = {12},
  pages   = {69--82},
  comment = PRNNref,
}

@article{Hoffgen.ZZ.95,
  author  = {K.-U. H{\"{o}}ffgen and H.-U. Simon and K. S. {Van Horn}},
  title   = {Robust trainability of single neurons},
  journal = {Journal of Computer and System Sciences},
  year    = {1995},
  volume  = {50},
  number  = {1},
  pages   = {114--125},
  comment = PRNNunref,
}

@article{Holt.Semnani.90,
  author  = {M. J. J. Holt and S. Semnani},
  title   = {Convergence of back-propagation in neural networks using a log-likelihood cost function},
  journal = {Electronics Letters},
  year    = {1990},
  volume  = {26},
  pages   = {1964--1965},
  comment = PRNNref,
}

@article{Hopfield.82,
  author  = {J. J. Hopfield},
  title   = {Neural networks and physical systems with emergent collective computational facilities},
  journal = PNAS,
  year    = {1982},
  volume  = {79},
  pages   = {2554--2558},
  note    = {[Reprinted in \cite{Anderson.Rosenfeld.88} and \cite{Lau.92}]},
  comment = PRNNref,
}

@article{Hopfield.87,
  author  = {J. J. Hopfield},
  title   = {Learning algorithms and probability distributions in feed-forward and feed-back networks},
  journal = PNAS,
  year    = {1987},
  volume  = {84},
  pages   = {8429--8433},
  comment = PRNNref,
}

@article{Hornik.ZZ.89,
  author  = {K. Hornik and M. Stinchcombe and H. White},
  title   = {Multilayer feedforward networks are universal approximators},
  journal = NNks,
  year    = {1989},
  volume  = {2},
  pages   = {359--366},
  note    = {[Reprinted in \cite{White.92}]},
  comment = PRNNref,
}

@article{Hornik.ZZ.90,
  author  = {K. Hornik and M. Stinchcombe and H. White},
  title   = {Universal approximation of an unknown mapping and its derivatives using feedforward networks},
  journal = NNks,
  year    = {1990},
  volume  = {3},
  pages   = {551--560},
  note    = {[Reprinted in \cite{White.92}]},
  comment = PRNNref,
}

@article{Hrycej.90,
  author  = {T. Hrycej},
  title   = {{Gibbs} sampling in {Bayesian} networks},
  journal = AI,
  year    = {1990},
  volume  = {46},
  pages   = {351--363},
  comment = PRNNref,
}

% Hrycej (1992), book published by Wiley (publisher name via the Wiley
% string macro). Subtitle spelling is "Approach".
@Book{Hrycej.92,
  author =       "T. Hrycej",
  title =        "Modular Learning in Neural Networks. {A} Modularized
                 Approach to Neural Network Classification",
  publisher =    Wiley,
  address =      "New York",
  year =         "1992",
  comment =      PRNNref,
}

@article{Huang.ZZ.95,
  author  = {J. Huang and M. Georgiopoulos and G. L. Heileman},
  title   = {Fuzzy {ART} properties},
  journal = NNks,
  year    = {1995},
  volume  = {8},
  pages   = {203--213},
  comment = PRNNref,
}

% Huber (1967), paper in volume 1 of the Fifth Berkeley Symposium proceedings.
% The editor surname "Le Cam" is wrapped in braces so that BibTeX treats the
% two words as one surname rather than parsing "Le" as a given name.
@InProceedings{Huber.67,
  author =       "P. J. Huber",
  editor =       "L. M. {Le Cam} and J. Neyman",
  booktitle =    "Proceedings of the Fifth Berkeley Symposium on
                 Mathematical Statistics and Probability",
  title =        "The behavior of maximum likelihood estimates under
                 nonstandard conditions",
  volume =       "1",
  publisher =    "University of California Press",
  address =      "Berkeley, CA",
  pages =        "221--233",
  year =         "1967",
  comment =      PRNNref,
}

@book{Huber.81,
  author    = {P. J. Huber},
  title     = {Robust Statistics},
  year      = {1981},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Huber.85,
  author  = {P. J. Huber},
  title   = {Projection pursuit (with discussion)},
  journal = AnnStat,
  year    = {1985},
  volume  = {13},
  pages   = {435--525},
  comment = PRNNref,
}

@book{Hunt.ZZ.66,
  author    = {E. B. Hunt and J. Marin and P. J. Stone},
  title     = {Experiments in Induction},
  year      = {1966},
  publisher = {Academic Press},
  address   = {New York},
  comment   = PRNNref,
}

@inproceedings{Hwang.ZZ.91,
  author    = {J.-N. Hwang and H. Li and D. Martin and J. Schimert},
  title     = {The learning parsimony of projection pursuit and back-propagation networks},
  booktitle = {25th Asilomar Conference on Signals, Systems and Computers, Pacific Grove, CA},
  year      = {1991},
  pages     = {491--495},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA},
  comment   = PRNNref,
}

@inproceedings{Hwang.ZZ.92a,
  author   = {J.-N. Hwang and H. Li and M. Maechler and D. Martin and J. Schimert},
  title    = {A comparison of projection pursuit and neural network regression modeling},
  crossref = {NIPS4},
  year     = {1992},
  pages    = {1159--1166},
  comment  = PRNNref,
}

@article{Hwang.ZZ.92b,
  author  = {J.-N. Hwang and H. Li and M. Maechler and D. Martin and J. Schimert},
  title   = {Projection pursuit learning networks for regression},
  journal = {Engineering Applications of Artificial Intelligence},
  year    = {1992},
  volume  = {5},
  pages   = {193--204},
  comment = PRNNref,
}

@article{Hwang.ZZ.94a,
  author  = {J.-N. Hwang and S.-R. Lay and M. Maechler and D. Martin and J. Schimert},
  title   = {Regression modeling in back-propagation and projection pursuit learning},
  journal = TNN,
  year    = {1994},
  volume  = {5},
  pages   = {342--353},
  comment = PRNNref,
}

@techreport{Hwang.ZZ.94bb,
  author      = {J.-N. Hwang and S.-S. You and S.-R. Lay and I.-C. Jou},
  title       = {What's wrong with a cascaded correlation learning network:
                 a projection pursuit learning perspective},
  institution = {Dept of Electrical Engineering, University of Washington},
  year        = {1994},
  comment     = PRNNref,
}

% Hwang, You, Lay & Jou (1996), journal article. The journal is given through
% the TNN string macro that other entries in this file use; presumably it
% expands to "IEEE Transactions on Neural Networks" -- confirm against its
% definition. Hyphenated initials follow the spelling in Hwang.ZZ.94bb.
@Article{Hwang.ZZ.96,
  author =       "J.-N. Hwang and S.-S. You and S.-R. Lay and I.-C. Jou",
  title =        "The cascade-correlation learning: {A} projection pursuit
                 learning perspective",
  journal =      TNN,
  volume =       "7",
  number =       "2",
  pages =        "278--289",
  year =         "1996",
  comment =      PRNNref,
}

@article{Hyafil.Rivest.76,
  author  = {R. Hyafil and R. L. Rivest},
  title   = {Constructing optimal binary trees is {NP}-complete},
  journal = {Information Processing Letters},
  year    = {1976},
  volume  = {5},
  pages   = {15--17},
  comment = PRNNunref,
}

@article{Impedovo.ZZ.91,
  author  = {S. Impedovo and L. Ottaviano and S. Occhinegro},
  title   = {Optical character recognition---a survey},
  journal = IJPRAI,
  year    = {1991},
  volume  = {5},
  pages   = {1--24},
  comment = PRNNref,
}

@article{Ingrassia.92,
  author  = {S. Ingrassia},
  title   = {A comparison between the simulated annealing and the {EM} algorithms in normal mixture decompositions},
  journal = StatComp,
  year    = {1992},
  volume  = {2},
  pages   = {203--211},
  comment = PRNNref,
}

@inproceedings{Intrator.90,
  author   = {N. Intrator},
  title    = {A neural network for feature extraction},
  crossref = {NIPS2},
  year     = {1990},
  pages    = {719--726},
  comment  = PRNNref,
}

@inproceedings{Intrator.91,
  author   = {N. Intrator},
  title    = {Exploratory feature extraction in speech signals},
  crossref = {NIPS3},
  year     = {1991},
  pages    = {241--247},
  comment  = PRNNref,
}

@article{Intrator.92,
  author  = {N. Intrator},
  title   = {Feature extraction using an unsupervised neural network},
  journal = NC,
  year    = {1992},
  volume  = {4},
  pages   = {98--107},
  comment = PRNNref,
}

@article{Intrator.Cooper.92,
  author  = {N. Intrator and L. N. Cooper},
  title   = {Objective function formulation of the {BCM} theory of visual
             cortical plasticity: statistical connections, stability
             conditions},
  journal = NNks,
  year    = {1992},
  volume  = {5},
  pages   = {3--17},
  comment = PRNNref,
}

% Intrator & Gold (1993), journal article; journal name via the NC string
% macro ("Neural Computation"). The title reads "recognition using", with no
% "of" in between.
@Article{Intrator.Gold.93,
  author =       "N. Intrator and J. I. Gold",
  title =        "Three-dimensional object recognition using an
                 unsupervised {BCM} network: the usefulness of
                 distinguishing features",
  journal =      NC,
  volume =       "5",
  pages =        "61--74",
  year =         "1993",
  comment =      PRNNref,
}

@article{Isham.81,
  author  = {V. Isham},
  title   = {An introduction to spatial point processes and {Markov} random fields},
  journal = ISR,
  year    = {1981},
  volume  = {49},
  pages   = {21--43},
  comment = PRNNref,
}

@book{Jackson.91,
  author    = {J. E. Jackson},
  title     = {A User's Guide to Principal Components},
  year      = {1991},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Jacobs.88,
  author  = {R. A. Jacobs},
  title   = {Increased rates of convergence through learning rate adaptation},
  journal = NNks,
  year    = {1988},
  volume  = {1},
  pages   = {295--307},
  comment = PRNNref,
}

@article{Jacobs.ZZ.91,
  author  = {R. A. Jacobs and M. I. Jordan and S. J. Nowlan and G. E. Hinton},
  title   = {Adaptive mixtures of local experts},
  journal = NC,
  year    = {1991},
  volume  = {3},
  pages   = {79--87},
  comment = PRNNref,
}

@book{Jain.Dubes.88,
  author    = {A. K. Jain and R. C. Dubes},
  title     = {Algorithms for Clustering Data},
  year      = {1988},
  publisher = {Prentice-Hall},
  address   = {Englewood Cliffs, NJ},
  comment   = PRNNunref,
}

@article{Jain.ZZ.87,
  author  = {A. K. Jain and R. C. Dubes and C.-C. Chen},
  title   = {Bootstrap techniques for error estimation},
  journal = PAMI,
  year    = {1987},
  volume  = {9},
  pages   = {628--633},
  comment = PRNNref,
}

@book{James.88,
  author    = {M. James},
  title     = PR,
  year      = {1988},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Jancey.66,
  author  = {R. C. Jancey},
  title   = {Multidimensional group analysis},
  journal = {Australian Journal of Botany},
  year    = {1966},
  volume  = {14},
  pages   = {127--130},
  comment = PRNNunref,
}

@book{Jeffreys.61,
  author    = {H. Jeffreys},
  title     = {Theory of Probability},
  edition   = {Third},
  year      = {1961},
  publisher = {Clarendon Press},
  address   = {Oxford},
  comment   = PRNNref,
}

@inproceedings{Jensen.91,
  author    = {F. V. Jensen},
  title     = {Calculation in {HUGIN} of probabilities for specific configurations --- a trick with many applications},
  booktitle = {Proceedings of the Scandinavian Conference on Artificial Intelligence},
  year      = {1991},
  pages     = {176--186},
  publisher = {IOS Press},
  address   = {Amsterdam},
  comment   = PRNNref,
}

% Jensen (1996), book. The title is in Title Case like the other book entries
% in this file, with "Bayesian" brace-protected as elsewhere.
% NOTE(review): the title was previously recorded as "An introduction to
% Belief Networks"; confirm "Bayesian Networks" against the title page.
@Book{Jensen.96,
  author =       "F. V. Jensen",
  title =        "An Introduction to {Bayesian} Networks",
  publisher =    "UCL Press (Taylor \& Francis Ltd)",
  address =      "London",
  year =         "1996",
  comment =      PRNNref,
}

@inproceedings{Jensen.Liang.95,
  author   = {F. V. Jensen and J. Liang},
  title    = {{drHugin}. {A} system for hypothesis driven data request},
  crossref = {Gammerman.95},
  year     = {1995},
  pages    = {109--124},
  comment  = PRNNref,
}

@article{Jensen.ZZ.90,
  author  = {F. V. Jensen and S. L. Lauritzen and K. G. Olesen},
  title   = {{Bayesian} updating in causal probabilistic networks by local computations},
  journal = {Computational Statistics Quarterly},
  year    = {1990},
  volume  = {5},
  pages   = {269--282},
  comment = PRNNref,
}

@article{Jiang.Zhang.93,
  author  = {Q. Jiang and W. Zhang},
  title   = {An improved method for finding nearest neighbors},
  journal = PRL,
  year    = {1993},
  volume  = {14},
  pages   = {531--535},
  comment = PRNNref,
}

@Article{Johansson.ZZ.91,
  author =       "E. M. Johansson and F. U. Dowla and D. M. Goodman",
  title =        "Back-propagation learning for multi-layer feed-forward
                 neural networks using the conjugate gradient method",
  journal =      IJNS,
  volume =       "2",
  pages =        "291--302",
  year =         "1991",
  comment =      PRNNunref,
}

@Book{Johnson.Kotz.72,
  author =       "N. L. Johnson and S. Kotz",
  title =        "Distributions in Statistics: Continuous Multivariate
                 Distributions",
  publisher =    Wiley,
  address =      "New York",
  year =         "1972",
  comment =      PRNNref,
}

@Book{Jolliffe.86,
  author =       "I. T. Jolliffe",
  title =        "Principal Component Analysis",
  publisher =    Springer,
  address =      "New York",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Jones.87,
  author =       "L. K. Jones",
  title =        "On a conjecture of {Huber} concerning the convergence
                 of projection pursuit regression",
  journal =      AnnStat,
  volume =       "15",
  pages =        "880--882",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Jones.92,
  author =       "L. K. Jones",
  title =        "A simple lemma on greedy approximation in {Hilbert}
                 space and convergence rates for projection pursuit
                 regression and neural network training",
  journal =      AnnStat,
  volume =       "20",
  pages =        "608--613",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Jones.Sibson.87,
  author =       "M. C. Jones and R. Sibson",
  title =        "What is projection pursuit (with discussion)?",
  journal =      JRSSA,
  volume =       "150",
  pages =        "1--36",
  year =         "1987",
  comment =      PRNNref,
}

@InProceedings{Jordan.Jacobs.92,
  author =       "M. I. Jordan and R. A. Jacobs",
  title =        "Hierarchies of adaptive experts",
  crossref =     "NIPS4",
  pages =        "985--992",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Jordan.Jacobs.94,
  author =       "M. I. Jordan and R. A. Jacobs",
  title =        "Hierarchical mixtures of experts and the {EM}
                 algorithm",
  journal =      NC,
  volume =       "6",
  pages =        "181--214",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Kalantari.McDonald.83,
  author =       "I. Kalantari and G. McDonald",
  title =        "A data structure and an algorithm for the nearest
                 point problem",
  journal =      "IEEE Transactions on Software Engineering",
  volume =       "9",
  pages =        "631--634",
  year =         "1983",
  comment =      PRNNref,
}

@InProceedings{Kambhatla.Leen.94,
  author =       "N. Kambhatla and T. K. Leen",
  title =        "Fast non-linear dimension reduction",
  crossref =     "NIPS6",
  pages =        "152--159",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Kamgar-Parsi.Kanal.85,
  author =       "B. Kamgar-Parsi and L. N. Kanal",
  title =        "An improved branch and bound algorithm for computing
                 $k$-nearest neighbours",
  journal =      PRL,
  volume =       "3",
  pages =        "7--12",
  year =         "1985",
  comment =      PRNNref,
}

@Article{Kansa.90,
  author =       "E. J. Kansa",
  title =        "Multiquadrics---a scattered data approximation scheme
                 with applications to computational fluid dynamics. 1",
  journal =      CMwA,
  volume =       "19",
  pages =        "127--145",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Kappen.95,
  author =       "H. J. Kappen",
  title =        "Deterministic learning rules for {Boltzmann}
                 machines",
  journal =      NNks,
  volume =       "8",
  pages =        "537--548",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Karpinski.Macintyre.95a,
  author       = "M. Karpinski and A. Macintyre",
  editor       = "P. Vitanyi",
  booktitle    = "Proceedings of the Second European Conference on
                  Computational Learning Theory (Barcelona, Spain)",
  title        = "Bounding {VC}-dimension of neural networks: Progress and
                  prospects",
  number       = "904",
  publisher    = "Springer",
  address      = "Berlin",
  pages        = "337--341",
  year         = "1995",
  series       = "Lecture Notes in Artificial Intelligence",
  comment =      PRNNunref,
}

@InProceedings{Karpinski.Macintyre.95b,
  author       = "M. Karpinski and A. Macintyre",
  booktitle    = "Proceedings of the Twenty-Seventh Annual ACM Symposium on
                  Theory of Computing (Las Vegas)",
  title        = "Polynomial bounds for {VC} dimension of sigmoidal neural
                  networks",
  publisher    = "ACM Press",
  pages        = "200--208",
  year         = "1995",
  comment =      PRNNunref,
}

@Article{Kashyap.Blaydon.68,
  author =       "R. L. Kashyap and C. C. Blaydon",
  title =        "Estimation of probability density and distribution
                 functions",
  journal =      IEIT,
  volume =       "14",
  pages =        "549--556",
  year =         "1968",
  comment =      PRNNref,
}

@Article{Kass.80,
  author =       "G. V. Kass",
  title =        "An exploratory technique for investigating large
                 quantities of categorical data",
  journal =      ApplStat,
  volume =       "29",
  pages =        "119--127",
  year =         "1980",
  comment =      PRNNref,
}

@Article{Kass.Raftery.95,
  author =       "R. E. Kass and A. E. Raftery",
  title =        "{Bayes} factors",
  journal =      JASA,
  volume =       "90",
  pages =        "773--795",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Kass.Vaidyanathan.92,
  author =       "R. E. Kass and S. K. Vaidyanathan",
  title =        "Approximate {Bayes} factors and orthogonal parameters,
                 with application to testing equality of two binomial
                 proportions",
  journal =      JRSSB,
  volume =       "54",
  pages =        "129--144",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Kaufman.Rousseeuw.90,
  author =       "L. Kaufman and P. J. Rousseeuw",
  title =        "Finding Groups in Data. An Introduction to Cluster
                 Analysis",
  publisher =    Wiley,
  address =      "New York",
  year =         "1990",
  comment =      PRNNref,
}

@Book{Kendall.Stuart.66,
  author =       "M. G. Kendall and A. Stuart",
  title =        "The Advanced Theory of Statistics, volume {III}",
  publisher =    "Griffin",
  address =      "London",
  year =         "1966",
  comment =      PRNNunref,
}

@Article{Kent.ZZ.94,
  author =       "J. T. Kent and D. E. Tyler and Y. Vardi",
  title =        "A curious likelihood identity for the multivariate
                 $t$-distribution",
  journal =      "Communications in Statistics---Simulation and
                 Computation",
  volume =       "23",
  pages =        "441--453",
  year =         "1994",
  comment =      PRNNref,
}

@InProceedings{Kibler.Aha.87,
  author =       "D. Kibler and D. W. Aha",
  editor =       "P. Langley",
  booktitle =    "Proceedings of the Fourth International Workshop on
                 Machine Learning (Irvine, 1987)",
  title =        "Learning representative exemplars of concepts: an
                 initial case study",
  publisher =    MK,
  address =      "Palo Alto, CA",
  pages =        "24--30",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Kiiveri.ZZ.84,
  author =       "H. Kiiveri and T. P. Speed and J. B. Carlin",
  title =        "Recursive causal models",
  journal =      "Journal of the Australian Mathematical Society (series
                 A)",
  volume =       "36",
  pages =        "30--52",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Kim.Park.86,
  author =       "B. S. Kim and S. B. Park",
  title =        "A fast $k$ nearest neighbor finding algorithm based on
                 the ordered partition",
  journal =      PAMI,
  volume =       "8",
  pages =        "761--766",
  year =         "1986",
  note =         NNset,
  comment =      PRNNref,
}

@InProceedings{Kim.Pearl.83,
  author =       "J. H. Kim and J. Pearl",
  editor =       "A. Bundy",
  booktitle =    "Proceedings of the Eighth International Joint
                 Conference on Artificial Intelligence (Karlsruhe,
                 1983)",
  title =        "A computational model for combined causal and
                 diagnostic reasoning in inference systems",
  publisher =    "AAAI",
  address =      "Menlo Park, CA",
  pages =        "190--193",
  year =         "1983",
  comment =      PRNNref,
}

@Article{King.ZZ.92,
  author =       "R. D. King and S. Muggleton and R. A. Lewis and M. J.
                 E. Sternberg",
  title =        "Drug design by machine learning: The use of inductive
                 logic programming to model the structure-activity
                 relationships of trimethoprim analogues binding to
                 dihydrofolate reductase",
  journal =      PNAS,
  volume =       "89",
  pages =        "11322--11326",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Kjaerulff.92,
  author =       "U. Kj{\ae}rulff",
  title =        "Optimal decomposition of probabilistic networks by
                 simulated annealing",
  journal =      StatComp,
  volume =       "2",
  pages =        "7--17",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Kleijnen.87,
  author =       "J. P. C. Kleijnen",
  title =        "Statistical Tools for Simulation Practitioners",
  publisher =    "Marcel Dekker",
  address =      "New York",
  year =         "1987",
  comment =      PRNNref,
}

@Book{Kleijnen.Groenendaal.92,
  author =       "J. P. C. Kleijnen and W. van Groenendaal",
  title =        "Simulation: {A} Statistical Perspective",
  publisher =    Wiley,
  address =      "Chichester",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Knerr.ZZ.92,
  author =       "S. Knerr and L. Personnaz and G. Dreyfus",
  title =        "Handwritten digit recognition by neural networks with
                 single-layer training",
  journal =      TNN,
  volume =       "3",
  pages =        "962--968",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Knuth.68,
  author =       "D. E. Knuth",
  title =        "The Art of Computer Programming, Volume 1: Fundamental
                 Algorithms",
  publisher =    "Addison-Wesley",
  address =      "Reading, MA",
  year =         "1968",
  note =         "[Second edition, 1973]",
  comment =      PRNNref,
}

@Article{Kohonen.82a,
  author =       "T. Kohonen",
  title =        "Self-organized formation of topologically correct
                 feature maps",
  journal =      BioCyb,
  volume =       "43",
  pages =        "59--69",
  year =         "1982",
  note =         "[Reprinted in \cite{Anderson.Rosenfeld.88}]",
  comment =      PRNNref,
}

@Article{Kohonen.82b,
  author =       "T. Kohonen",
  title =        "Analysis of a simple self-organizing process",
  journal =      BioCyb,
  volume =       "44",
  pages =        "135--140",
  year =         "1982",
  comment =      PRNNref,
}

@Article{Kohonen.88a,
  author =       "T. Kohonen",
  title =        "An introduction to neural computing",
  journal =      NNks,
  volume =       "1",
  pages =        "3--16",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Kohonen.88b,
  author =       "T. Kohonen",
  title =        "Learning vector quantization",
  journal =      NNks,
  volume =       "1",
  number =       "(suppl.~1)",
  pages =        "303",
  year =         "1988",
  comment =      PRNNref,
}

@Book{Kohonen.89,
  author =       "T. Kohonen",
  title =        "Self-Organization and Associative Memory",
  publisher =    Springer,
  address =      "Berlin",
  edition =      "Third",
  year =         "1989",
  note =         "[First edition, 1984]",
  comment =      PRNNref,
}

@Article{Kohonen.90a,
  author =       "T. Kohonen",
  title =        "The self-organizing map",
  journal =      PIEEE,
  volume =       "78",
  pages =        "1464--1480",
  year =         "1990",
  note =         rep-Lau,
  comment =      PRNNref,
}

@InProceedings{Kohonen.90b,
  author =       "T. Kohonen",
  booktitle =    "Proceedings of the IEEE International Conference on
                 Neural Networks, San Diego",
  title =        "Improved versions of learning vector quantization",
  volume =       "I",
  publisher =    "IEEE Press",
  address =      "New York",
  pages =        "545--550",
  year =         "1990",
  comment =      PRNNunref,
}

@Article{Kohonen.93,
  author =       "T. Kohonen",
  title =        "Physiological interpretation of the self-organizing
                 map algorithm",
  journal =      NNks,
  volume =       "6",
  pages =        "895--905",
  year =         "1993",
  comment =      PRNNref,
}

@Book{Kohonen.95,
  author =       "T. Kohonen",
  title =        "Self-Organizing Maps",
  publisher =    Springer,
  address =      "Berlin",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Kohonen.ZZ.88,
  author =       "T. Kohonen and G. Barna and R. Chrisley",
  booktitle =    "Proceedings of the IEEE International Conference on
                 Neural Networks, San Diego",
  title =        "Statistical pattern recognition with neural networks:
                 benchmarking studies",
  volume =       "I",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "61--68",
  year =         "1988",
  note =         "[Reprinted in \cite{Anderson.ZZ.90}]",
  comment =      PRNNref,
}

@Manual{Kohonen.ZZ.92,
  author =       "T. Kohonen and J. Kangas and J. Laaksonen and K.
                 Torkkola",
  title =        "\emph{LVQ\_PAK}\@. The learning vector quantization
                 program package version 2.1",
  organization = "Laboratory of Computer and Information Science,
                 Helsinki University of Technology",
  year =         "1992",
  note =         "[Version 3.1 became available in 1995]",
  comment =      PRNNref,
}

@Article{Kong.91,
  author =       "A. Kong",
  title =        "Efficient methods for computing linkage likelihoods of
                 recessive diseases in inbred pedigrees",
  journal =      "Genetic Epidemiology",
  volume =       "8",
  pages =        "81--103",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Koiran.Sontag.96,
  author       = "Pascal Koiran and Eduardo D. Sontag",
  title        = "Neural networks with quadratic {VC} dimension",
  crossref     = "NIPS8",
  pages        = "197--203",
  year         = "1996",
  comment =      PRNNref,
}

@TechReport{Kononenko.ZZ.84,
  author =       "I. Kononenko and I. Bratko and E. Ro{\v s}kar",
  title =        "Experiments in the automatic learning of medical
                 diagnosis rules",
  institution =  "Jo{\v z}ef Stefan Institute, Ljubljana",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Koontz.ZZ.75,
  author =       "W. L. G. Koontz and P. M. Narendra and K. Fukunaga",
  title =        "A branch and bound clustering algorithm",
  journal =      IEC,
  volume =       "24",
  pages =        "908--915",
  year =         "1975",
  comment =      PRNNref,
}

@Article{Kramer.91,
  author =       "M. A. Kramer",
  title =        "Nonlinear principal component analysis using
                 autoassociative neural networks",
  journal =      "{AIChE} Journal",
  volume =       "37",
  pages =        "233--243",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Kramer.Sangiovanni-Vincentelli.89,
  author =       "A. H. Kramer and A. Sangiovanni-Vincentelli",
  title =        "Efficient parallel learning algorithms for neural
                 networks",
  crossref =     "NIPS1",
  pages =        "40--48",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Krishnaiah.Kanal.82,
  editor =       "P. R. Krishnaiah and L. N. Kanal",
  title =        "Handbook of Statistics 2: Classification, Pattern
                 Recognition and Reduction of Dimensionality",
  publisher =    "North Holland",
  address =      "Amsterdam",
  year =         "1982",
  comment =      PRNNref,
}

@Article{Kruskal.64a,
  author =       "J. B. Kruskal",
  title =        "Multidimensional scaling by optimizing goodness-of-fit
                 to a nonmetric hypothesis",
  journal =      PSym,
  volume =       "29",
  pages =        "1--27",
  year =         "1964",
  comment =      PRNNunref,
}

@Article{Kruskal.64b,
  author =       "J. B. Kruskal",
  title =        "Non-metric multidimensional scaling: a numerical
                 method",
  journal =      PSym,
  volume =       "29",
  pages =        "115--129",
  year =         "1964",
  comment =      PRNNunref,
}

@InProceedings{Kruskal.69,
  author =       "J. B. Kruskal",
  editor =       "R. C. Milton and J. A. Nelder",
  booktitle =    "Statistical Computation",
  title =        "Toward a practical method which helps uncover the
                 structure of a set of multivariate observations by
                 finding the linear transformation which optimizes a new
                 `index of condensation'",
  publisher =    "Academic Press",
  address =      "New York",
  pages =        "427--440",
  year =         "1969",
  comment =      PRNNunref,
}

@Article{Kruskal.71,
  author =       "J. B. Kruskal",
  title =        "Monotone regression: continuity and differentiability
                 properties",
  journal =      PSym,
  volume =       "36",
  pages =        "57--62",
  year =         "1971",
  comment =      PRNNunref,
}

@InProceedings{Kruskal.72,
  author =       "J. B. Kruskal",
  editor =       "R. N. Shepard and A. K. Romney and S. K. Nerlove",
  booktitle =    "Multidimensional Scaling: Theory and Applications in
                 the Behavioral Sciences",
  title =        "Linear transformation of multivariate data to reveal
                 clustering",
  publisher =    "Seminar Press",
  address =      "New York",
  pages =        "179--191",
  year =         "1972",
  comment =      PRNNunref,
}

@Article{Krzanowski.75,
  author =       "W. J. Krzanowski",
  title =        "Discrimination and classification using both binary
                 and continuous variables",
  journal =      JASA,
  volume =       "70",
  pages =        "782--790",
  year =         "1975",
  comment =      PRNNref,
}

@InProceedings{Kung.Diamantaras.90,
  author =       "S. Y. Kung and K. I. Diamantaras",
  booktitle =    "Proceedings of the IEEE International Conference on
                 Acoustics, Speech and Signal Processing (Albuquerque,
                 NM, 1990)",
  title =        "A neural network learning algorithm for {Adaptive
                 Principal component EXtraction (APEX)}",
  volume =       "2",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "861--864",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Kurkova.91,
  author =       "V. K{\r u}rkov{\'a}",
  title =        "Kolmogorov's theorem is relevant",
  journal =      NC,
  volume =       "3",
  pages =        "617--622",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Kurkova.92,
  author =       "V. K{\r u}rkov{\'a}",
  title =        "Kolmogorov's theorem and multilayer neural networks",
  journal =      NNks,
  volume =       "5",
  pages =        "501--506",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Kurzynski.83a,
  author =       "M. W. Kurzynski",
  title =        "Decision rules for a hierarchical classifier",
  journal =      PRL,
  volume =       "1",
  pages =        "305--310",
  year =         "1983",
  comment =      PRNNref,
}

@Article{Kurzynski.83b,
  author =       "M. W. Kurzynski",
  title =        "The optimal strategy of a tree classifier",
  journal =      PR,
  volume =       "16",
  pages =        "81--87",
  year =         "1983",
  note =         "[Correction page 361]",
  comment =      PRNNref,
}

@Article{Kushner.87,
  author =       "H. Kushner",
  title =        "Asymptotic global behavior for stochastic
                 approximation and diffusions with slowly decreasing
                 noise effects: global minimization via {Monte Carlo}",
  journal =      "SIAM Journal on Applied Mathematics",
  volume =       "47",
  pages =        "169--185",
  year =         "1987",
  comment =      PRNNref,
}

@InProceedings{Kwok.Carter.90,
  author =       "S. W. Kwok and C. Carter",
  editor =       "R. D. Shachter and T. S. Levitt and L. N. Kanal and J.
                 F. Lemmer",
  booktitle =    "Uncertainty in Artificial Intelligence 4",
  title =        "Multiple decision trees",
  publisher =    "North Holland",
  address =      "Amsterdam",
  pages =        "327--335",
  year =         "1990",
  comment =      PRNNref,
}

@Book{Lachenbruch.75,
  author =       "P. A. Lachenbruch",
  title =        "Discriminant Analysis",
  publisher =    "Hafner Press",
  address =      "New York",
  year =         "1975",
  comment =      PRNNunref,
}

@Article{Lachenbruch.Mickey.68,
  author =       "P. A. Lachenbruch and M. R. Mickey",
  title =        "Estimation of error rates in discriminant analysis",
  journal =      Techno,
  volume =       "10",
  pages =        "1--11",
  year =         "1968",
  comment =      PRNNref,
}

@Article{Lange.ZZ.89,
  author =       "K. L. Lange and R. J. A. Little and J. M. G. Taylor",
  title =        "Robust statistical modeling using the $t$
                 distribution",
  journal =      JASA,
  volume =       "84",
  pages =        "881--896",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Langley.96,
  author       = "P. Langley",
  title        = "Elements of Machine Learning",
  publisher    = "Morgan Kaufmann",
  address      = "San Francisco",
  year         = "1996",
  comment =      PRNNref,
}

@Article{Langley.Simon.95,
  author       = "P. Langley and H. A. Simon",
  title        = "Applications of machine learning and rule induction",
  journal      = "Communications of the ACM",
  volume       = "38",
  number       = "11",
  pages        = "54--64",
  year         = "1995",
  comment =      PRNNref,
}

@Book{Lau.92,
  editor =       "C. Lau",
  title =        "Neural Networks: Theoretical Foundations and
                 Analysis",
  publisher =    "IEEE Press",
  address =      "New York",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Lauritzen.89,
  author =       "S. L. Lauritzen",
  title =        "Mixed graphical association models (with discussion)",
  journal =      "Scandinavian Journal of Statistics",
  volume =       "16",
  pages =        "273--306",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Lauritzen.92,
  author =       "S. L. Lauritzen",
  title =        "Propagation of probabilities, means and variances in
                 mixed graphical association models",
  journal =      JASA,
  volume =       "87",
  pages =        "1098--1108",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Lauritzen.96,
  author       = "Steffen L. Lauritzen",
  title        = "Graphical Models",
  publisher    = "Clarendon Press",
  address      = "Oxford",
  year         = "1996",
  ISBN         = "0-19-852219-3",
  comment =      PRNNref,
}

@Article{Lauritzen.Spiegelhalter.88,
  author =       "S. L. Lauritzen and D. J. Spiegelhalter",
  title =        "Local computations with probabilities on graphical
                 structures and their application to expert systems
                 (with discussion)",
  journal =      JRSSB,
  volume =       "50",
  pages =        "157--224",
  year =         "1988",
  note =         URset,
  comment =      PRNNref,
}

@Article{Lauritzen.Wermuth.89,
  author =       "S. L. Lauritzen and N. Wermuth",
  title =        "Graphical models for associations between variables,
                 some of which are qualitative and some quantitative",
  journal =      AnnStat,
  volume =       "17",
  pages =        "31--57",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Lauritzen.ZZ.90,
  author =       "S. L. Lauritzen and A. P. Dawid and B. N. Larsen and
                 H.-G. Leimer",
  title =        "Independence properties of directed {Markov} fields",
  journal =      Nks,
  volume =       "20",
  pages =        "491--505",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Lauritzen.ZZ.94,
  author =       "S. L. Lauritzen and B. Thiesson and D. J.
                 Spiegelhalter",
  editor =       "P. Cheeseman and R. W. Oldford",
  booktitle =    "Selecting Models from Data: AI and Statistics IV",
  title =        "Diagnostic systems created by model selection
                 methods---a case study",
  volume =       "89",
  publisher =    Springer,
  address =      "New York",
  pages =        "143--152",
  year =         "1994",
  series =       "Lecture Notes in Statistics",
  comment =      PRNNunref,
}

@InProceedings{Lazarsfeld.61,
  author =       "P. F. Lazarsfeld",
  editor =       "H. Solomon",
  booktitle =    "Studies in Item Analysis and Prediction",
  title =        "The algebra of dichotomous systems",
  publisher =    "Stanford University Press",
  address =      "Palo Alto, CA",
  pages =        "111--157",
  year =         "1961",
  comment =      PRNNunref,
}

@TechReport{LeBlanc.Tibshirani.93,
  author =       "M. LeBlanc and R. J. Tibshirani",
  title =        "Combining estimates in regression and classification",
  type =         "Preprint",
  institution =  "Depts of Preventive Medicine and Biostatistics and of
                 Statistics, University of Toronto",
  year =         "1993",
  comment =      PRNNref,
}

@Article{LeCun.ZZ.89,
  author =       "Y. {Le Cun} and B. Boser and J. S. Denker and D.
                 Henderson and R. E. Howard and W. Hubbard and L. D.
                 Jackel",
  title =        "Backpropagation applied to handwritten {Zip} code
                 recognition",
  journal =      NC,
  volume =       "1",
  pages =        "541--551",
  year =         "1989",
  note =         "[Reprinted in \cite{Anderson.ZZ.90}]",
  comment =      PRNNref,
}

@InProceedings{LeCun.ZZ.90a,
  author =       "Y. {Le Cun} and B. Boser and J. S. Denker and D.
                 Henderson and R. E. Howard and W. Hubbard and L. D.
                 Jackel",
  title =        "Handwritten digit recognition with a back-propagation
                 network",
  crossref =     "NIPS2",
  pages =        "396--404",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{LeCun.ZZ.90b,
  author =       "Y. {Le Cun} and J. S. Denker and S. A. Solla",
  title =        "Optimal brain damage",
  crossref =     "NIPS2",
  pages =        "598--605",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Lee.91,
  author =       "Y. Lee",
  title =        "Handwritten digit recognition using {K}
                 nearest-neighbor, radial-basis function, and
                 backpropagation neural networks",
  journal =      NC,
  volume =       "3",
  pages =        "440--449",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Lee.Kil.88,
  author =       "S. Lee and R. M. Kil",
  booktitle =    "Proceedings of the IEEE International Conference on
                 Neural Networks, San Diego",
  title =        "Multi-layer feedforward potential function network",
  volume =       "I",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "161--171",
  year =         "1988",
  comment =      PRNNref,
}

@InProceedings{Lee.ZZ.90,
  author =       "T.-C. Lee and A. M. Peterson and J. C. Tsai",
  booktitle =    "Proceedings of the IEEE International Conference on
                 Systems, Man and Cybernetics, Los Angeles",
  title =        "A multi-layer feed-forward neural network with
                 dynamically adjustable structures",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "367--369",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Leeuw.84,
  author =       "J. de Leeuw",
  title =        "Differentiability of {Kruskal's} stress at a local
                 minimum",
  journal =      PSym,
  volume =       "49",
  pages =        "111--113",
  year =         "1984",
  comment =      PRNNref,
}

@Book{Lehmann.83,
  author =       "E. L. Lehmann",
  title =        "Theory of Point Estimation",
  publisher =    Wiley,
  address =      "New York",
  year =         "1983",
  comment =      PRNNref,
}

@Book{Lehmann.86,
  author =       "E. L. Lehmann",
  title =        "Testing Statistical Hypotheses",
  publisher =    "Wadsworth and Brooks/Cole",
  address =      "Pacific Grove, CA",
  edition =      "Second",
  year =         "1986",
  note =         "[Formerly New York: Wiley]",
  comment =      PRNNref,
}

@Article{Leonard.ZZ.92,
  author =       "J. A. Leonard and M. A. Kramer and J. H. Ungar",
  title =        "Using radial basis functions to approximate a function
                 and its error bounds",
  journal =      TNN,
  volume =       "3",
  pages =        "624--627",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Lesaffre.Albert.89,
  author =       "E. Lesaffre and A. Albert",
  title =        "Partial separation in logistic discrimination",
  journal =      JRSSB,
  volume =       "51",
  pages =        "109--116",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Levin.ZZ.94,
  author =       "A. U. Levin and T. K. Leen and J. E. Moody",
  title =        "Fast pruning using principal components",
  crossref =     "NIPS6",
  pages =        "35--42",
  year =         "1994",
  comment =      PRNNref,
}

@InProceedings{Levitt.ZZ.90,
  author =       "T. S. Levitt and T. O. Binford and G. L. Ettinger",
  editor =       "R. D. Shachter and T. S. Levitt and L. N. Kanal and J.
                 F. Lemmer",
  booktitle =    "Uncertainty in Artificial Intelligence 4",
  title =        "Utility-based control for computer vision",
  publisher =    "North Holland",
  address =      "Amsterdam",
  pages =        "407--422",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Li.Dubes.86,
  author =       "X. B. Li and R. C. Dubes",
  title =        "Tree classifier design with a permutation statistic",
  journal =      PR,
  volume =       "19",
  pages =        "229--235",
  year =         "1986",
  comment =      PRNNref,
}

@InProceedings{Lincoln.Skrzypek.90,
  author =       "W. P. Lincoln and J. Skrzypek",
  title =        "Synergy of clustering multiple backpropagation
                 networks",
  crossref =     "NIPS2",
  pages =        "650--657",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Lindley.80,
  author =       "D. V. Lindley",
  editor =       "J. M. Bernardo and M. H. DeGroot and D. V. Lindley and
                 A. F. M. Smith",
  booktitle =    "Bayesian Statistics",
  title =        "Approximate {Bayesian} methods",
  publisher =    "Valencia University Press",
  address =      "Valencia",
  pages =        "223--237",
  year =         "1980",
  comment =      PRNNref,
}

@Book{Little.Rubin.87,
  author =       "R. J. A. Little and D. B. Rubin",
  title =        "Statistical Analysis with Missing Data",
  publisher =    Wiley,
  address =      "New York",
  year =         "1987",
  comment =      PRNNref,
}

@InProceedings{Liu.93,
  author =       "Y. Liu",
  title =        "Neural network model selection using asymptotic
                 jackknife estimator and cross-validation method",
  crossref =     "NIPS5",
  pages =        "599--606",
  year =         "1993",
  comment =      PRNNref,
}

@InProceedings{Liu.94,
  author =       "Y. Liu",
  title =        "Robust parameter estimation and model selection for
                 neural network regression",
  crossref =     "NIPS6",
  pages =        "192--199",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Liu.95,
  author =       "Y. Liu",
  title =        "Unbiased estimate of generalization error and model
                 selection in neural network",
  journal =      NNks,
  volume =       "8",
  pages =        "215--219",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Liu.Nocedal.89,
  author =       "D. C. Liu and J. Nocedal",
  title =        "On the limited memory {BFGS} method for large-scale
                 optimization",
  journal =      MathProg,
  volume =       "45",
  pages =        "503--528",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Liu.ZZ.91,
  author =       "L. Liu and D. C. Wilkins and X. Ying and Z. Bain",
  booktitle =    "Proceedings of the Conference on Uncertainty in AI
                 (Cambridge, MA)",
  title =        "Minimum error tree decomposition",
  pages =        "180--185",
  year =         "1991",
  comment =      PRNNunref,
}

@TechReport{Lloyd.57,
  author =       "S. P. Lloyd",
  title =        "Least squares quantization in {PCM}\@",
  type =         "Technical Note",
  institution =  "Bell Laboratories",
  year =         "1957",
  note =         "[Published as \cite{Lloyd.82}]",
  comment =      PRNNref,
}

@Article{Lloyd.82,
  author =       "S. P. Lloyd",
  title =        "Least squares quantization in {PCM}\@",
  journal =      IEIT,
  volume =       "28",
  pages =        "128--137",
  year =         "1982",
  comment =      PRNNref,
}

@Article{Loizou.Maybank.87,
  author =       "G. Loizou and S. J. Maybank",
  title =        "The nearest neighbor and the {Bayes} error rates",
  journal =      PAMI,
  volume =       "9",
  pages =        "254--262",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Louis.82,
  author =       "T. A. Louis",
  title =        "Finding the observed information matrix when using the
                 {EM} algorithm",
  journal =      JRSSB,
  volume =       "44",
  pages =        "226--233",
  year =         "1982",
  comment =      PRNNref,
}

@Article{Lunts.Brailovsky.67,
  author =       "A. L. Lunts and V. L. Brailovsky",
  title =        "Evaluation of attributes obtained in statistical
                 decision rules",
  journal =      "Engineering Cybernetics",
  volume =       "3",
  pages =        "98--109",
  year =         "1967",
  comment =      PRNNunref,
}

@Article{Luttrell.89,
  author =       "S. P. Luttrell",
  title =        "Hierarchical vector quantization",
  journal =      "IEE Proceedings I",
  volume =       "136",
  pages =        "405--413",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Maass.94a,
  author =       "W. Maass",
  title =        "Neural networks with superlinear {VC} dimension",
  journal =      NC,
  volume =       "6",
  pages =        "877--884",
  year =         "1994",
  comment =      PRNNref,
}

@InCollection{Maass.94b,
  author =       "W. Maass",
  editor =       "V. Roychowdhury and K.-Y. Siu and A. Orlitsky",
  booktitle =    "Theoretical Advances in Neural Computation and
                 Learning",
  title =        "Perspectives of current research about the complexity
                 of learning on neural nets",
  chapter =      "5",
  publisher =    "Kluwer Academic Publishers",
  address =      "Boston",
  year =         "1994",
  note =         "[Also NeuroCOLT Technical Report Series NC-TR-95-003.]",
  comment =      PRNNref,
  ISBN =         "0-7923-9478-X",
}

@InCollection{Maass.Turan.94,
  author       = "W. Maass and G. Tur{\'a}n",
  editor       = "S. J. Hanson and G. A. Drastal and R. L. Rivest",
  booktitle    = "Computational Learning Theory and Natural Learning
                  Systems: Constraints and Prospects",
  title        = "How Fast Can a Threshold Gate Learn?",
  volume       = "I",
  publisher    = "MIT Press",
  pages        = "381--414",
  year         = "1994",
  ISBN         = "0-262-58126-4",
  comment =      PRNNref,
}

@InProceedings{Macintyre.Sontag.93,
  author =       "A. Macintyre and E. D. Sontag",
  editor =       "W. Aggarwal",
  booktitle =    "Proceedings of the 25th Annual ACM Symposium on Theory
                 of Computing, San Diego, 1993",
  title =        "Finiteness results for sigmoidal ``neural'' networks",
  publisher =    "ACM Press",
  address =      "New York",
  pages =        "325--334",
  year =         "1993",
  comment =      PRNNref,
}

@Article{MacKay.92a,
  author =       "D. J. C. MacKay",
  title =        "{Bayesian} interpolation",
  journal =      NC,
  volume =       "4",
  pages =        "415--447",
  year =         "1992",
  comment =      PRNNref,
}

@Article{MacKay.92b,
  author =       "D. J. C. MacKay",
  title =        "A practical {Bayesian} framework for backprop
                 networks",
  journal =      NC,
  volume =       "4",
  pages =        "448--472",
  year =         "1992",
  comment =      PRNNref,
}

@Article{MacKay.92c,
  author =       "D. J. C. MacKay",
  title =        "Information-based objective functions for active data
                 selection",
  journal =      NC,
  volume =       "4",
  pages =        "590--604",
  year =         "1992",
  comment =      PRNNref,
}

@Article{MacKay.92d,
  author =       "D. J. C. MacKay",
  title =        "The evidence framework applied to classification
                 networks",
  journal =      NC,
  volume =       "4",
  pages =        "720--736",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{MacKay.92e,
  author =       "D. J. C. MacKay",
  title =        "{Bayesian} model comparison and backprop nets",
  crossref =     "NIPS4",
  pages =        "839--846",
  year =         "1992",
  comment =      PRNNref,
}

@Article{MacKay.McCulloch.52,
  author =       "D. M. MacKay and W. S. McCulloch",
  title =        "The limiting information capacity of a neuronal link",
  journal =      "Bulletin of Mathematical Biophysics",
  volume =       "14",
  pages =        "127--135",
  year =         "1952",
  comment =      PRNNunref,
}

@Article{MacLeod.ZZ.87,
  author =       "J. E. S. MacLeod and A. Luk and D. M. Titterington",
  title =        "A re-examination of the distance-weighted $k$-nearest
                 neighbor classification rule",
  journal =      SMC,
  volume =       "17",
  pages =        "689--696",
  year =         "1987",
  note =         NNset,
  comment =      PRNNunref,
}

@Article{Macnaughton-Smith.ZZ.84,
  author =       "P. Macnaughton-Smith and W. T. Williams and M. B. Dale
                 and L. G. Mockett",
  title =        "Dissimilarity analysis: a new technique of
                 hierarchical sub-division",
  journal =      Nat,
  volume =       "202",
  pages =        "1034--1035",
  year =         "1964",
  comment =      PRNNref,
}

@InProceedings{MacQueen.67,
  author =       "J. MacQueen",
  editor =       "L. M. Le Cam and J. Neyman",
  booktitle =    "Proceedings of the Fifth Berkeley Symposium on
                 Mathematical Statistics and Probability",
  title =        "Some methods for classification and analysis of
                 multivariate observations",
  volume =       "1",
  publisher =    "University of California Press",
  address =      "Berkeley, CA",
  pages =        "281--297",
  year =         "1967",
  comment =      PRNNref,
}

@Article{Madigan.Raftery.94,
  author =       "D. Madigan and A. E. Raftery",
  title =        "Model selection and accounting for model uncertainty
                 in graphical models using {Occam}'s window",
  journal =      JASA,
  volume =       "89",
  pages =        "1535--1546",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Madigan.York.95,
  author =       "D. Madigan and J. York",
  title =        "{Bayesian} graphical models for discrete data",
  journal =      ISR,
  volume =       "63",
  pages =        "215--232",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Madych.Nelson.90,
  author =       "W. R. Madych and S. A. Nelson",
  title =        "Multivariate interpolation and conditionally positive
                 definite functions {II}",
  journal =      "Mathematics of Computation",
  volume =       "54",
  pages =        "211--230",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Mahalanobis.36,
  author =       "P. C. Mahalanobis",
  title =        "On generalized distance in statistics",
  journal =      "Proceedings of the National Institute of Sciences of
                 India",
  volume =       "2",
  pages =        "49--55",
  year =         "1936",
  comment =      PRNNunref,
}

@Book{Maier.83,
  author =       "D. Maier",
  title =        "The Theory of Relational Databases",
  publisher =    "Computer Science Press",
  address =      "Rockville, MD",
  year =         "1983",
  comment =      PRNNunref,
}

@InProceedings{Makram-Ebeid.ZZ.89,
  author =       "S. Makram-Ebeid and J.-A. Sirat and J.-R. Viala",
  booktitle =    "International Joint Conference on Neural Networks
                 (Washington, 1989)",
  title =        "A rationalized back-propagation learning algorithm",
  volume =       "II",
  publisher =    "IEEE Press",
  address =      "New York",
  pages =        "373--380",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Mangarasian.68,
  author =       "O. L. Mangasarian",
  title =        "Multisurface method of pattern separation",
  journal =      IEIT,
  volume =       "14",
  pages =        "801--807",
  year =         "1968",
  comment =      PRNNref,
}

@InProceedings{Mangarasian.ZZ.90,
  author =       "O. L. Mangasarian and R. Setiono and W. H. Wolberg",
  editor =       "T. F. Coleman and Y. Li",
  booktitle =    "Large-Scale Numerical Optimization, 1990",
  title =        "Pattern recognition via linear programming: theory and
                 application to medical diagnosis",
  publisher =    "SIAM",
  address =      "Philadelphia",
  pages =        "22--31",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Manly.Rayner.87,
  author =       "B. F. J. Manly and J. C. W. Rayner",
  title =        "The comparison of sample covariance matrices using
                 likelihood ratio tests",
  journal =      Bka,
  volume =       "74",
  pages =        "841--847",
  year =         "1987",
  comment =      PRNNref,
}

@InProceedings{Mansfield.91,
  author =       "A. J. Mansfield",
  booktitle =    "Proceedings of the International Joint Conference on
                 Neural Networks (Seattle 1991)",
  title =        "Comparison of perceptron training by
                 linear-programming and by the perceptron convergence
                 procedure",
  volume =       "II",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "25--30",
  year =         "1991",
  comment =      PRNNref,
}

@Book{Mardia.ZZ.79,
  author =       "K. V. Mardia and J. T. Kent and J. M. Bibby",
  title =        "Multivariate Analysis",
  publisher =    "Academic Press",
  address =      "London",
  year =         "1979",
  comment =      PRNNref,
}

@Book{Maritz.Lwin.89,
  author =       "J. S. Maritz and T. Lwin",
  title =        "Empirical {Bayes} Methods",
  publisher =    "Chapman \& Hall",
  address =      "London",
  edition =      "Second",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Marks.Dunn.74,
  author =       "S. Marks and O. J. Dunn",
  title =        "Discriminant functions when covariance matrices are
                 unequal",
  journal =      JASA,
  volume =       "69",
  pages =        "555--559",
  year =         "1974",
  comment =      PRNNref,
}

@Article{Maronna.76,
  author =       "R. A. Maronna",
  title =        "Robust {$M$}-estimators of multivariate location and
                 scatter",
  journal =      AnnStat,
  volume =       "4",
  pages =        "51--67",
  year =         "1976",
  comment =      PRNNref,
}

@Article{Marriott.75,
  author =       "F. H. C. Marriott",
  title =        "Separating mixtures of normal distributions",
  journal =      Biom,
  volume =       "31",
  pages =        "767--769",
  year =         "1975",
  comment =      PRNNref,
}

@InProceedings{Martin.Pitman.90,
  author =       "G. L. Martin and J. A. Pitman",
  title =        "Recognizing hand-printed letters and digits",
  crossref =     "NIPS2",
  pages =        "405--414",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Martin.Pitman.91,
  author =       "G. L. Martin and J. A. Pitman",
  title =        "Recognizing hand-printed letters and digits using
                 backpropagation learning",
  journal =      NC,
  volume =       "3",
  pages =        "258--267",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Massart.ZZ.83,
  author =       "D. L. Massart and F. Plastria and L. Kaufman",
  title =        "Non-hierarchical clustering with {MASLOC}",
  journal =      PR,
  volume =       "16",
  pages =        "507--516",
  year =         "1983",
  comment =      PRNNref,
}

@InProceedings{Mathieson.96,
  author =       "M. J. Mathieson",
  editor =       "A.-P. N. Refenes and Y. Abu-Mostafa and J. Moody
                  and A. Weigend",
  title =        "Ordinal models for neural networks",
  booktitle =    "Neural Networks in Financial Engineering.
                  Proceedings of the Third International Conference
                  on Neural Networks in the Capital Markets",
  publisher =    "World Scientific",
  address =      "Singapore",
  pages =        "523--536",
  year =         "1996",
  ISBN =         "981-02-2480-X",
  comment =      PRNNref,
}

@Article{Matus.92,
  author =       "F. Mat{\'u}{\v s}",
  title =        "On equivalence of {Markov} properties over undirected
                 graphs",
  journal =      "Journal of Applied Probability",
  volume =       "29",
  pages =        "745--749",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Max.60,
  author =       "J. Max",
  title =        "Quantizing for minimum distortion",
  journal =      "IRE Transactions on Information Theory",
  volume =       "6",
  pages =        "7--12",
  year =         "1960",
  comment =      PRNNref,
}

@Book{McCullagh.Nelder.89,
  author =       "P. McCullagh and J. A. Nelder",
  title =        "Generalized Linear Models",
  publisher =    "Chapman \& Hall",
  address =      "London",
  edition =      "Second",
  year =         "1989",
  comment =      PRNNref,
}

@Article{McCulloch.Pitts.43,
  author =       "W. S. McCulloch and W. Pitts",
  title =        "A logical calculus of the ideas immanent in nervous
                 activity",
  journal =      "Bulletin of Mathematical Biophysics",
  volume =       "5",
  pages =        "115--133",
  year =         "1943",
  note =         "[Reprinted in \cite{Anderson.Rosenfeld.88}]",
  comment =      PRNNref,
}

@Article{McKay.Campbell.82a,
  author =       "R. J. McKay and N. A. Campbell",
  title =        "Variable selection techniques in discriminant
                 analysis. {I}: Description",
  journal =      "British Journal of Mathematical and Statistical
                 Psychology",
  volume =       "35",
  pages =        "1--29",
  year =         "1982",
  comment =      PRNNunref,
}

@Article{McKay.Campbell.82b,
  author =       "R. J. McKay and N. A. Campbell",
  title =        "Variable selection techniques in discriminant
                 analysis. {II}: Allocation",
  journal =      "British Journal of Mathematical and Statistical
                 Psychology",
  volume =       "35",
  pages =        "30--41",
  year =         "1982",
  comment =      PRNNunref,
}

@Book{McLachlan.92,
  author =       "G. J. McLachlan",
  title =        "Discriminant Analysis and Statistical Pattern
                 Recognition",
  publisher =    Wiley,
  address =      "New York",
  year =         "1992",
  comment =      PRNNref,
}

@Book{McLachlan.Basford.88,
  author =       "G. J. McLachlan and K. E. Basford",
  title =        "Mixture Models: Inference and Applications to
                 Clustering",
  publisher =    "Marcel Dekker",
  address =      "New York",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Meinguet.79,
  author =       "J. Meinguet",
  title =        "Multivariate interpolation at arbitrary points made
                 simple",
  journal =      "Journal of Applied Mathematics and Physics (ZAMP)",
  volume =       "30",
  pages =        "292--304",
  year =         "1979",
  comment =      PRNNref,
}

@Book{Meisel.72,
  author =       "W. S. Meisel",
  title =        "Computer-Oriented Approaches to Pattern Recognition",
  publisher =    "Academic Press",
  address =      "New York",
  year =         "1972",
  comment =      PRNNunref,
}

@Article{Metropolis.ZZ.53,
  author =       "N. Metropolis and A. Rosenbluth and M. Rosenbluth and
                 A. Teller and E. Teller",
  title =        "Equation of state calculations by fast computing
                 machines",
  journal =      "Journal of Chemical Physics",
  volume =       "21",
  pages =        "1087--1091",
  year =         "1953",
  comment =      PRNNref,
}

@Article{Mhaskar.Micchelli.92,
  author =       "H. N. Mhaskar and C. A. Micchelli",
  title =        "Approximation by superposition of sigmoidal and radial
                 basis functions",
  journal =      "Advances in Applied Mathematics",
  volume =       "13",
  pages =        "350--373",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Michalski.80,
  author =       "R. S. Michalski",
  title =        "Pattern recognition as rule-guided inductive
                 inference",
  journal =      PAMI,
  volume =       "2",
  pages =        "349--361",
  year =         "1980",
  comment =      PRNNref,
}

@InProceedings{Michie.89,
  author =       "D. Michie",
  editor =       "J. R. Quinlan",
  booktitle =    "Applications of Expert Systems volume 2",
  title =        "Problems of computer-aided concept formation",
  publisher =    "Turing Institute Press/Addison-Wesley",
  address =      "Glasgow",
  pages =        "310--333",
  year =         "1989",
  comment =      PRNNunref,
}

@Book{Michie.ZZ.94,
  editor =       "D. Michie and D. J. Spiegelhalter and C. C. Taylor",
  title =        "Machine Learning, Neural and Statistical
                 Classification",
  publisher =    "Ellis Horwood",
  address =      "New York",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Mingers.87,
  author =       "J. Mingers",
  title =        "Expert systems---rule induction with statistical
                 data",
  journal =      "Journal of the Operational Research Society",
  volume =       "38",
  pages =        "39--47",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Minnick.61,
  author =       "R. C. Minnick",
  title =        "Linear-input logic",
  journal =      "IRE Transactions on Electronic Computers",
  volume =       "10",
  pages =        "6--16",
  year =         "1961",
  comment =      PRNNref,
}

@Article{Minsky.61,
  author =       "M. Minsky",
  title =        "Steps toward artificial intelligence",
  journal =      "Proceedings of the IRE",
  volume =       "49",
  pages =        "8--30",
  year =         "1961",
  comment =      PRNNref,
}

@Book{Minsky.Papert.88,
  author =       "M. L. Minsky and S. A. Papert",
  title =        "Perceptrons. An Introduction to Computational
                 Geometry",
  publisher =    "The MIT Press",
  address =      "Cambridge, MA",
  edition =      "Expanded",
  year =         "1988",
  ISBN =         "0-262-63111-3",
  comment =      PRNNref,
}

@Article{Moller.93,
  author =       "M. M{\o}ller",
  title =        "A scaled conjugate gradient algorithm for fast
                 supervised learning",
  journal =      NNks,
  volume =       "6",
  pages =        "525--533",
  year =         "1993",
  comment =      PRNNref,
}

@InProceedings{Moody.89,
  author =       "J. E. Moody",
  title =        "Fast learning in multi-resolution hierarchies",
  crossref =     "NIPS1",
  pages =        "29--39",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Moody.91,
  author =       "J. E. Moody",
  booktitle =    "First IEEE-SP Workshop on Neural Networks in Signal
                 Processing",
  title =        "Note on generalization, regularization and
                 architecture selection in nonlinear learning systems",
  publisher =    "IEEE Computer Society Press",
  address =      "Los Alamitos, CA",
  pages =        "1--10",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Moody.92,
  author =       "J. E. Moody",
  title =        "The \emph{effective} number of parameters: an analysis
                 of generalization and regularization in nonlinear
                 learning systems",
  crossref =     "NIPS4",
  pages =        "847--854",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Moody.Darken.89,
  author =       "J. Moody and C. J. Darken",
  title =        "Fast learning in networks of locally-tuned processing
                 units",
  journal =      NC,
  volume =       "1",
  pages =        "281--294",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Moody.Utans.92,
  author =       "J. Moody and J. Utans",
  title =        "Principled architecture selection for neural networks:
                 application to corporate bond rating prediction",
  crossref =     "NIPS4",
  pages =        "683--690",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Moody.Utans.95,
  author =       "J. Moody and J. Utans",
  editor =       "A.-P. Refenes",
  booktitle =    "Neural Networks in the Capital Markets",
  title =        "Architecture selection strategies for neural networks:
                 application to corporate bond rating prediction",
  publisher =    Wiley,
  address =      "Chichester",
  pages =        "277--300",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Moore.89,
  author =       "B. Moore",
  editor =       "D. Touretzky and G. Hinton and T. Sejnowski",
  booktitle =    "Proceedings of the 1988 Connectionist Models Summer
                 School",
  title =        "{ART} 1 and pattern clustering",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "174--185",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Moran.Murphy.79,
  author =       "M. A. Moran and B. J. Murphy",
  title =        "A closer look at two alternative methods of
                 statistical discrimination",
  journal =      ApplStat,
  volume =       "28",
  pages =        "223--232",
  year =         "1979",
  comment =      PRNNref,
}

@Unpublished{Morgan.Messenger.73,
  author =       "J. N. Morgan and R. C. Messenger",
  title =        "\emph{THAID}: a Sequential Search Program for the
                 Analysis of Nominal Scale Dependent Variables",
  year =         "1973",
  note =         "Survey Research Center, Institute for Social Research,
                 University of Michigan",
  comment =      PRNNref,
}

@Article{Morgan.Sonquist.63,
  author =       "J. N. Morgan and J. A. Sonquist",
  title =        "Problems in the analysis of survey data, and a
                 proposal",
  journal =      JASA,
  volume =       "58",
  pages =        "415--434",
  year =         "1963",
  comment =      PRNNref,
}

@Article{Morin.Raeside.81,
  author =       "R. L. Morin and D. E. Raeside",
  title =        "A reappraisal of distance-weighted $k$-nearest
                 neighbor classification for pattern recognition with
                 missing data",
  journal =      SMC,
  volume =       "11",
  pages =        "241--243",
  year =         "1981",
  comment =      PRNNref,
}

@Article{Mosteller.Wallace.63,
  author =       "F. Mosteller and D. L. Wallace",
  title =        "Inference in an authorship problem",
  journal =      JASA,
  volume =       "58",
  pages =        "275--309",
  year =         "1963",
  comment =      PRNNref,
}

@Article{Moulton.91,
  author =       "B. R. Moulton",
  title =        "A {Bayesian} approach to regression selection and
                 estimation with application to a price index for radio
                 services",
  journal =      "Journal of Econometrics",
  volume =       "49",
  pages =        "169--193",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Moussouris.74,
  author =       "J. Moussouris",
  title =        "{Gibbs} and {Markov} random systems with constraints",
  journal =      "Journal of Statistical Physics",
  volume =       "10",
  pages =        "11--33",
  year =         "1974",
  comment =      PRNNref,
}

@InProceedings{Murata.ZZ.91,
  author =       "N. Murata and S. Yoshizawa and S. Amari",
  editor =       "T. Kohonen and K. M{\"a}kisara and O. Simula and J.
                 Kangas",
  booktitle =    "Artificial Neural Networks. Proceedings of ICANN-91",
  title =        "A criterion for determining the number of parameters
                 in an artificial neural network model",
  volume =       "I",
  publisher =    "North Holland",
  address =      "Amsterdam",
  pages =        "9--14",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Murata.ZZ.93,
  author =       "N. Murata and S. Yoshizawa and S. Amari",
  title =        "Learning curves, model selection and complexity of
                 neural networks",
  crossref =     "NIPS5",
  pages =        "607--614",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Murata.ZZ.94,
  author =       "N. Murata and S. Yoshizawa and S. Amari",
  title =        "Network information criterion---determining the number
                 of hidden units for artificial neural network models",
  journal =      TNN,
  volume =       "5",
  pages =        "865--872",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Muroga.65,
  author =       "S. Muroga",
  title =        "Lower bounds of the number of threshold functions and a
                 maximum weight",
  journal =      IEEC,
  volume =       "14",
  pages =        "136--148",
  year =         "1965",
  comment =      PRNNunref,
}

@Book{Muroga.71,
  author =       "S. Muroga",
  title =        "Threshold Logic and its Applications",
  publisher =    Wiley,
  address =      "New York",
  year =         "1971",
  comment =      PRNNref,
}

@Article{Muroga.ZZ.61,
  author =       "S. Muroga and I. Toda and S. Takasu",
  title =        "Theory of majority decision elements",
  journal =      "Journal of the Franklin Institute",
  volume =       "271",
  pages =        "376--418",
  year =         "1961",
  comment =      PRNNunref,
}

@TechReport{Murphy.Aha.95,
  author =       "P. M. Murphy and D. W. Aha",
  title =        "\emph{UCI Repository of Machine Learning Databases}",
  type =         "Machine-readable collection",
  institution =  "Dept of Information and Computer Science, University
                 of California, Irvine",
  year =         "1995",
  note =         "[Available by anonymous ftp from {\tt ics.uci.edu} in
                 directory {\tt pub/machine-learning-databases}]",
  comment =      PRNNref,
}

@Article{Murtagh.85,
  author =       "F. Murtagh",
  title =        "A survey of algorithms for contiguity-constrained
                 clustering and related problems",
  journal =      "Computer Journal",
  volume =       "28",
  pages =        "82--88",
  year =         "1985",
  comment =      PRNNref,
}

@InProceedings{Murtagh.95a,
  author =       "F. Murtagh",
  editor =       "I. J. Cox and P. Hansen and B. Julesz",
  booktitle =    "Partitioning Data Sets",
  title =        "Contiguity-constrained hierarchical clustering",
  publisher =    "American Mathematical Society",
  address =      "Providence, RI",
  pages =        "143--152",
  year =         "1995",
  series =       "DIMACS",
  comment =      PRNNref,
}

@Article{Murtagh.95b,
  author =       "F. Murtagh",
  title =        "Interpreting the {Kohonen} self-organizing feature map
                 using contiguity-constrained clustering",
  journal =      PRL,
  volume =       "16",
  pages =        "399--408",
  year =         "1995",
  comment =      PRNNref,
}

@InProceedings{Murthy.66,
  author =       "V. K. Murthy",
  editor =       "P. R. Krishnaiah",
  booktitle =    "Multivariate Analysis",
  title =        "Nonparametric estimation of multivariate densities
                 with applications",
  publisher =    "Academic Press",
  address =      "New York",
  pages =        "43--56",
  year =         "1966",
  comment =      PRNNunref,
}

@Article{Musavi.ZZ.92,
  author =       "M. T. Musavi and W. Ahmed and K. H. Chan and K. B.
                 Faris and D. M. Hummels",
  title =        "On the training of radial basis function classifiers",
  journal =      NNks,
  volume =       "5",
  pages =        "595--603",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Myles.Hand.90,
  author =       "J. P. Myles and D. J. Hand",
  title =        "The multiclass metric problem in nearest neighbour
                 discrimination rules",
  journal =      PR,
  volume =       "23",
  pages =        "1291--1297",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Narendra.Fukunaga.77,
  author =       "P. M. Narendra and K. Fukunaga",
  title =        "A branch and bound algorithm for feature subset
                 selection",
  journal =      IEC,
  volume =       "26",
  pages =        "917--922",
  year =         "1977",
  comment =      PRNNref,
}

@Book{Nash.90,
  author =       "J. C. Nash",
  title =        "Compact Numerical Methods for Computers. Linear
                 Algebra and Function Minimization",
  publisher =    "Adam Hilger",
  address =      "Bristol",
  edition =      "Second",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Neal.92a,
  author =       "R. M. Neal",
  title =        "Connectionist learning of belief networks",
  journal =      AI,
  volume =       "56",
  pages =        "71--113",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Neal.92b,
  author =       "R. M. Neal",
  title =        "Asymmetric parallel {Boltzmann} machines are belief
                 networks",
  journal =      NC,
  volume =       "4",
  pages =        "832--834",
  year =         "1992",
  comment =      PRNNref,
}

@InProceedings{Neal.93,
  author =       "R. M. Neal",
  title =        "{Bayesian} learning via stochastic dynamics",
  crossref =     "NIPS5",
  pages =        "475--482",
  year =         "1993",
  comment =      PRNNref,
}

@PhdThesis{Neal.95,
  author =       "R. M. Neal",
  title =        "{Bayesian} Learning for Neural Networks",
  school =       "Department of Computer Science, University of
                 Toronto",
  year =         "1995",
  comment =      PRNNref,
}

@Book{Neal.96,
  author =       "R. M. Neal",
  title =        "{Bayesian} Learning for Neural Networks",
  year =         "1996",
  publisher =    Springer,
  address =      "New York",
  series       = "Lecture Notes in Statistics",
  number       = "118",
  comment =      PRNNref,
}

@Book{Neapolitan.90,
  author =       "R. E. Neapolitan",
  title =        "Probabilistic Reasoning in Expert Systems. Theory and
                 Algorithms",
  publisher =    Wiley,
  address =      "New York",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Niblett.87,
  author =       "T. Niblett",
  editor =       "I. Bratko and N. Lavra{\v c}",
  booktitle =    "Progress in Machine Learning",
  title =        "Constructing decision trees in noisy domains",
  publisher =    "Sigma Press",
  address =      "Wilmslow",
  pages =        "67--78",
  year =         "1987",
  comment =      PRNNref,
}

@inproceedings{Niblett.Bratko.87,
  author = {T. Niblett and I. Bratko},
  editor = {M. A. Bramer},
  booktitle = {Research and Development in Expert Systems III. Proceedings of
    Expert Systems '86, Brighton 1986},
  title = {Learning decision rules in noisy domains},
  publisher = {Cambridge University Press},
  address = {Cambridge},
  pages = {25--34},
  year = {1987},
  comment = PRNNunref,
}

@article{Niemann.Goppert.88,
  author = {H. Niemann and G. Goppert},
  title = {An efficient branch-and-bound nearest neighbour classifier},
  journal = PRL,
  volume = {7},
  pages = {67--72},
  year = {1988},
  note = NNset,
  comment = PRNNref,
}

@inproceedings{Nowlan.Hinton.92a,
  author = {S. J. Nowlan and G. E. Hinton},
  title = {Adaptive soft weight tying using {Gaussian} mixtures},
  crossref = {NIPS4},
  pages = {993--1000},
  year = {1992},
  comment = PRNNref,
}

@article{Nowlan.Hinton.92b,
  author = {S. J. Nowlan and G. E. Hinton},
  title = {Simplifying neural networks by soft weight-sharing},
  journal = NC,
  volume = {4},
  pages = {473--493},
  year = {1992},
  note = {[Reprinted with an introduction as pp. 369--394 of \cite{Wolpert.95}]},
  comment = PRNNref,
}

@article{Oja.82,
  author = {E. Oja},
  title = {A simplified neuron model as a principal component analyzer},
  journal = {Journal of Mathematical Biology},
  volume = {16},
  pages = {267--273},
  year = {1982},
  comment = PRNNref,
}

@article{Oja.89,
  author = {E. Oja},
  title = {Neural networks, principal components and subspaces},
  journal = IJNS,
  volume = {1},
  pages = {61--68},
  year = {1989},
  comment = PRNNref,
}

@article{Oja.92,
  author = {E. Oja},
  title = {Principal components, minor components and linear neural networks},
  journal = NNks,
  volume = {5},
  pages = {927--935},
  year = {1992},
  comment = PRNNref,
}

% The journal's title is "Journal of Mathematical Analysis and Applications"
% (there is no "its" in the name).
@Article{Oja.Karhunen.85,
  author =       "E. Oja and J. Karhunen",
  title =        "On stochastic-approximation of the eigenvectors and
                 eigenvalues of the expectation of a random matrix",
  journal =      "Journal of Mathematical Analysis and Applications",
  volume =       "106",
  pages =        "69--84",
  year =         "1985",
  comment =      PRNNref,
}

@article{Olesen.93,
  author = {K. G. Olesen},
  title = {Causal probabilistic networks with both discrete and continuous variables},
  journal = PAMI,
  volume = {15},
  pages = {275--279},
  year = {1993},
  comment = PRNNref,
}

@article{Oliver.ZZ.79,
  author = {L. H. Oliver and R. S. Poulsen and G. T. Toussaint and C. Louis},
  title = {Classification of atypical cells in the automated cytoscreening for
    cervical cancer},
  journal = PR,
  volume = {11},
  pages = {205--212},
  year = {1979},
  comment = PRNNunref,
}

% Title wording ("variables") and first page (448) follow the published
% article in volume 32 of the journal.
@Article{Olkin.Tate.61,
  author =       "I. Olkin and R. F. Tate",
  title =        "Multivariate correlation models with mixed discrete
                 and continuous variables",
  journal =      AnnMathStat,
  volume =       "32",
  pages =        "448--465",
  year =         "1961",
  comment =      PRNNref,
}

@article{Ooyen.Nienhuis.92,
  author = {A. van Ooyen and B. Nienhuis},
  title = {Improving the convergence of the back-propagation algorithm},
  journal = NNks,
  volume = {5},
  pages = {465--471},
  year = {1992},
  note = {[See also letter to the editor and response, \textbf{6}, 611--612]},
  comment = PRNNref,
}

@article{Ott.89,
  author = {J. Ott},
  title = {Computer-simulation methods in human linkage analysis},
  journal = PNAS,
  volume = {86},
  pages = {4175--4178},
  year = {1989},
  comment = PRNNref,
}

% Title as published: "A neighbourhood-based classifier for LANDSAT data".
@Article{Owen.84,
  author =       "A. Owen",
  title =        "A neighbourhood-based classifier for {LANDSAT} data",
  journal =      "Canadian Journal of Statistics",
  volume =       "12",
  pages =        "191--200",
  year =         "1984",
  comment =      PRNNref,
}

% The booktitle carries no trailing punctuation: the bibliography style
% supplies the separator, so a comma stored here would be doubled in output.
@InProceedings{Owens.Filkin.89,
  author =       "A. J. Owens and D. L. Filkin",
  booktitle =    "Proceedings of the International Conference on Neural
                 Networks (Washington, 1989)",
  title =        "Efficient training of the back propagation network by
                 solving a system of stiff ordinary differential
                 equations",
  volume =       "II",
  publisher =    "IEEE Press",
  address =      "New York",
  pages =        "381--386",
  year =         "1989",
  comment =      PRNNref,
}

@inproceedings{Pagallo.89,
  author = {G. Pagallo},
  editor = {N. Sridharan},
  booktitle = {Proceedings of the 11th International Joint Conference on Artificial
    Intelligence (Detroit, 1989)},
  title = {Learning {DNF} by decision trees},
  publisher = MK,
  address = {San Mateo, CA},
  pages = {639--644},
  year = {1989},
  comment = PRNNref,
}

@inproceedings{Pagallo.Haussler.89,
  author = {G. Pagallo and D. Haussler},
  editor = {A. M. Segre},
  booktitle = {Proceedings of the Sixth International Workshop on Machine Learning
    (Ithaca, 1989)},
  title = {Two algorithms that learn {DNF} by discovering relevant features},
  publisher = MK,
  address = {San Mateo, CA},
  pages = {119--123},
  year = {1989},
  comment = PRNNref,
}

@article{Pagallo.Haussler.90,
  author = {G. Pagallo and D. Haussler},
  title = {Boolean feature discovery in empirical learning},
  journal = ML,
  volume = {5},
  pages = {71--99},
  year = {1990},
  comment = PRNNref,
}

@article{Park.Sandberg.91,
  author = {J. Park and I. W. Sandberg},
  title = {Universal approximation using radial-basis-function networks},
  journal = NC,
  volume = {3},
  pages = {246--257},
  year = {1991},
  comment = PRNNref,
}

% The first author's surname is spelt "Parthasarathy". The citation key keeps
% its historical spelling so that existing \cite commands still resolve.
@Article{Parthasarthy.Chatterji.90,
  author =       "G. Parthasarathy and B. N. Chatterji",
  title =        "A class of new {KNN} methods for low sample problems",
  journal =      SMC,
  volume =       "20",
  pages =        "715--718",
  year =         "1990",
  comment =      PRNNref,
}

@book{Parberry.94,
  author = {I. Parberry},
  title = {Circuit Complexity and Neural Networks},
  publisher = {MIT Press},
  address = {Cambridge, MA},
  year = {1994},
  ISBN = {0-262-16148-6},
  comment = PRNNref,
}

% The second author's surname is "Van den Broeck"; it is braced so BibTeX
% treats it as a single last name. The citation key keeps its historical
% spelling so that existing \cite commands still resolve. The journal name is
% written out in full, as for the other journals in this file.
@Article{Parrondo.VanderBroeck.93,
  author =       "J. M. R. Parrondo and C. {Van den Broeck}",
  title =        "{Vapnik}-{Chervonenkis} bounds for generalization",
  journal =      "Journal of Physics A: Mathematical and General",
  volume =       "26",
  pages =        "2211--2223",
  year =         "1993",
  comment =      PRNNref,
}

@article{Parzen.62,
  author = {E. Parzen},
  title = {On the estimation of a probability density function and mode},
  journal = AnnMathStat,
  volume = {33},
  pages = {1065--1076},
  year = {1962},
  comment = PRNNref,
}

% The second author's surname is spelt "Fischer". The citation key keeps its
% historical spelling so that existing \cite commands still resolve.
@Article{Patrick.Fisher.69,
  author =       "E. A. Patrick and F. P. {Fischer II}",
  title =        "Nonparametric feature selection",
  journal =      IEIT,
  volume =       "15",
  pages =        "577--584",
  year =         "1969",
  comment =      PRNNref,
}

@book{Patterson.Niblett.83,
  author = {A. Patterson and T. Niblett},
  title = {{ACLS} User Manual},
  publisher = {Intelligent Terminals Ltd},
  address = {Glasgow},
  year = {1983},
  comment = PRNNunref,
}

@article{Pavlidis.93,
  author = {T. Pavlidis},
  title = {Recognition of printed text under realistic conditions},
  journal = PRL,
  volume = {14},
  pages = {317--326},
  year = {1993},
  comment = PRNNref,
}

@article{Payne.Meisel.77,
  author = {H. J. Payne and W. S. Meisel},
  title = {An algorithm for constructing optimal binary decision trees},
  journal = IEC,
  volume = {26},
  pages = {905--916},
  year = {1977},
  comment = PRNNref,
}

% Title as published: "... classifiers with limited complexity".
@Article{Pearl.79,
  author =       "J. Pearl",
  title =        "Capacity and error estimates for {Boolean} classifiers
                 with limited complexity",
  journal =      PAMI,
  volume =       "1",
  pages =        "350--356",
  year =         "1979",
  comment =      PRNNref,
}

@inproceedings{Pearl.82,
  author = {J. Pearl},
  editor = {D. Waltz},
  booktitle = {Proceedings of the AAAI National Conference on Artificial Intelligence
    (Pittsburgh, 1982)},
  title = {Reverend {Bayes} on inference engines: a distributed hierarchical approach},
  publisher = {AAAI},
  address = {Menlo Park, CA},
  pages = {133--136},
  year = {1982},
  comment = PRNNref,
}

@article{Pearl.86,
  author = {J. Pearl},
  title = {Fusion, propagation, and structuring in belief networks},
  journal = AI,
  volume = {29},
  pages = {241--288},
  year = {1986},
  note = URset,
  comment = PRNNref,
}

@article{Pearl.87,
  author = {J. Pearl},
  title = {Evidential reasoning using stochastic simulation of causal models},
  journal = AI,
  volume = {32},
  pages = {245--257},
  year = {1987},
  comment = PRNNref,
}

% The book's title is "Probabilistic Reasoning in Intelligent Systems"
% (not "Probabilistic Inference ...").
@Book{Pearl.88,
  author =       "J. Pearl",
  title =        "Probabilistic Reasoning in Intelligent Systems.
                 Networks of Plausible Inference",
  publisher =    MK,
  address =      "San Mateo, CA",
  year =         "1988",
  comment =      PRNNref,
}

@article{Pearl.93a,
  author = {J. Pearl},
  title = {Belief networks revisited},
  journal = AI,
  volume = {59},
  pages = {49--56},
  year = {1993},
  comment = PRNNref,
}

@misc{Pearl.93b,
  author = {J. Pearl},
  title = {Graphical models, causality and intervention},
  year = {1993},
  note = {Contribution to the discussion of \cite{Spiegelhalter.ZZ.93}},
  comment = PRNNref,
}

@inproceedings{Pearl.95,
  author = {J. Pearl},
  title = {From {Bayesian} networks to causal networks},
  crossref = {Gammerman.95},
  pages = {1--31},
  year = {1995},
  comment = PRNNref,
}

@article{Pearlmutter.94,
  author = {B. A. Pearlmutter},
  title = {Fast exact multiplication by the {Hessian}},
  journal = NC,
  volume = {6},
  pages = {147--160},
  year = {1994},
  comment = PRNNref,
}

@inproceedings{Pearlmutter.Rosenfeld.91,
  author = {B. A. Pearlmutter and R. Rosenfeld},
  title = {{Chaitin--Kolmogorov} complexity and generalization in neural networks},
  crossref = {NIPS3},
  pages = {925--931},
  year = {1991},
  comment = PRNNref,
}

@article{Peck.ZZ.89,
  author = {R. Peck and L. Fisher and J. {Van Ness}},
  title = {Approximate confidence intervals for the number of clusters},
  journal = JASA,
  volume = {84},
  pages = {184--191},
  year = {1989},
  comment = PRNNref,
}

@techreport{Peng.ZZ.94,
  author = {F. Peng and R. A. Jacobs and M. A. Tanner},
  title = {{Bayesian} inference in mixtures-of-experts and hierarchical
    mixtures-of-experts architectures},
  institution = {Dept of Biostatistics, University of Rochester, NY},
  year = {1994},
  comment = PRNNref,
}

@article{Penrod.Wagner.77,
  author = {C. S. Penrod and T. J. Wagner},
  title = {Another look at the edited nearest neighbor rule},
  journal = SMC,
  volume = {7},
  pages = {92--94},
  year = {1977},
  comment = PRNNref,
}

@book{Peretto.92,
  author = {P. Peretto},
  title = {An Introduction to the Modeling of Neural Networks},
  publisher = {Cambridge University Press},
  address = {Cambridge},
  year = {1992},
  comment = PRNNref,
}

@inproceedings{Perrone.Cooper.93,
  author = {M. P. Perrone and L. N. Cooper},
  title = {When networks disagree: Ensemble methods for hybrid neural networks},
  crossref = {Mammone.93},
  pages = {126--142},
  year = {1993},
  comment = PRNNref,
}

% Title as published begins "Optimum" (not "Optimal").
@Article{Peskun.73,
  author =       "P. H. Peskun",
  title =        "Optimum {Monte-Carlo} sampling using {Markov} chains",
  journal =      Bka,
  volume =       "60",
  pages =        "607--612",
  year =         "1973",
  comment =      PRNNref,
}

@article{Peterson.Anderson.87,
  author = {C. Peterson and J. R. Anderson},
  title = {A mean field learning algorithm for neural networks},
  journal = ComSys,
  volume = {1},
  pages = {995--1019},
  year = {1987},
  comment = PRNNref,
}

@book{Pitas.93,
  editor = {I. Pitas},
  title = {Parallel Algorithms for Digital Image Processing, Computer Vision and
    Neural Networks},
  publisher = Wiley,
  address = {Chichester},
  year = {1993},
  comment = PRNNref,
}

@article{Ploughman.Boehnke.89,
  author = {L. M. Ploughman and M. Boehnke},
  title = {Estimating the power of a proposed linkage study for a complex genetic trait},
  journal = {American Journal of Human Genetics},
  volume = {44},
  pages = {543--551},
  year = {1989},
  comment = PRNNref,
}

@article{Poggio.Girosi.90a,
  author = {T. Poggio and F. Girosi},
  title = {Regularization algorithms for learning that are equivalent to multilayer
    networks},
  journal = {Science},
  volume = {247},
  pages = {978--982},
  year = {1990},
  comment = PRNNref,
}

@article{Poggio.Girosi.90b,
  author = {T. Poggio and F. Girosi},
  title = {Networks for approximation and learning},
  journal = PIEEE,
  volume = {78},
  pages = {1481--1497},
  year = {1990},
  note = rep-Lau,
  comment = PRNNref,
}

@book{Pollard.84,
  author = {D. Pollard},
  title = {Convergence of Stochastic Processes},
  publisher = Springer,
  address = {New York},
  year = {1984},
  comment = PRNNref,
}

@techreport{Pollard.86,
  author = {D. Pollard},
  title = {Rates of uniform almost-sure convergence for empirical processes indexed
    by unbounded classes of functions},
  type = {Unpublished paper},
  institution = {Dept of Statistics, Yale University},
  year = {1986},
  comment = PRNNref,
}

@book{Pollard.90,
  author = {D. Pollard},
  title = {Empirical Processes: Theory and Applications},
  publisher = {Institute of Mathematical Statistics and American Statistical Association},
  address = {Hayward, CA},
  year = {1990},
  comment = PRNNref,
}

@article{Posse.90,
  author = {C. Posse},
  title = {An effective two-dimensional projection pursuit algorithm},
  journal = {Communications in Statistics---Simulation and Computation},
  volume = {19},
  pages = {1143--1164},
  year = {1990},
  comment = PRNNref,
}

@article{Posse.95a,
  author = {C. Posse},
  title = {Tools for two-dimensional exploratory projection pursuit},
  journal = JCGS,
  volume = {4},
  pages = {83--100},
  year = {1995},
  comment = PRNNref,
}

@article{Posse.95b,
  author = {C. Posse},
  title = {Projection pursuit exploratory data analysis},
  journal = CSDA,
  year = {1995},
  comment = PRNNunref,
}

@inproceedings{Powell.87,
  author = {M. J. D. Powell},
  editor = {J. C. Mason and M. G. Cox},
  booktitle = {Algorithms for Approximation},
  title = {Radial basis functions for multivariable interpolation: a review},
  publisher = {Clarendon Press},
  address = {Oxford},
  pages = {143--167},
  year = {1987},
  comment = PRNNref,
}

@inproceedings{Powell.92,
  author = {M. J. D. Powell},
  editor = {W. Light},
  booktitle = {Advances in Numerical Analysis},
  title = {The theory of radial function approximation in 1990},
  volume = {II},
  publisher = {Clarendon Press},
  address = {Oxford},
  pages = {105--210},
  year = {1992},
  comment = PRNNref,
}

% The city is spelt "Karlsruhe".
@TechReport{Prechelt.94,
  author =       "L. Prechelt",
  title =        "A study of experimental evaluation of current neural
                 network learning algorithms: current research
                 practice",
  number =       "19/94",
  institution =  "Fakult{\"a}t f{\"u}r Informatik, Universit{\"a}t
                 Karlsruhe",
  year =         "1994",
  comment =      PRNNref,
}

@article{Prentice.Pyke.79,
  author = {R. Prentice and R. Pyke},
  title = {Logistic disease incidence models and case-control studies},
  journal = Bka,
  volume = {66},
  pages = {403--411},
  year = {1979},
  comment = PRNNref,
}

@book{Preparata.Shamos.85,
  author = {F. P. Preparata and M. I. Shamos},
  title = {Computational Geometry. An Introduction},
  publisher = Springer,
  address = {New York},
  year = {1985},
  comment = PRNNref,
}

% Authors are listed in the order used on the second edition
% (Press, Teukolsky, Vetterling, Flannery), which differs from the first.
@Book{Press.ZZ.92,
  author =       "W. H. Press and S. A. Teukolsky and W. T. Vetterling and
                 B. P. Flannery",
  title =        "Numerical Recipes in {C}",
  publisher =    "Cambridge University Press",
  address =      "Cambridge",
  edition =      "Second",
  year =         "1992",
  comment =      PRNNref,
}

@book{Preston.74,
  author = {C. J. Preston},
  title = {{Gibbs} States on Countable Sets},
  publisher = {Cambridge University Press},
  address = {London},
  year = {1974},
  comment = PRNNunref,
}

@book{Preston.76,
  author = {C. J. Preston},
  title = {Random Fields},
  volume = {534},
  publisher = Springer,
  address = {Berlin},
  year = {1976},
  series = {Lecture Notes in Mathematics},
  comment = PRNNref,
}

@book{Przytula.Prasanna.93,
  author = {K. W. Przytula and V. K. Prasanna},
  title = {Parallel Digital Implementation of Neural Networks},
  publisher = {Prentice Hall},
  address = {Englewood Cliffs, NJ},
  year = {1993},
  comment = PRNNunref,
}

@article{Quenouille.49,
  author = {M. H. Quenouille},
  title = {Approximate tests of correlation in time series},
  journal = JRSSB,
  volume = {11},
  pages = {68--84},
  year = {1949},
  comment = PRNNref,
}

@inproceedings{Quinlan.79,
  author = {J. R. Quinlan},
  editor = {D. Michie},
  booktitle = {Expert Systems in the Microelectronic Age},
  title = {Discovering rules by induction from large collections of examples},
  publisher = {Edinburgh University Press},
  address = {Edinburgh},
  pages = {168--201},
  year = {1979},
  comment = PRNNunref,
}

@inproceedings{Quinlan.83,
  author = {J. R. Quinlan},
  editor = {R. S. Michalski and J. G. Carbonell and T. M. Mitchell},
  booktitle = {Machine Learning},
  title = {Learning efficient classification procedures and their application to
    chess end-games},
  publisher = {Tioga},
  address = {Palo Alto, CA},
  pages = {463--482},
  year = {1983},
  comment = PRNNunref,
}

@article{Quinlan.86,
  author = {J. R. Quinlan},
  title = {Induction of decision trees},
  journal = ML,
  volume = {1},
  pages = {81--106},
  year = {1986},
  note = MLset,
  comment = PRNNref,
}

@article{Quinlan.87a,
  author = {J. R. Quinlan},
  title = {Simplifying decision trees},
  journal = {International Journal of Man--Machine Studies},
  volume = {27},
  pages = {221--234},
  year = {1987},
  comment = PRNNref,
}

% Page range added so the entry is as complete as the other conference papers
% in this file. NOTE(review): confirm 304--307 against the proceedings.
@InProceedings{Quinlan.87b,
  author =       "J. R. Quinlan",
  editor =       "J. McDermott",
  booktitle =    "Proceedings of the Tenth International Joint
                 Conference on Artificial Intelligence (Milan, 1987)",
  title =        "Generating production rules from decision trees",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "304--307",
  year =         "1987",
  comment =      PRNNref,
}

@inproceedings{Quinlan.88,
  author = {J. R. Quinlan},
  editor = {J. E. Hayes and D. Michie and J. Richards},
  booktitle = {Machine Intelligence 11},
  title = {Decision trees and multi-valued attributes},
  publisher = {Clarendon Press},
  address = {Oxford},
  pages = {305--318},
  year = {1988},
  comment = PRNNref,
}

@article{Quinlan.90,
  author = {J. R. Quinlan},
  title = {Decision trees and decision making},
  journal = SMC,
  volume = {20},
  pages = {339--346},
  year = {1990},
  comment = PRNNref,
}

@book{Quinlan.93,
  author = {J. R. Quinlan},
  title = {{C4}.5: Programs for Machine Learning},
  publisher = MK,
  address = {San Mateo, CA},
  year = {1993},
  comment = PRNNref,
}

@techreport{Raftery.93,
  author = {A. E. Raftery},
  title = {Approximate {Bayes} factors and accounting for model uncertainty in
    generalized linear models},
  number = {255},
  institution = {Dept of Statistics, University of Washington},
  year = {1993},
  comment = PRNNref,
}

@article{Rao.48,
  author = {C. R. Rao},
  title = {The utilization of multiple measurements in problems of biological
    classification (with discussion)},
  journal = JRSSB,
  volume = {10},
  pages = {159--203},
  year = {1948},
  comment = PRNNref,
}

@article{Rao.60,
  author = {C. R. Rao},
  title = {Multivariate analysis: an indispensable statistical aid in applied research},
  journal = {Sankhy{\=a}},
  volume = {22},
  pages = {317--338},
  year = {1960},
  comment = PRNNref,
}

@article{Rayens.Greene.91,
  author = {W. Rayens and T. Greene},
  title = {Covariance pooling and stabilization for classification},
  journal = CSDA,
  volume = {11},
  pages = {17--42},
  year = {1991},
  comment = PRNNref,
}

@article{Redner.Walker.84,
  author = {R. A. Redner and H. F. Walker},
  title = {Mixture densities, maximum likelihood and the {EM} algorithm},
  journal = {SIAM Review},
  volume = {26},
  pages = {195--239},
  year = {1984},
  comment = PRNNref,
}

@article{Reed.93,
  author = {R. Reed},
  title = {Pruning algorithms---a survey},
  journal = TNN,
  volume = {4},
  pages = {740--747},
  year = {1993},
  comment = PRNNref,
}

@article{Reilly.ZZ.82,
  author = {D. L. Reilly and L. N. Cooper and C. Elbaum},
  title = {A neural model for category learning},
  journal = BioCyb,
  volume = {45},
  pages = {35--41},
  year = {1982},
  note = {[Reprinted in \cite{Anderson.ZZ.90}]},
  comment = PRNNref,
}

% The technique named in the title is "discriminant analysis".
@Article{Richards.72,
  author =       "L. E. Richards",
  title =        "Refinement and extension of distribution-free
                 discriminant analysis",
  journal =      ApplStat,
  volume =       "21",
  pages =        "174--176",
  year =         "1972",
  comment =      PRNNref,
}

@article{Riffenburgh.Clunies-Ross.60,
  author = {R. H. Riffenburgh and C. W. Clunies-Ross},
  title = {Linear discriminant analysis},
  journal = {Pacific Science},
  volume = {14},
  pages = {251--256},
  year = {1960},
  comment = PRNNunref,
}

@inproceedings{Rimey.Brown.92,
  author = {R. Rimey and C. Brown},
  editor = {A. Blake and A. Yuille},
  booktitle = {Active Vision},
  title = {Task-oriented vision with multiple {Bayes} nets},
  publisher = {The MIT Press},
  address = {Cambridge, MA},
  pages = {217--236},
  year = {1992},
  comment = PRNNref,
}

@article{Ripley.77,
  author = {B. D. Ripley},
  title = {Modelling spatial patterns (with discussion)},
  journal = JRSSB,
  volume = {39},
  pages = {172--212},
  year = {1977},
  comment = PRNNref,
}

@article{Ripley.79,
  author = {B. D. Ripley},
  title = {Algorithm {AS137}. {Simulating} spatial patterns: dependent samples from a
    multivariate density},
  journal = ApplStat,
  volume = {28},
  pages = {109--112},
  year = {1979},
  comment = PRNNref,
}

@book{Ripley.87,
  author = {B. D. Ripley},
  title = {Stochastic Simulation},
  publisher = Wiley,
  address = {New York},
  year = {1987},
  ISBN = {0-471-81884-4},
  comment = PRNNref,
}

@book{Ripley.88,
  author = {B. D. Ripley},
  title = {Statistical Inference for Spatial Processes},
  publisher = {Cambridge University Press},
  address = {Cambridge},
  year = {1988},
  comment = PRNNref,
}

@inproceedings{Ripley.93,
  author = {B. D. Ripley},
  editor = {O. E. Barndorff-Nielsen and J. L. Jensen and W. S. Kendall},
  booktitle = {Networks and Chaos---Statistical and Probabilistic Aspects},
  title = {Statistical aspects of neural networks},
  publisher = {Chapman \& Hall},
  address = {London},
  pages = {40--123},
  year = {1993},
  comment = PRNNref,
}

@article{Ripley.94a,
  author = {B. D. Ripley},
  title = {Neural networks and related methods for classification (with discussion)},
  journal = JRSSB,
  volume = {56},
  pages = {409--456},
  year = {1994},
  comment = PRNNref,
}

@inproceedings{Ripley.94b,
  author = {B. D. Ripley},
  editor = {K. V. Mardia},
  booktitle = {Statistics and Images 2},
  title = {Neural networks and flexible regression and discrimination},
  volume = {2},
  publisher = {Carfax},
  address = {Abingdon},
  pages = {39--57},
  year = {1994},
  series = {Advances in Applied Statistics},
  comment = PRNNref,
}

@inproceedings{Ripley.94c,
  author = {B. D. Ripley},
  title = {Flexible non-linear approaches to classification},
  crossref = {Cherkassky.ZZ.94},
  pages = {105--126},
  year = {1994},
  comment = PRNNref,
}

@inproceedings{Ripley.95,
  author = {B. D. Ripley},
  editor = {B. Kappen and S. Gielen},
  booktitle = {Neural Networks: Artificial Intelligence and Industrial Applications},
  title = {Statistical ideas for selecting network architectures},
  publisher = Springer,
  address = {London},
  pages = {183--190},
  year = {1995},
  comment = PRNNref,
}

@article{Ripley.Kelly.77,
  author = {B. D. Ripley and F. P. Kelly},
  title = {{Markov} point processes},
  journal = {Journal of the London Mathematical Society (2)},
  volume = {15},
  pages = {188--192},
  year = {1977},
  comment = PRNNref,
}

@article{Ripley.Kirkland.90,
  author = {B. D. Ripley and M. D. Kirkland},
  title = {Iterative simulation methods},
  journal = {Journal of Computational and Applied Mathematics},
  volume = {31},
  pages = {165--172},
  year = {1990},
  comment = PRNNref,
}

@article{Rissanen.83,
  author = {J. Rissanen},
  title = {A universal prior for integers and estimation by minimum description length},
  journal = AnnStat,
  volume = {11},
  pages = {416--431},
  year = {1983},
  comment = PRNNref,
}

@article{Rissanen.87,
  author = {J. Rissanen},
  title = {Stochastic complexity (with discussion)},
  journal = JRSSB,
  volume = {49},
  pages = {223--239},
  year = {1987},
  comment = PRNNref,
}

@book{Rissanen.89,
  author = {J. Rissanen},
  title = {Stochastic Complexity in Statistical Inquiry},
  publisher = {World Scientific Publishing Co},
  address = {Singapore},
  year = {1989},
  comment = PRNNref,
}

@article{Ritter.ZZ.75,
  author = {G. L. Ritter and H. B. Woodruff and S. R. Lowry and T. L. Isenhour},
  title = {An algorithm for a selective nearest neighbor decision rule},
  journal = IEIT,
  volume = {21},
  pages = {665--669},
  year = {1975},
  note = NNset,
  comment = PRNNref,
}

@book{Ritter.ZZ.92,
  author = {H. Ritter and T. Martinetz and K. Schulten},
  title = {Neural Computation and Self-Organizing Maps. An Introduction},
  publisher = {Addison-Wesley},
  address = {Reading, MA},
  year = {1992},
  comment = PRNNref,
}

@inproceedings{Roberts.Tarassenko.95,
  author = {S. Roberts and L. Tarassenko},
  editor = {A. F. Murray},
  booktitle = {Neural Network Applications},
  title = {Automated sleep {EEG} analysis using an {RBF} network},
  publisher = {Kluwer Academic Publishers},
  address = {Dordrecht},
  pages = {305--322},
  year = {1995},
  comment = PRNNref,
}

@inproceedings{Robinson.77,
  author = {R. W. Robinson},
  editor = {C. H. C. Little},
  booktitle = {Combinatorial Mathematics V},
  title = {Counting unlabeled acyclic digraphs},
  volume = {622},
  publisher = Springer,
  address = {Berlin},
  pages = {28--43},
  year = {1977},
  series = {Lecture Notes in Mathematics},
  comment = PRNNref,
}

@article{Roeder.90,
  author = {K. Roeder},
  title = {Density estimation with confidence sets exemplified by superclusters and
    voids in galaxies},
  journal = JASA,
  volume = {85},
  pages = {617--624},
  year = {1990},
  comment = PRNNref,
}

@article{Roosen.Hastie.94,
  author = {C. B. Roosen and T. J. Hastie},
  title = {Automatic smoothing spline projection pursuit},
  journal = JCGS,
  volume = {3},
  pages = {235--248},
  year = {1994},
  comment = PRNNref,
}

@article{Rose.ZZ.76,
  author  = {D. J. Rose and R. E. Tarjan and G. S. Lueker},
  title   = {Algorithmic aspects of vertex elimination on graphs},
  journal = {SIAM Journal on Computing},
  year    = {1976},
  volume  = {5},
  pages   = {266--283},
  comment = PRNNref,
}

@article{Rosenblatt.56,
  author  = {M. Rosenblatt},
  title   = {Remarks on some nonparametric estimates of a density function},
  journal = AnnMathStat,
  year    = {1956},
  volume  = {27},
  pages   = {832--837},
  comment = PRNNref,
}

@techreport{Rosenblatt.57,
  author      = {F. Rosenblatt},
  title       = {The perceptron---a perceiving and recognizing automaton},
  institution = {Cornell Aeronautical Laboratory},
  year        = {1957},
  type        = {Report},
  number      = {85-460-1},
  comment     = PRNNref,
}

@article{Rosenblatt.58,
  author  = {F. Rosenblatt},
  title   = {The perceptron: {A} probabilistic model for information
             storage and organization in the brain},
  journal = {Psychological Review},
  year    = {1958},
  volume  = {65},
  pages   = {386--408},
  note    = MLset,
  comment = PRNNref,
}

@book{Rosenblatt.62,
  author    = {F. Rosenblatt},
  title     = {Principles of Neurodynamics},
  year      = {1962},
  publisher = {Spartan Books},
  address   = {Washington, DC},
  comment   = PRNNunref,
}

@article{Rounds.80,
  author  = {E. M. Rounds},
  title   = {A combined nonparametric approach to feature selection and
             binary decision tree design},
  journal = PR,
  year    = {1980},
  volume  = {12},
  pages   = {313--317},
  comment = PRNNunref,
}

@book{Rousseeuw.Leroy.87,
  author    = {P. J. Rousseeuw and A. M. Leroy},
  title     = {Robust Regression and Outlier Detection},
  year      = {1987},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Rousseeuw.Zomeren.90,
  author  = {P. J. Rousseeuw and B. C. van Zomeren},
  title   = {Unmasking multivariate outliers and leverage points (with
             discussion)},
  journal = JASA,
  year    = {1990},
  volume  = {85},
  pages   = {633--651},
  comment = PRNNref,
}

@article{Ruck.ZZ.92,
  author  = {D. W. Ruck and S. K. Rogers and M. Kabrisky and
             P. S. Maybeck and M. E. Oxley},
  title   = {Comparative analysis of backpropagation and the extended
             {Kalman} filter for training multilayer perceptrons},
  journal = PAMI,
  year    = {1992},
  volume  = {14},
  pages   = {686--691},
  comment = PRNNref,
}

@article{Ruiz.86,
  author  = {E. V. Ruiz},
  title   = {An algorithm for finding nearest neighbours in
             (approximately) constant average time},
  journal = PRL,
  year    = {1986},
  volume  = {4},
  pages   = {145--158},
  comment = PRNNref,
}

@book{Rumelhart.McClelland.86,
  editor    = {D. E. Rumelhart and J. L. McClelland},
  title     = {Parallel Distributed Processing: Explorations in the
               Microstructure of Cognition. Volume 1. Foundations},
  year      = {1986},
  publisher = {The MIT Press},
  address   = {Cambridge, MA},
  isbn      = {0-262-18120-7},
  comment   = PRNNref,
}

@article{Rumelhart.ZZ.86,
  author  = {D. E. Rumelhart and G. E. Hinton and R. J. Williams},
  title   = {Learning representations by back-propagating errors},
  journal = Nat,
  year    = {1986},
  volume  = {323},
  pages   = {533--536},
  note    = {[Reprinted in \cite{Anderson.Rosenfeld.88}]},
  comment = PRNNref,
}

@book{Russell.Norvig.95,
  author    = {S. J. Russell and P. Norvig},
  title     = {Artificial Intelligence. {A} Modern Approach},
  year      = {1995},
  publisher = {Prentice-Hall},
  address   = {Englewood Cliffs, NJ},
  comment   = PRNNref,
}

% Author surname is Czech: ring accent on the u, carons (hacek) on z and c.
@Article{Ruzicka.93,
  author =       "P. R{\r u}{\v z}i{\v c}ka",
  title =        "On the convergence of learning algorithm for
                 topological maps",
  journal =      "Neural Network World",
  volume =       "4",
  pages =        "413--424",
  year =         "1993",
  comment =      PRNNunref,
}

@inproceedings{Sa.Ballard.93,
  author   = {V. R. de Sa and D. H. Ballard},
  title    = {A note on learning vector quantization},
  crossref = {NIPS5},
  year     = {1993},
  pages    = {220--227},
  comment  = PRNNref,
}

@article{Saarinen.ZZ.93,
  author  = {S. Saarinen and R. Bramley and G. Cybenko},
  title   = {Ill-conditioning in neural network training problems},
  journal = {SIAM Journal on Scientific Computing},
  year    = {1993},
  volume  = {14},
  pages   = {693--714},
  comment = PRNNref,
}

% Each author initial carries its own full stop ("S. R. Safavian").
@Article{Safavian.Landgrebe.91,
  author =       "S. R. Safavian and D. Landgrebe",
  title =        "A survey of decision tree classifier methodology",
  journal =      SMC,
  volume =       "21",
  pages =        "660--674",
  year =         "1991",
  comment =      PRNNref,
}

@inproceedings{Sakurai.93,
  author    = {A. Sakurai},
  title     = {Tighter bounds of the {VC}-dimension of three-layer
               networks},
  booktitle = {Proceedings of the 1993 World Congress on Neural Networks},
  year      = {1993},
  volume    = {3},
  pages     = {540--543},
  publisher = {Erlbaum},
  address   = {Hillsdale, NJ},
  comment   = PRNNunref,
}

@inproceedings{Salomon.91,
  author    = {R. Salomon},
  title     = {Improved convergence rate of back-propagation with dynamic
               adaption of the learning rate},
  booktitle = {Parallel Problem Solving From Nature (Dortmund, 1990)},
  year      = {1991},
  series    = {Lecture Notes in Computer Science},
  volume    = {496},
  pages     = {269--273},
  comment   = PRNNref,
}

@article{Samal.Iyengar.92,
  author  = {A. Samal and P. A. Iyengar},
  title   = {Automatic recognition and analysis of human faces and facial
             expressions: a survey},
  journal = PR,
  year    = {1992},
  volume  = {25},
  pages   = {65--77},
  comment = PRNNref,
}

@article{Sammon.69,
  author  = {Sammon, Jr., J. W.},
  title   = {A non-linear mapping for data structure analysis},
  journal = IEC,
  year    = {1969},
  volume  = {18},
  pages   = {401--409},
  comment = PRNNref,
}

@article{Sanger.89,
  author  = {T. D. Sanger},
  title   = {Optimal unsupervised learning in a single-layer linear
             feedforward network},
  journal = NNks,
  year    = {1989},
  volume  = {2},
  pages   = {459--473},
  comment = PRNNref,
}

@article{Sankar.Mammone.93,
  author  = {A. Sankar and R. J. Mammone},
  title   = {Growing and pruning neural tree networks},
  journal = IEC,
  year    = {1993},
  volume  = {42},
  pages   = {291--299},
  comment = PRNNref,
}

% Personal names in the title are braced as whole words so that
% sentence-casing styles leave them alone and no brace group splits a word.
@Article{Santer.Duffy.86,
  author =       "T. J. Santer and D. E. Duffy",
  title =        "A note on {A.~Albert} and {J.~A.~Anderson}'s
                 conditions for the existence of maximum likelihood
                 estimates in logistic regression models",
  journal =      Bka,
  volume =       "73",
  pages =        "755--758",
  year =         "1986",
  comment =      PRNNref,
}

@book{Schalkoff.92,
  author    = {R. J. Schalkoff},
  title     = {Pattern Recognition: Statistical, Structural and Neural
               Approaches},
  year      = {1992},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@inproceedings{Schlimmer.Fisher.86,
  author    = {J. C. Schlimmer and D. H. Fisher},
  title     = {A case study of incremental concept induction},
  editor    = {Kehler, T. and Rosenschein, S.},
  booktitle = {Proceedings of the Fifth National Conference on Artificial
               Intelligence, Philadelphia},
  year      = {1986},
  volume    = {1},
  pages     = {496--501},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

@article{Schlimmer.Granger.86,
  author  = {J. C. Schlimmer and Granger, Jr., R. H.},
  title   = {Incremental learning from noisy data},
  journal = ML,
  year    = {1986},
  volume  = {1},
  pages   = {317--354},
  comment = PRNNref,
}

@inproceedings{Schmidhuber.89,
  author    = {J. Schmidhuber},
  title     = {Accelerated learning in back-propagation nets},
  booktitle = {Connectionism in Perspective},
  year      = {1989},
  pages     = {439--445},
  publisher = {Elsevier},
  address   = {Amsterdam},
  comment   = PRNNref,
}

% The quoted French title keeps its accents; {Sur} and {Hilbert} are braced
% so that sentence-casing styles do not lowercase them.
@Article{Schoenberg.35,
  author =       "I. J. Schoenberg",
  title =        "Remarks to {Maurice Fr\'echet's} article ``{Sur} la
                 d{\'e}finition axiomatique d'une classe d'espaces
                 distanci{\'e}s vectoriellement applicable sur l'espace de
                 {Hilbert}''",
  journal =      "Annals of Mathematics",
  volume =       "36",
  pages =        "724--732",
  year =         "1935",
  comment =      PRNNunref,
}

% NOTE(review): second author recorded as W. Doster; confirm the initial
% against the journal's table of contents.
@Article{Schuermann.Doster.84,
  author =       "J. Schuermann and W. Doster",
  title =        "A decision-theoretic approach in hierarchical
                 classifier design",
  journal =      PR,
  volume =       "17",
  pages =        "359--369",
  year =         "1984",
  comment =      PRNNref,
}

@article{Schwarz.78,
  author  = {G. Schwarz},
  title   = {Estimating the dimension of a model},
  journal = AnnStat,
  year    = {1978},
  volume  = {6},
  pages   = {461--464},
  comment = PRNNref,
}

@article{Schwemer.Dunn.80,
  author  = {G. T. Schwemer and O. J. Dunn},
  title   = {Posterior probability estimators in classification
             simulations},
  journal = {Communications in Statistics---Simulation and Computation},
  year    = {1980},
  volume  = {B9},
  pages   = {133--140},
  comment = PRNNref,
}

@book{Scott.92,
  author    = {D. W. Scott},
  title     = {Multivariate Density Estimation. Theory, Practice and
               Visualization},
  year      = {1992},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@article{Scott.Symons.71,
  author  = {A. J. Scott and M. J. Symons},
  title   = {Clustering methods based on likelihood ratio criteria},
  journal = Biom,
  year    = {1971},
  volume  = {27},
  pages   = {387--397},
  comment = PRNNref,
}

@article{Scott.Wild.86,
  author  = {A. J. Scott and C. J. Wild},
  title   = {Fitting logistic models under case-control or choice based
             sampling},
  journal = JRSSB,
  year    = {1986},
  volume  = {48},
  pages   = {170--182},
  comment = PRNNref,
}

@book{Seber.Wild.89,
  author    = {G. A. F. Seber and C. J. Wild},
  title     = {Nonlinear Regression},
  year      = {1989},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

% Volume IT-8 (1962); the article's pages carry an "S" prefix (S82--S91).
% NOTE(review): confirm volume and pages against the journal index.
@Article{Sebestyen.62,
  author =       "G. S. Sebestyen",
  title =        "Pattern recognition by an adaptive process of sample
                 set construction",
  journal =      IEIT,
  volume =       "8",
  pages =        "S82--S91",
  year =         "1962",
  comment =      PRNNref,
}

@book{Sedgewick.90,
  author    = {R. Sedgewick},
  title     = {Algorithms in {C}},
  year      = {1990},
  publisher = {Addison-Wesley},
  address   = {Reading, MA},
  comment   = PRNNref,
}

@book{Sen.Srivastava.90,
  author    = {A. Sen and M. Srivastava},
  title     = {Regression Analysis. Theory, Methods and Applications},
  year      = {1990},
  publisher = Springer,
  address   = {New York},
  comment   = PRNNref,
}

@article{Sethi.90,
  author  = {I. K. Sethi},
  title   = {Entropy nets: from decision trees to neural networks},
  journal = PIEEE,
  year    = {1990},
  volume  = {78},
  pages   = {1605--1613},
  note    = rep-Lau,
  comment = PRNNref,
}

@inproceedings{Sethi.91,
  author   = {I. K. Sethi},
  title    = {Decision tree performance enhancement using an artificial
              neural network implementation},
  crossref = {Sethi.Jain.91},
  year     = {1991},
  pages    = {71--88},
  comment  = PRNNref,
}

@article{Sethi.Sarvarayudu.82,
  author  = {I. K. Sethi and G. P. R. Sarvarayudu},
  title   = {Hierarchical classifier design using mutual information},
  journal = PAMI,
  year    = {1982},
  volume  = {4},
  pages   = {441--445},
  comment = PRNNref,
}

@inproceedings{Shachter.Peot.90,
  author    = {R. D. Shachter and M. A. Peot},
  title     = {Simulation approaches to general probabilistic inference on
               belief networks},
  editor    = {M. Henrion and R. D. Shachter and L. N. Kanal and
               J. F. Lemmer},
  booktitle = {Uncertainty in Artificial Intelligence 5},
  year      = {1990},
  pages     = {221--231},
  publisher = {North-Holland},
  address   = {Amsterdam},
  comment   = PRNNunref,
}

@book{Shafer.96,
  author    = {Glenn Shafer},
  title     = {Probabilistic Expert Systems},
  year      = {1996},
  series    = {CBMS-NSF Regional Conference Series in Applied Mathematics},
  number    = {67},
  publisher = {SIAM},
  address   = {Philadelphia, PA},
  isbn      = {0-89871-373-0},
  comment   = PRNNref,
}

@book{Shafer.Pearl.90,
  editor    = {G. Shafer and J. Pearl},
  title     = {Readings in Uncertainty Reasoning},
  year      = {1990},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

@article{Shafer.Shenoy.86,
  author  = {G. Shafer and P. P. Shenoy},
  title   = {Propagating belief functions with local computations},
  journal = {IEEE Expert},
  year    = {1986},
  volume  = {1},
  number  = {3},
  pages   = {43--52},
  comment = PRNNunref,
}

@inproceedings{Shanno.90,
  author    = {D. F. Shanno},
  title     = {Recent advances in numerical techniques for large-scale
               optimization},
  editor    = {W. T. {Miller III} and R. S. Sutton and P. J. Werbos},
  booktitle = {Neural Networks for Control},
  year      = {1990},
  pages     = {171--178},
  publisher = {The MIT Press},
  address   = {Cambridge, MA},
  isbn      = {0-262-13261-3},
  comment   = PRNNref,
}

@article{Shanno.Phua.80,
  author  = {D. F. Shanno and K. H. Phua},
  title   = {Remark on ``{Algorithm 500}: Minimization of unconstrained
             multivariable functions''},
  journal = TOMS,
  year    = {1980},
  volume  = {6},
  pages   = {618--622},
  comment = PRNNunref,
}

@book{Shavlik.Dietterich.90,
  editor    = {J. W. Shavlik and T. G. Dietterich},
  title     = {Readings in Machine Learning},
  year      = {1990},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

@article{Shawe-Taylor.Anthony.91,
  author  = {J. Shawe-Taylor and M. Anthony},
  title   = {Sample sizes for multiple-output threshold networks},
  journal = {Network},
  year    = {1991},
  volume  = {2},
  pages   = {107--117},
  comment = PRNNref,
}

@article{Sheehan.Thomas.93,
  author  = {N. Sheehan and A. Thomas},
  title   = {On the irreducibility of a {Markov} chain defined on a space
             of genotype configurations by a sampling scheme},
  journal = Biom,
  year    = {1993},
  volume  = {49},
  pages   = {163--175},
  comment = PRNNref,
}

@article{Shenoy.89,
  author  = {P. P. Shenoy},
  title   = {A valuation-based language for expert systems},
  journal = {International Journal of Approximate Reasoning},
  year    = {1989},
  volume  = {3},
  pages   = {383--411},
  comment = PRNNunref,
}

@inproceedings{Shenoy.Shafer.90,
  author    = {P. P. Shenoy and G. Shafer},
  title     = {Axioms of probability and belief-function propagation},
  editor    = {R. D. Shachter and T. S. Levitt and L. N. Kanal and
               J. F. Lemmer},
  booktitle = {Uncertainty in Artificial Intelligence 4},
  year      = {1990},
  pages     = {169--198},
  publisher = {North-Holland},
  address   = {Amsterdam},
  note      = URset,
  comment   = PRNNref,
}

@inproceedings{Shenoy.ZZ.88,
  author    = {P. P. Shenoy and G. Shafer and K. Mellouli},
  title     = {Propagation of belief functions: a distributed approach},
  editor    = {J. F. Lemmer and L. N. Kanal},
  booktitle = {Uncertainty in Artificial Intelligence 2},
  year      = {1988},
  pages     = {325--335},
  publisher = {North-Holland},
  address   = {Amsterdam},
  comment   = PRNNref,
}

@inproceedings{Shepanski.87,
  author    = {J. F. Shepanski},
  title     = {Fast learning in artificial neural systems: multilayer
               perceptron training using optimal estimation},
  editor    = {M. Caudill and C. Butler},
  booktitle = {Proceedings of IEEE First International Conference on
               Neural Networks, San Diego, 1987},
  year      = {1987},
  volume    = {I},
  pages     = {465--472},
  publisher = {IEEE Press},
  address   = {Long Beach, CA},
  comment   = PRNNref,
}

@article{Shepard.62a,
  author  = {R. N. Shepard},
  title   = {The analysis of proximities: multidimensional scaling with an
             unknown distance function {I}},
  journal = PSym,
  year    = {1962},
  volume  = {27},
  pages   = {125--139},
  comment = PRNNunref,
}

@article{Shepard.62b,
  author  = {R. N. Shepard},
  title   = {The analysis of proximities: multidimensional scaling with an
             unknown distance function {II}},
  journal = PSym,
  year    = {1962},
  volume  = {27},
  pages   = {219--246},
  comment = PRNNunref,
}

@article{Shibata.76,
  author  = {R. Shibata},
  title   = {Selection of the order of an auto\-regressive model by
             {Akaike}'s Information Criterion},
  journal = Bka,
  year    = {1976},
  volume  = {63},
  pages   = {117--126},
  comment = PRNNref,
}

@article{Shibata.80,
  author  = {R. Shibata},
  title   = {Asymptotically efficient selection of the order of the model
             for estimating parameters of a linear process},
  journal = AnnStat,
  year    = {1980},
  volume  = {8},
  pages   = {147--164},
  comment = PRNNref,
}

@article{Shibata.81,
  author  = {R. Shibata},
  title   = {An optimal selection of regression variables},
  journal = Bka,
  year    = {1981},
  volume  = {68},
  pages   = {45--54},
  comment = PRNNref,
}

@inproceedings{Short.Fukunaga.80,
  author    = {R. D. Short and K. Fukunaga},
  title     = {A new nearest neighbor distance measure},
  booktitle = {Proceedings of the Fifth IEEE International Conference on
               Pattern Recognition (Miami Beach, 1980)},
  year      = {1980},
  pages     = {81--86},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA},
  comment   = PRNNunref,
}

@article{Short.Fukunaga.81,
  author  = {R. D. Short and K. Fukunaga},
  title   = {The optimal distance measure for nearest neighbor
             classification},
  journal = IEIT,
  year    = {1981},
  volume  = {27},
  pages   = {622--627},
  note    = NNset,
  comment = PRNNref,
}

@article{Sietsma.Dow.91,
  author  = {J. Sietsma and R. J. F. Dow},
  title   = {Creating artificial neural networks that generalize},
  journal = NNks,
  year    = {1991},
  volume  = {4},
  pages   = {67--79},
  comment = PRNNref,
}

@inproceedings{Silva.Almeida.90,
  author    = {F. M. Silva and L. B. Almeida},
  title     = {Speeding up back-propagation},
  editor    = {R. Eckmiller},
  booktitle = {Advanced Neural Computers},
  year      = {1990},
  pages     = {151--158},
  publisher = {Elsevier},
  address   = {Amsterdam},
  comment   = PRNNref,
}

@article{Silvapulle.Burridge.86,
  author  = {M. J. Silvapulle and J. Burridge},
  title   = {Existence of maximum likelihood estimates in regression
             models for grouped and ungrouped data},
  journal = JRSSB,
  year    = {1986},
  volume  = {48},
  pages   = {100--106},
  comment = PRNNref,
}

@article{Silverman.85,
  author  = {B. W. Silverman},
  title   = {Some aspects of the spline smoothing approach to
             non-parametric regression curve fitting (with discussion)},
  journal = JRSSB,
  year    = {1985},
  volume  = {47},
  pages   = {1--52},
  comment = PRNNref,
}

@book{Silverman.86,
  author    = {B. W. Silverman},
  title     = {Density Estimation for Statistics and Data Analysis},
  year      = {1986},
  publisher = {Chapman \& Hall},
  address   = {London},
  comment   = PRNNref,
}

@article{Silverman.Jones.89,
  author  = {B. W. Silverman and M. C. Jones},
  title   = {{E. Fix} and {J. L. Hodges} (1951): An important contribution
             to nonparametric discriminant analysis and density
             estimation},
  journal = ISR,
  year    = {1989},
  volume  = {57},
  pages   = {233--247},
  comment = PRNNref,
}

@inproceedings{Simard.ZZ.93,
  author   = {P. Simard and Y. {Le Cun} and J. Denker},
  title    = {Efficient pattern recognition using a new transformation
              distance},
  crossref = {NIPS5},
  year     = {1993},
  pages    = {50--58},
  comment  = PRNNref,
}

@book{Simmons.63,
  author    = {G. F. Simmons},
  title     = {Introduction to Topology and Modern Analysis},
  year      = {1963},
  publisher = {McGraw-Hill},
  address   = {New York},
  comment   = PRNNref,
}

@inproceedings{Singer.Tishby.94,
  author   = {Y. Singer and N. Tishby},
  title    = {Decoding cursive scripts},
  crossref = {NIPS6},
  year     = {1994},
  pages    = {833--840},
  comment  = PRNNref,
}

@inproceedings{Singhal.Wu.89,
  author   = {S. Singhal and L. Wu},
  title    = {Training multilayer perceptrons with the extended {Kalman}
              filter},
  crossref = {NIPS1},
  year     = {1989},
  pages    = {133--140},
  comment  = PRNNref,
}

@article{Smith.47,
  author  = {C. A. B. Smith},
  title   = {Some examples of discrimination},
  journal = {Annals of Eugenics},
  year    = {1947},
  volume  = {13},
  pages   = {272--282},
  comment = PRNNunref,
}

@article{Smith.68,
  author  = {F. W. Smith},
  title   = {Pattern classifier design by linear programming},
  journal = IEC,
  year    = {1968},
  volume  = {17},
  pages   = {367--372},
  comment = PRNNref,
}

@article{Smith.69,
  author  = {F. W. Smith},
  title   = {Design of multicategory pattern classifiers with two-category
             classifier design procedures},
  journal = IEC,
  year    = {1969},
  volume  = {18},
  pages   = {548--551},
  comment = PRNNref,
}

@article{Smith.89,
  author  = {J. Q. Smith},
  title   = {Influence diagrams for statistical modelling},
  journal = AnnStat,
  year    = {1989},
  volume  = {17},
  pages   = {654--672},
  comment = PRNNref,
}

@article{Smith.91,
  author  = {A. F. M. Smith},
  title   = {Discussion of `{Posterior} {Bayes} factors'},
  journal = JRSSB,
  year    = {1991},
  volume  = {53},
  pages   = {132--133},
  comment = PRNNref,
}

@book{Smith.Medin.81,
  author    = {E. E. Smith and D. L. Medin},
  title     = {Categories and Concepts},
  year      = {1981},
  publisher = {Harvard University Press},
  address   = {Cambridge, MA},
  comment   = PRNNunref,
}

@article{Smith.Roberts.93,
  author  = {A. F. M. Smith and G. O. Roberts},
  title   = {{Bayesian} computation via the {Gibbs} sampler and related
             {Markov} chain {Monte Carlo} methods (with discussion)},
  journal = JRSSB,
  year    = {1993},
  volume  = {55},
  pages   = {3--23},
  comment = PRNNref,
}

@article{Smith.Spiegelhalter.80,
  author  = {A. F. M. Smith and D. J. Spiegelhalter},
  title   = {{Bayes} factors and choice criteria for linear models},
  journal = JRSSB,
  year    = {1980},
  volume  = {42},
  pages   = {213--220},
  comment = PRNNref,
}

@inproceedings{Smith.ZZ.88,
  author    = {J. W. Smith and J. E. Everhart and W. C. Dickson and
               W. C. Knowler and R. S. Johannes},
  title     = {Using the {ADAP} learning algorithm to forecast the onset
               of diabetes mellitus},
  editor    = {R. A. Greenes},
  booktitle = {Proceedings of the Symposium on Computer Applications in
               Medical Care (Washington, 1988)},
  year      = {1988},
  pages     = {261--265},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA},
  comment   = PRNNref,
}

@article{Solla.ZZ.88,
  author  = {S. A. Solla and E. Levin and M. Fleisher},
  title   = {Accelerated learning in layered neural networks},
  journal = ComSys,
  year    = {1988},
  volume  = {2},
  pages   = {625--639},
  comment = PRNNref,
}

@article{Sontag.92,
  author  = {E. D. Sontag},
  title   = {Feedback stabilization using two-hidden-layer nets},
  journal = TNN,
  year    = {1992},
  volume  = {3},
  pages   = {981--990},
  comment = PRNNref,
}

@inproceedings{Spackman.92,
  author    = {K. A. Spackman},
  title     = {Maximum likelihood training of connectionist models:
               comparison with least-squares back propagation and logistic
               regression},
  editor    = {P. D. Clayton},
  booktitle = {Proceedings of the Fifteenth Annual Symposium on Computer
               Applications in Medical Care, Washington 1991},
  year      = {1992},
  pages     = {285--289},
  publisher = {McGraw-Hill},
  address   = {New York},
  comment   = PRNNref,
}

@book{Spath.85,
  author    = {H. Sp{\"a}th},
  title     = {Cluster Dissection and Analysis. Theory, {FORTRAN}
               programs, examples},
  year      = {1985},
  publisher = {Ellis Horwood},
  address   = {Chichester},
  comment   = PRNNref,
}

@article{Specht.67a,
  author  = {D. F. Specht},
  title   = {Vectorcardiographic diagnosis using the polynomial
             discriminant method of pattern recognition},
  journal = {IEEE Transactions on Bio-medical Engineering},
  year    = {1967},
  volume  = {14},
  pages   = {90--95},
  comment = PRNNref,
}

@article{Specht.67b,
  author  = {D. F. Specht},
  title   = {Generation of polynomial discriminant functions for pattern
             recognition},
  journal = IEEC,
  year    = {1967},
  volume  = {16},
  pages   = {308--319},
  comment = PRNNref,
}

@article{Specht.90a,
  author  = {D. F. Specht},
  title   = {Probabilistic neural networks},
  journal = NNks,
  year    = {1990},
  volume  = {3},
  pages   = {109--118},
  comment = PRNNref,
}

% "Adaline" is a proper name, so it is braced to survive sentence-casing
% bibliography styles.
@Article{Specht.90b,
  author =       "D. F. Specht",
  title =        "Probabilistic neural networks and the polynomial
                 {Adaline} as complementary techniques for
                 classification",
  journal =      TNN,
  volume =       "1",
  pages =        "111--121",
  year =         "1990",
  comment =      PRNNref,
}

@article{Specht.91,
  author  = {D. F. Specht},
  title   = {A general regression neural network},
  journal = TNN,
  year    = {1991},
  volume  = {2},
  pages   = {568--576},
  comment = PRNNref,
}

@inproceedings{Speed.90,
  author   = {T. Speed},
  title    = {Complexity, calibration and causality in influence diagrams},
  crossref = {Oliver.Smith.90},
  year     = {1990},
  pages    = {49--63},
  comment  = PRNNref,
}

@inproceedings{Spiegelhalter.90,
  author   = {D. J. Spiegelhalter},
  title    = {Fast algorithms for probabilistic reasoning in influence
              diagrams, with applications in genetics and expert systems},
  crossref = {Oliver.Smith.90},
  year     = {1990},
  pages    = {361--384},
  comment  = PRNNref,
}

@article{Spiegelhalter.Lauritzen.90,
  author  = {D. J. Spiegelhalter and S. L. Lauritzen},
  title   = {Sequential updating of conditional probabilities on directed
             graphical structures},
  journal = Nks,
  year    = {1990},
  volume  = {20},
  pages   = {579--605},
  comment = PRNNref,
}

@article{Spiegelhalter.Smith.82,
  author  = {D. J. Spiegelhalter and A. F. M. Smith},
  title   = {{Bayes} factors for linear and log-linear models with vague
             prior information},
  journal = JRSSB,
  year    = {1982},
  volume  = {44},
  pages   = {377--387},
  comment = PRNNref,
}

@article{Spiegelhalter.ZZ.93,
  author  = {D. J. Spiegelhalter and A. P. Dawid and S. L. Lauritzen and
             R. G. Cowell},
  title   = {{Bayesian} analysis in expert systems (with discussion)},
  journal = StatSci,
  year    = {1993},
  volume  = {8},
  pages   = {219--283},
  comment = PRNNref,
}

@book{Spirtes.ZZ.93,
  author    = {P. Spirtes and C. Glymour and R. Scheines},
  title     = {Causality, Prediction, and Search},
  year      = {1993},
  series    = {Lecture Notes in Statistics},
  volume    = {81},
  publisher = Springer,
  address   = {New York},
  comment   = PRNNref,
}

@article{Srihari.92,
  author  = {S. N. Srihari},
  title   = {High-performance reading machines},
  journal = PIEEE,
  year    = {1992},
  volume  = {80},
  pages   = {1120--1132},
  comment = PRNNref,
}

% The first author's surname is Srinivas.  The citation key deliberately
% keeps its historical spelling so that existing \cite commands still resolve.
@InProceedings{Srinvas.Breese.90,
  author =       "S. Srinivas and J. Breese",
  editor =       "L. N. Kanal and J. Lemmer and T. S. Levitt",
  booktitle =    "Uncertainty in Artificial Intelligence 6",
  title =        "{IDEAL}: a software package for the analysis of
                 influence diagrams",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  pages =        "212--219",
  year =         "1990",
  comment =      PRNNunref,
}

@book{Stace.91,
  author    = {C. Stace},
  title     = {New Flora of the British Isles},
  year      = {1991},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  comment   = PRNNref,
}

@Article{Stanfill.Waltz.86,
  author =       "C. Stanfill and D. Waltz",
  title =        "Toward memory-based reasoning",
  journal =      "Communications of the Association for Computing
                 Machinery",
  volume =       "29",
  pages =        "1213--1228",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Stewart.87,
  author =       "L. Stewart",
  title =        "Hierarchical {Bayesian} analysis using {Monte Carlo}
                 integration: computing posterior distributions when
                 there are many possible models",
  journal =      "The Statistician",
  volume =       "36",
  pages =        "211--219",
  year =         "1987",
  comment =      PRNNref,
}

@InProceedings{Stinchcombe.White.89,
  author =       "M. Stinchcombe and H. White",
  booktitle =    "Proceedings of the International Joint Conference on
                 Neural Networks (Washington, 1989)",
  title =        "Universal approximation using feedforward networks
                 with non-sigmoid hidden layer activation functions",
  volume =       "I",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "613--617",
  year =         "1989",
  comment =      PRNNref,
}

@InProceedings{Stinchcombe.White.90,
  author =       "M. Stinchcombe and H. White",
  booktitle =    "Proceedings of the International Joint Conference on
                 Neural Networks, San Diego",
  title =        "Approximating and learning unknown mappings using
                 multilayer feedforward networks with bounded weights",
  volume =       "III",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "7--16",
  year =         "1990",
  comment =      PRNNunref,
}

@Article{Stone.74,
  author =       "M. Stone",
  title =        "Cross-validatory choice and assessment of statistical
                 predictions (with discussion)",
  journal =      JRSSB,
  volume =       "36",
  pages =        "111--147",
  year =         "1974",
  comment =      PRNNref,
}

@Article{Stone.77,
  author =       "C. J. Stone",
  title =        "Consistent nonparametric regression (with
                 discussion)",
  journal =      AnnStat,
  volume =       "5",
  pages =        "595--645",
  year =         "1977",
  comment =      PRNNref,
}

@Article{Stone.77a,
  author =       "M. Stone",
  title =        "Asymptotics for and against cross-validation",
  journal =      Bka,
  volume =       "64",
  pages =        "29--35",
  year =         "1977",
  comment =      PRNNref,
}

@Article{Stone.77b,
  author =       "M. Stone",
  title =        "An asymptotic equivalence of choice of model by
                 cross-validation and {Akaike's} criterion",
  journal =      JRSSB,
  volume =       "39",
  pages =        "44--47",
  year =         "1977",
  comment =      PRNNref,
}

@Article{Stone.79,
  author =       "M. Stone",
  title =        "Comments on model selection criteria of {Akaike} and
                 {Schwarz}",
  journal =      JRSSB,
  volume =       "41",
  pages =        "276--278",
  year =         "1979",
  comment =      PRNNref,
}

@Article{Stone.85,
  author =       "C. J. Stone",
  title =        "Additive regression and other nonparametric models",
  journal =      AnnStat,
  volume =       "13",
  pages =        "689--705",
  year =         "1985",
  comment =      PRNNref,
}

@Article{Stone.86,
  author =       "C. J. Stone",
  title =        "The dimensionality reduction principle for generalized
                 additive models",
  journal =      AnnStat,
  volume =       "14",
  pages =        "590--606",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Streit.Luginbuhl.94,
  author =       "R. L. Streit and T. E. Luginbuhl",
  title =        "Maximum likelihood training of probabilistic neural
                 networks",
  journal =      TNN,
  volume =       "5",
  pages =        "764--783",
  year =         "1994",
  comment =      PRNNref,
}

@InProceedings{Stromberg.ZZ.91,
  author =       "J. E. Str{\"o}mberg and J. Zrida and A. Isaksson",
  booktitle =    "IEEE International Conference on Acoustics, Speech and
                 Signal Processing (Toronto, 1991)",
  title =        "Neural trees---using neural nets in a tree classifier
                 structure",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "137--140",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Styblinski.Tang.90,
  author =       "M. A. Styblinski and T.-S. Tang",
  title =        "Experiments in nonconvex optimization: stochastic
                 approximation and simulated annealing",
  journal =      NNks,
  volume =       "3",
  pages =        "467--483",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Suen.ZZ.92,
  author =       "C. Y. Suen and C. Nadal and R. Legault and T. A. Mai
                 and L. Lam",
  title =        "Computer recognition of unconstrained handwritten
                 numerals",
  journal =      PIEEE,
  volume =       "80",
  pages =        "1162--1180",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Suen.ZZ.93,
  author =       "C. Y. Suen and R. Legault and C. Nadal and M. Cheriet
                 and L. Lam",
  title =        "Building a new generation of handwriting recognition
                 systems",
  journal =      PRL,
  volume =       "14",
  pages =        "303--315",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Sussmann.92,
  author =       "H. J. Sussmann",
  title =        "Uniqueness of the weights for minimal feedforward nets
                 with a given input--output map",
  journal =      NNks,
  volume =       "5",
  pages =        "589--593",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Swain.Hauska.77,
  author =       "P. H. Swain and H. Hauska",
  title =        "The decision tree classifier: design and potential",
  journal =      "IEEE Transactions on Geoscience Electronics",
  volume =       "15",
  pages =        "142--147",
  year =         "1977",
  comment =      PRNNref,
}

@InProceedings{Swayne.ZZ.91,
  author =       "D. F. Swayne and D. Cook and A. Buja",
  booktitle =    "Proceedings of the ASA Section on Statistical
                 Graphics",
  title =        "{XGobi}: interactive dynamic graphics in the {X}
                 window system with a link to {S}",
  publisher =    "American Statistical Association",
  address =      "Alexandria, VA",
  pages =        "1--8",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Swonger.72,
  author =       "C. W. Swonger",
  editor =       "S. Watanabe",
  booktitle =    "Frontiers of Pattern Recognition",
  title =        "Sample set condensation for a condensed nearest
                 neighbor decision rule for pattern recognition",
  publisher =    "Academic Press",
  address =      "Orlando",
  pages =        "511--519",
  year =         "1972",
  comment =      PRNNunref,
}

@InProceedings{Tarassenko.ZZ.95,
  author =       "L. Tarassenko and P. Hayton and N. Cerneaz and M.
                 Brady",
  booktitle =    "Proceedings of the Fourth International IEE Conference
                 on Artificial Neural Networks (Cambridge, 1995)",
  title =        "Novelty detection for the identification of masses in
                 mammograms",
  year =         "1995",
  pages =        "442--447",
  volume =       "409",
  publisher =    "IEE",
  series =       "IEE Conference Publication",
  comment =      PRNNref,
}

@Article{Tarjan.Yannakakis.84,
  author =       "R. E. Tarjan and M. Yannakakis",
  title =        "Simple linear-time algorithms to test chordality of
                 graphs, test acyclicity of hypergraphs, and selectively
                 reduce acyclic hypergraphs",
  journal =      "SIAM Journal on Computing",
  volume =       "13",
  pages =        "566--579",
  year =         "1984",
  comment =      PRNNref,
}

@Book{Tarter.Lock.93,
  author =       "M. E. Tarter and M. D. Lock",
  title =        "Model-Free Curve Estimation",
  publisher =    "Chapman \& Hall",
  address =      "New York",
  year =         "1993",
  comment =      PRNNunref,
}

@Book{Therrien.89,
  author =       "C. W. Therrien",
  title =        "Decision, Estimation, and Classification: An
                 Introduction to Pattern Recognition and Related
                 Topics",
  publisher =    Wiley,
  address =      "New York",
  year =         "1989",
  comment =      PRNNref,
}

@Book{Thisted.88,
  author =       "R. A. Thisted",
  title =        "Elements of Statistical Computing. Numerical
                 Computation",
  publisher =    "Chapman \& Hall",
  address =      "New York",
  year =         "1988",
  comment =      PRNNref,
}

@Book{Thompson.85,
  author =       "E. A. Thompson",
  title =        "Pedigree Analysis in Human Genetics",
  publisher =    "Johns Hopkins University Press",
  address =      "Baltimore, MD",
  year =         "1985",
  comment =      PRNNunref,
}

@Book{Thornton.92,
  author =       "C. J. Thornton",
  title =        "Techniques in Computational Learning. An
                 Introduction",
  publisher =    "Chapman \& Hall",
  address =      "London",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Tibshirani.92,
  author =       "R. Tibshirani",
  title =        "Principal curves revisited",
  journal =      StatComp,
  volume =       "2",
  pages =        "183--190",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Tierney.94,
  author =       "L. Tierney",
  title =        "{Markov} chains for exploring posterior distributions
                 (with discussion)",
  journal =      AnnStat,
  volume =       "22",
  pages =        "1701--1762",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Tierney.Kadane.86,
  author =       "L. Tierney and J. B. Kadane",
  title =        "Accurate approximations for posterior moments and
                 marginal densities",
  journal =      JASA,
  volume =       "81",
  pages =        "82--86",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Titterington.76,
  author =       "D. M. Titterington",
  title =        "Updating a diagnostic system using unconfirmed cases",
  journal =      ApplStat,
  volume =       "25",
  pages =        "238--247",
  year =         "1976",
  comment =      PRNNref,
}

@Article{Titterington.80,
  author =       "D. M. Titterington",
  title =        "A comparative study of kernel-based density estimates
                 for categorical data",
  journal =      Techno,
  volume =       "22",
  pages =        "259--268",
  year =         "1980",
  comment =      PRNNref,
}

@Article{Titterington.84,
  author =       "D. M. Titterington",
  title =        "Recursive parameter estimation using incomplete data",
  journal =      JRSSB,
  volume =       "46",
  pages =        "257--267",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Titterington.ZZ.81,
  author =       "D. M. Titterington and G. D. Murray and L. S. Murray
                 and D. J. Spiegelhalter and A. M. Skene and J. D. F.
                 Habbema and G. J. Gelpke",
  title =        "Comparison of discrimination techniques applied to a
                 complex data set of head injured patients (with
                 discussion)",
  journal =      JRSSA,
  volume =       "144",
  pages =        "145--174",
  year =         "1981",
  comment =      PRNNref,
}

@Book{Titterington.ZZ.85,
  author =       "D. M. Titterington and A. F. M. Smith and U. E.
                 Makov",
  title =        "Statistical Analysis of Finite Mixture Distributions",
  publisher =    Wiley,
  address =      "Chichester",
  year =         "1985",
  comment =      PRNNref,
}

@InProceedings{Todd.95,
  author =       "B. S. Todd",
  title =        "Weighted inference rules and {Bayesian} belief
                 networks",
  crossref =     "Gammerman.95",
  pages =        "205--225",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Tollenaere.90,
  author =       "T. Tollenaere",
  title =        "{SuperSAB}: fast adaptive back propagation with good
                 scaling properties",
  journal =      NNks,
  volume =       "3",
  pages =        "561--573",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Tomek.76a,
  author =       "I. Tomek",
  title =        "A generalization of the $k$-{NN} rule",
  journal =      SMC,
  volume =       "6",
  pages =        "121--126",
  year =         "1976",
  note =         NNset,
  comment =      PRNNref,
}

@Article{Tomek.76b,
  author =       "I. Tomek",
  title =        "An experiment with the edited nearest-neighbor rule",
  journal =      SMC,
  volume =       "6",
  pages =        "448--452",
  year =         "1976",
  note =         NNset,
  comment =      PRNNref,
}

@Article{Tomek.76c,
  author =       "I. Tomek",
  title =        "Two modifications of {CNN}",
  journal =      SMC,
  volume =       "6",
  pages =        "769--772",
  year =         "1976",
  comment =      PRNNref,
}

@Article{Torgerson.52,
  author =       "W. S. Torgerson",
  title =        "Multidimensional scaling {I}. {Theory} and method",
  journal =      PSym,
  volume =       "17",
  pages =        "401--419",
  year =         "1952",
  comment =      PRNNunref,
}

@Book{Torgerson.58,
  author =       "W. S. Torgerson",
  title =        "Theory and Methods of Scaling",
  publisher =    Wiley,
  address =      "New York",
  year =         "1958",
  comment =      PRNNunref,
}

@Article{Traaven.91,
  author =       "H. G. C. Tr{\aa}v{\'e}n",
  title =        "A neural network approach to statistical pattern
                 classification by ``semiparametric'' estimation of
                 probability density functions",
  journal =      TNN,
  volume =       "2",
  pages =        "366--377",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Tsypkin.66,
  author =       "Ya. Z. Tsypkin",
  title =        "Use of the stochastic approximation method in
                 estimating unknown distribution densities from
                 observations",
  journal =      AuRC,
  volume =       "27",
  pages =        "432--434",
  year =         "1966",
  comment =      PRNNunref,
}

@Article{Tutz.86,
  author =       "G. Tutz",
  title =        "An alternative choice of smoothing for kernel-based
                 density estimates in discrete discriminant analysis",
  journal =      Bka,
  volume =       "73",
  pages =        "405--411",
  year =         "1986",
  comment =      PRNNref,
}

@Article{Tutz.88,
  author =       "G. Tutz",
  title =        "Smoothing for discrete kernels in discrimination",
  journal =      "Biometrical Journal",
  volume =       "30",
  pages =        "729--739",
  year =         "1988",
  comment =      PRNNref,
}

@Article{Tutz.89,
  author =       "G. Tutz",
  title =        "On cross-validation for discrete kernel estimates in
                 discrimination",
  journal =      CSTM,
  volume =       "18",
  pages =        "4145--4162",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Ullmann.74,
  author =       "J. R. Ullmann",
  title =        "Automatic selection of reference data for use in a
                 nearest-neighbor method of pattern classification",
  journal =      IEIT,
  volume =       "20",
  pages =        "541--543",
  year =         "1974",
  comment =      PRNNref,
}

@InProceedings{Ultsch.93a,
  author =       "A. Ultsch",
  editor =       "O. Opitz and B. Lausen and R. Klar",
  booktitle =    "Information and Classification",
  title =        "Knowledge extraction from self-organizing neural
                 networks",
  publisher =    Springer,
  address =      "Berlin",
  pages =        "301--306",
  year =         "1993",
  comment =      PRNNunref,
}

@InProceedings{Ultsch.93b,
  author =       "A. Ultsch",
  editor =       "O. Opitz and B. Lausen and R. Klar",
  booktitle =    "Information and Classification",
  title =        "Self-organizing neural networks for visualization and
                 classification",
  publisher =    Springer,
  address =      "Berlin",
  pages =        "307--313",
  year =         "1993",
  comment =      PRNNunref,
}

@Article{Upton.91,
  author =       "G. J. G. Upton",
  title =        "The exploratory analysis of survey data using
                 log-linear models",
  journal =      "The Statistician",
  volume =       "40",
  pages =        "169--182",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Usui.ZZ.91,
  author =       "S. Usui and S. Nakauchi and M. Nakano",
  editor =       "T. Kohonen and K. M{\"a}kisara and O. Simula and J.
                 Kangas",
  booktitle =    "Artificial Neural Networks. Proceedings of ICANN-91",
  title =        "Internal color representation acquired by a five-layer
                 neural network",
  volume =       "I",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  pages =        "867--872",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Utgoff.88a,
  author =       "P. E. Utgoff",
  editor =       "J. Laird",
  booktitle =    "Proceedings of the Fifth International Conference on
                 Machine Learning",
  title =        "{ID5}: an incremental {ID3}",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "107--120",
  year =         "1988",
  comment =      PRNNunref,
}

@InProceedings{Utgoff.88b,
  author =       "P. E. Utgoff",
  editor =       "R. G. Smith and T. M. Mitchell",
  booktitle =    "Proceedings of the Seventh AAAI National Conference on
                 Artificial Intelligence, St Paul",
  title =        "Perceptron trees: a case study in hybrid concept
                 representations",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "601--606",
  year =         "1988",
  comment =      PRNNref,
}

@InProceedings{Utgoff.89,
  author =       "P. E. Utgoff",
  editor =       "A. M. Segre",
  booktitle =    "Proceedings of the Sixth International Workshop on
                 Machine Learning (Ithaca, 1989)",
  title =        "Improved training via incremental learning",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "362--365",
  year =         "1989",
  comment =      PRNNref,
}

@Article{Utgoff.90,
  author =       "P. E. Utgoff",
  title =        "Incremental induction of decision trees",
  journal =      ML,
  volume =       "4",
  pages =        "161--186",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Utgoff.Brodley.90,
  author =       "P. E. Utgoff and C. E. Brodley",
  editor =       "B. W. Porter and R. J. Mooney",
  booktitle =    "Proceedings of the Seventh International Workshop on
                 Machine Learning",
  title =        "An incremental method for multivariate splits in
                 decision trees",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "58--65",
  year =         "1990",
  comment =      PRNNunref,
}

@Article{Valiant.84,
  author =       "L. G. Valiant",
  title =        "A theory of the learnable",
  journal =      "Communications of the Association for Computing
                 Machinery",
  volume =       "27",
  pages =        "1134--1142",
  year =         "1984",
  note =         MLset,
  comment =      PRNNref,
}

@Article{VanRyzin.66,
  author =       "J. {Van Ryzin}",
  title =        "{Bayes} risk consistency of classification procedures
                 using density estimation",
  journal =      "Sankhy{\=a}",
  volume =       "A28",
  pages =        "261--270",
  year =         "1966",
  comment =      PRNNref,
}

% The citation key keeps the historical spelling "Welde" so that existing
% citations still resolve; the author field carries the correct surname.
@InProceedings{VanWelde.89,
  author =       "W. {Van de Velde}",
  editor =       "K. Morik",
  booktitle =    "Proceedings of the Fourth European Working Session on
                 Learning",
  title =        "{IDL}, or taming the multiplexer",
  publisher =    "Pitman",
  address =      "London",
  pages =        "211--226",
  year =         "1989",
  comment =      PRNNunref,
}

% The citation key keeps the historical spelling "Welde" so that existing
% citations still resolve; the author field carries the correct surname.
@InProceedings{VanWelde.90,
  author =       "W. {Van de Velde}",
  editor =       "B. W. Porter and R. J. Mooney",
  booktitle =    "Proceedings of the Seventh International Workshop on
                 Machine Learning",
  title =        "Incremental induction of topologically minimal trees",
  publisher =    MK,
  address =      "San Mateo, CA",
  pages =        "66--74",
  year =         "1990",
  comment =      PRNNunref,
}

@Book{Vapnik.82,
  author =       "V. N. Vapnik",
  title =        "Estimation of Dependencies based on Empirical Data",
  publisher =    Springer,
  address =      "New York",
  year =         "1982",
  comment =      PRNNunref,
}

@InProceedings{Vapnik.92,
  author =       "V. Vapnik",
  title =        "Principles of risk minimization for learning theory",
  crossref =     "NIPS4",
  pages =        "831--838",
  year =         "1992",
  comment =      PRNNref,
}

@Book{Vapnik.95,
  author =       "V. N. Vapnik",
  title =        "The Nature of Statistical Learning Theory",
  publisher =    Springer,
  address =      "New York",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Vapnik.Chervonenkis.71,
  author =       "V. N. Vapnik and A. Ya. Chervonenkis",
  title =        "On the uniform convergence of relative frequencies of
                 events to their probabilities",
  journal =      "Theory of Probability and its Applications",
  volume =       "16",
  pages =        "264--280",
  year =         "1971",
  comment =      PRNNref,
}

@Book{Venables.Ripley.94,
  author =       "W. N. Venables and B. D. Ripley",
  title =        "Modern Applied Statistics with {S}-Plus",
  publisher =    Springer,
  address =      "New York",
  year =         "1994",
  ISBN =         "0-387-94350-1",
  comment =      PRNNref,
}

@InProceedings{Verma.Pearl.90,
  author =       "T. Verma and J. Pearl",
  editor =       "R. D. Shachter and T. S. Levitt and L. N. Kanal and J.
                 F. Lemmer",
  booktitle =    "Uncertainty in Artificial Intelligence 4",
  title =        "Causal networks: semantics and expressiveness",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  pages =        "69--76",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Verma.Pearl.91,
  author =       "T. S. Verma and J. Pearl",
  editor =       "P. P. Bonissone and M. Henrion and L. N. Kanal and J.
                 F. Lemmer",
  booktitle =    "Uncertainty in Artificial Intelligence 6",
  title =        "Equivalence and synthesis of causal models",
  publisher =    "North-Holland",
  address =      "Amsterdam",
  pages =        "255--268",
  year =         "1991",
  comment =      PRNNref,
}

@Article{Villegas.69,
  author =       "C. Villegas",
  title =        "On the a priori distribution of the covariance
                 matrix",
  journal =      AnnMathStat,
  volume =       "40",
  pages =        "1098--1099",
  year =         "1969",
  comment =      PRNNref,
}

@Article{Vinod.69,
  author =       "H. Vinod",
  title =        "Integer programming and the theory of grouping",
  journal =      JASA,
  volume =       "64",
  pages =        "506--517",
  year =         "1969",
  comment =      PRNNref,
}

% The citation key keeps the historical spelling "Vlachonikolos" so that
% existing citations still resolve; the author field carries the correct
% surname.
@Article{Vlachonikolos.90,
  author =       "I. Vlachonikolis",
  title =        "Predictive discrimination and classification with
                 mixed binary and continuous variables",
  journal =      Bka,
  volume =       "77",
  pages =        "657--662",
  year =         "1990",
  comment =      PRNNref,
}

@Article{Wagner.73,
  author =       "T. J. Wagner",
  title =        "Convergence of the edited nearest neighbor",
  journal =      IEIT,
  volume =       "19",
  pages =        "696--697",
  year =         "1973",
  comment =      PRNNref,
}

@Book{Wahba.90,
  author =       "G. Wahba",
  title =        "Spline Models for Observational Data",
  publisher =    "SIAM",
  address =      "Philadelphia",
  year =         "1990",
  comment =      PRNNref,
}

@InProceedings{Wahba.95,
  author =       "G. Wahba",
  editor =       "M. Arbib",
  booktitle =    "The Handbook of Brain Theory and Neural Networks",
  title =        "Generalization and regularization in nonlinear
                 learning systems",
  publisher =    "The MIT Press",
  address =      "Cambridge, MA",
  pages =        "426--430",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Wahba.Wold.75,
  author =       "G. Wahba and S. Wold",
  title =        "A completely automatic French curve",
  journal =      "Communications in Statistics",
  volume =       "4",
  pages =        "1--17",
  year =         "1975",
  comment =      PRNNunref,
}

@InProceedings{Wahba.ZZ.95,
  author =       "G. Wahba and C. Gu and Y. Wang and R. Chappell",
  title =        "Soft classification a.k.a. risk estimation via
                 penalized log likelihood and smoothing spline analysis
                 of variance",
  crossref =     "Wolpert.95",
  pages =        "331--359",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Wakahara.93,
  author =       "T. Wakahara",
  title =        "Towards robust handwritten character recognition",
  journal =      PRL,
  volume =       "14",
  pages =        "345--354",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Wallace.Freeman.87,
  author =       "C. S. Wallace and P. R. Freeman",
  title =        "Estimation and inference by compact encoding (with
                 discussion)",
  journal =      JRSSB,
  volume =       "49",
  pages =        "240--265",
  year =         "1987",
  comment =      PRNNref,
}

@Book{Wand.Jones.95,
  author =       "M. P. Wand and M. C. Jones",
  title =        "Kernel Smoothing",
  publisher =    "Chapman \& Hall",
  address =      "London",
  year =         "1995",
  comment =      PRNNref,
}

@Article{Wang.Suen.84,
  author =       "Q. R. Wang and C. Y. Suen",
  title =        "Analysis and design of a decision tree based on
                 entropy reduction and its application to large
                 character set recognition",
  journal =      PAMI,
  volume =       "6",
  pages =        "406--417",
  year =         "1984",
  comment =      PRNNref,
}

@Article{Wang.Suen.87,
  author =       "Q. R. Wang and C. Y. Suen",
  title =        "Large tree classifier with heuristic search and global
                 training",
  journal =      PAMI,
  volume =       "9",
  pages =        "91--102",
  year =         "1987",
  comment =      PRNNref,
}

@InProceedings{Wang.ZZ.94,
  author =       "C. Wang and S. S. Venkatesh and J. S. Judd",
  title =        "Optimal stopping and effective machine complexity in
                 learning",
  crossref =     "NIPS6",
  pages =        "303--310",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Ward.63,
  author =       "Ward, Jr., J. H.",
  title =        "Hierarchical grouping to optimize an objective
                 function",
  journal =      JASA,
  volume =       "58",
  pages =        "236--244",
  year =         "1963",
  comment =      PRNNref,
}

@Article{Warner.ZZ.61,
  author =       "H. R. Warner and A. F. Toronto and L. R. Veasey and R.
                 Stephenson",
  title =        "A mathematical model for medical
                 diagnosis---application to congenital heart disease",
  journal =      "Journal of the American Medical Association",
  volume =       "177",
  pages =        "177--184",
  year =         "1961",
  comment =      PRNNunref,
}

@Book{Wasserman.93,
  author =       "P. D. Wasserman",
  title =        "Advanced Methods in Neural Computing",
  publisher =    "Van Nostrand Reinhold",
  address =      "New York",
  year =         "1993",
  comment =      PRNNref,
}

@Book{Watanabe.69,
  author =       "S. Watanabe",
  title =        "Knowing and Guessing",
  publisher =    Wiley,
  address =      "New York",
  year =         "1969",
  comment =      PRNNunref,
}

@InProceedings{Waterhouse.Robinson.94,
  author =       "S. R. Waterhouse and A. J. Robinson",
  booktitle =    "Proceedings of the 1994 IEEE Workshop on Neural
                 Networks for Signal Processing IV",
  title =        "Classification using hierarchical mixtures of
                 experts",
  publisher =    "IEEE Press",
  address =      "Long Beach, CA",
  pages =        "177--186",
  year =         "1994",
  comment =      PRNNunref,
}

@InProceedings{Watrous.87,
  author =       "R. L. Watrous",
  editor =       "M. Caudill and C. Butler",
  booktitle =    "Proceedings of the IEEE First International Conference
                 on Neural Networks (San Diego, 1987)",
  title =        "Learning algorithms for connectionist networks:
                 applied gradient methods of nonlinear optimization",
  volume =       "II",
  publisher =    "IEEE Press",
  address =      "New York",
  pages =        "619--627",
  year =         "1987",
  comment =      PRNNref,
}

@Article{Webb.94,
  author =       "A. R. Webb",
  title =        "Functional approximation by feed-forward networks: a
                 least-squares approach",
  journal =      TNN,
  volume =       "5",
  pages =        "363--371",
  year =         "1994",
  comment =      PRNNref,
}

@Book{Weigend.Gershenfeld.93,
  editor =       "A. S. Weigend and N. A. Gershenfeld",
  title =        "Time Series Prediction: Forecasting the Future and
                 Understanding the Past",
  publisher =    "Addison-Wesley",
  address =      "Reading, MA",
  year =         "1993",
  comment =      PRNNref,
}

@Article{Weigend.ZZ.90,
  author =       "A. S. Weigend and B. A. Huberman and D. E. Rumelhart",
  title =        "Predicting the future: a connectionist approach",
  journal =      IJNS,
  volume =       "1",
  pages =        "193--209",
  year =         "1990",
  comment =      PRNNunref,
}

@InProceedings{Weigend.ZZ.91,
  author =       "A. S. Weigend and D. E. Rumelhart and B. A. Huberman",
  title =        "Generalization by weight-elimination with application
                 to forecasting",
  crossref =     "NIPS3",
  pages =        "875--882",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Weigend.ZZ.92,
  author =       "A. S. Weigend and B. A. Huberman and D. E. Rumelhart",
  editor =       "M. Casdagli and S. Eubank",
  booktitle =    "Nonlinear Modeling and Forecasting",
  title =        "Predicting sunspots and exchange rates with
                 connectionist networks",
  publisher =    "Addison-Wesley",
  address =      "Redwood City, CA",
  pages =        "395--432",
  year =         "1992",
  comment =      PRNNref,
}

@Article{Weiss.91,
  author =       "S. M. Weiss",
  title =        "Small sample error rate estimation for $k$-{NN}
                 classifiers",
  journal =      PAMI,
  volume =       "13",
  pages =        "285--289",
  year =         "1991",
  comment =      PRNNref,
}

@Book{Weiss.Kulikowski.91,
  author =       "S. M. Weiss and C. A. Kulikowski",
  title =        "Computer Systems that Learn: Classification and
                 Prediction Methods from Statistics, Neural Nets,
                 Machine Learning and Expert Systems",
  publisher =    MK,
  address =      "San Mateo, CA",
  year =         "1991",
  comment =      PRNNref,
}

@InProceedings{Wen.90,
  author =       "W. X. Wen",
  booktitle =    "Proceedings of the Sixth Workshop on Uncertainty in
                 Artificial Intelligence (Cambridge, MA)",
  title =        "Optimal decomposition of belief functions",
  pages =        "245--256",
  year =         "1990",
  comment =      PRNNunref,
}

@PhdThesis{Werbos.74,
  author =       "P. J. Werbos",
  title =        "Beyond Regression: New Tools for Prediction and
                 Analysis in the Behavioral Sciences",
  school =       "Harvard University",
  year =         "1974",
  note =         "[Reprinted in \cite{Werbos.94}]",
  comment =      PRNNref,
}

@InProceedings{Werbos.88,
  author    = {P. J. Werbos},
  title     = {Backpropagation: past and future},
  booktitle = {Proceedings of the IEEE International Conference on
               Neural Networks, San Diego, 1988},
  volume    = {I},
  pages     = {343--353},
  publisher = {IEEE Press},
  address   = {Long Beach, CA},
  year      = {1988},
  comment   = PRNNref,
}

@Book{Werbos.94,
  author    = {P. J. Werbos},
  title     = {The Roots of Backpropagation. From Ordered Derivatives
               to Neural Networks and Political Forecasting},
  year      = {1994},
  publisher = Wiley,
  address   = {New York},
  comment   = PRNNref,
}

@Book{West.Harrison.89,
  author    = {M. West and P. J. Harrison},
  title     = {{Bayesian} Forecasting and Dynamic Models},
  year      = {1989},
  publisher = Springer,
  address   = {New York},
  comment   = PRNNref,
}

% Author surname corrected to "Wettschereck". The citation key keeps the old
% spelling so that existing \cite commands still resolve.
% Fields not given here come from the NIPS4 parent via crossref.
@InProceedings{Wetterschereck.Dietterich.92,
  author =       "D. Wettschereck and T. Dietterich",
  title =        "Improving the performance of radial basis function
                 networks by learning center locations",
  crossref =     "NIPS4",
  pages =        "1133--1140",
  year =         "1992",
  comment =      PRNNref,
}

@Article{White.82,
  author  = {H. White},
  title   = {Maximum-likelihood estimation of mis-specified
             models},
  journal = {Econometrica},
  year    = {1982},
  volume  = {50},
  pages   = {1--25},
  comment = PRNNref,
}

@Article{White.89a,
  author  = {H. White},
  title   = {Learning in artificial neural networks: {A}
             statistical perspective},
  journal = NC,
  year    = {1989},
  volume  = {1},
  pages   = {425--464},
  note    = {[Reprinted in \cite{White.92}]},
  comment = PRNNref,
}

@Article{White.89b,
  author  = {H. White},
  title   = {Some asymptotic results for learning in single
             hidden-layer feedforward networks},
  journal = JASA,
  year    = {1989},
  volume  = {84},
  pages   = {1003--1013},
  note    = {[Reprinted in \cite{White.92}. Correction:
             \textbf{87}, 1252]},
  comment = PRNNref,
}

@Article{White.90,
  author  = {H. White},
  title   = {Connectionist nonparametric regression: multilayer
             feedforward networks can learn arbitrary mappings},
  journal = NNks,
  year    = {1990},
  volume  = {3},
  pages   = {535--549},
  note    = {[Reprinted in \cite{White.92}]},
  comment = PRNNref,
}

@Book{White.92,
  author    = {H. White},
  title     = {Artificial Neural Networks: Approximation and Learning
               Theory},
  year      = {1992},
  publisher = {Blackwell},
  address   = {Oxford},
  comment   = PRNNref,
}

% Second author's surname corrected to "Wooldridge". The citation key keeps
% the old spelling so that existing \cite commands still resolve.
@InProceedings{White.Woolridge.91,
  author =       "H. White and J. Wooldridge",
  editor =       "W. Barnett and J. Powell and G. Tauchen",
  booktitle =    "Nonparametric and Semi-Parametric Methods in
                 Econometrics and Statistics",
  title =        "Some results on sieve estimation with dependent
                 observations",
  publisher =    "Cambridge University Press",
  address =      "New York",
  year =         "1991",
  note =         "[Reprinted in \cite{White.92}]",
  comment =      PRNNunref,
}

% The second author uses the "Last, Jr., First" name form so that BibTeX
% parses "Jr." as a suffix.
@Article{Widrow.Hoff.60,
  author  = {B. Widrow and Hoff, Jr., M. E.},
  title   = {Adaptive switching circuits},
  journal = {IRE WESCON Convention Record},
  year    = {1960},
  volume  = {4},
  pages   = {96--104},
  note    = {[Reprinted in \cite{Anderson.Rosenfeld.88}]},
  comment = PRNNunref,
}

@Article{Williams.Lambert.59,
  author  = {W. T. Williams and J. M. Lambert},
  title   = {Multivariate methods in plant ecology. {I}.
             Association-analysis in plant communities},
  journal = {Journal of Ecology},
  year    = {1959},
  volume  = {47},
  pages   = {83--101},
  comment = PRNNunref,
}

@Article{Wilson.72,
  author  = {D. L. Wilson},
  title   = {Asymptotic properties of nearest neighbor rules using
             edited data},
  journal = SMC,
  year    = {1972},
  volume  = {2},
  pages   = {408--421},
  note    = NNset,
  comment = PRNNref,
}

% The title is written out instead of borrowing the AI journal-name macro:
% if that macro is ever changed to an abbreviated journal title, this book's
% title must not change with it. The expanded text matches the current macro.
@Book{Winston.92,
  author =       "P. H. Winston",
  title =        "Artificial Intelligence",
  publisher =    "Addison-Wesley",
  address =      "Reading, MA",
  edition =      "Third",
  year =         "1992",
  comment =      PRNNref,
}

% Second author's surname corrected to "Mangasarian". The citation key keeps
% the old spelling so that existing \cite commands still resolve.
@Article{Wolberg.Mangarasian.90,
  author =       "W. H. Wolberg and O. L. Mangasarian",
  title =        "Multisurface method of pattern separation for medical
                 diagnosis applied to breast cytology",
  journal =      PNAS,
  volume =       "87",
  pages =        "9193--9196",
  year =         "1990",
  comment =      PRNNref,
}

% Journal name corrected to its published (American) spelling, "Behavioral".
@Article{Wolfe.70,
  author =       "J. H. Wolfe",
  title =        "Pattern clustering via multivariate mixture analysis",
  journal =      "Multivariate Behavioral Research",
  volume =       "5",
  pages =        "329--350",
  year =         "1970",
  comment =      PRNNunref,
}

@Article{Wolpert.92,
  author  = {D. H. Wolpert},
  title   = {Stacked generalization},
  journal = NNks,
  year    = {1992},
  volume  = {5},
  pages   = {241--259},
  comment = PRNNref,
}

% Fields not given here come from the NIPS5 parent via crossref.
@InProceedings{Wolpert.93,
  author   = {D. H. Wolpert},
  title    = {On the use of evidence in neural networks},
  year     = {1993},
  pages    = {539--546},
  crossref = {NIPS5},
  comment  = PRNNref,
}

% Fields not given here come from the NIPS6 parent via crossref.
@InProceedings{Wolpert.94a,
  author   = {D. H. Wolpert},
  title    = {{Bayesian} backpropagation over {I}-{O} functions
              rather than weights},
  year     = {1994},
  pages    = {200--207},
  crossref = {NIPS6},
  comment  = PRNNref,
}

@Article{Wolpert.94b,
  author  = {D. H. Wolpert},
  title   = {Contribution to the discussion of \cite{Ripley.94a}},
  journal = JRSSB,
  year    = {1994},
  volume  = {56},
  pages   = {450--451},
  comment = PRNNref,
}

@Article{Wu.83,
  author  = {C. F. J. Wu},
  title   = {On the convergence properties of the {EM} algorithm},
  journal = AnnStat,
  year    = {1983},
  volume  = {11},
  pages   = {95--103},
  comment = PRNNref,
}

% Second author's surname corrected from "Kryzak" to Krzyzak, written with
% the Polish dotted z as a BibTeX special character.
@Article{Xu.ZZ.92,
  author =       "L. Xu and A. Krzy{\.z}ak and C. Y. Suen",
  title =        "Methods of combining multiple classifiers and their
                 applications to handwriting recognition",
  journal =      SMC,
  volume =       "22",
  pages =        "418--435",
  year =         "1992",
  comment =      PRNNref,
}

% Second author's surname corrected from "Kryzak" to Krzyzak, written with
% the Polish dotted z as a BibTeX special character.
@Article{Xu.ZZ.94,
  author =       "L. Xu and A. Krzy{\.z}ak and A. Yuille",
  title =        "On radial basis function nets and kernel regression:
                 statistical consistency, convergence rates, and
                 receptive field sizes",
  journal =      NNks,
  volume =       "7",
  pages =        "609--628",
  year =         "1994",
  comment =      PRNNref,
}

@Article{Yair.Gersho.90a,
  author  = {E. Yair and A. Gersho},
  title   = {The {Boltzmann} perceptron network: a soft
             classifier},
  journal = NNks,
  year    = {1990},
  volume  = {3},
  pages   = {203--221},
  comment = PRNNref,
}

% Page range corrected: the paper ends on page 1628; "1678" was a typo.
@Article{Yair.Gersho.90b,
  author =       "E. Yair and A. Gersho",
  title =        "Maximum \emph{a posteriori} decision and evaluation of
                 class probabilities by {Boltzmann} perceptron
                 classifiers",
  journal =      PIEEE,
  volume =       "78",
  pages =        "1620--1628",
  year =         "1990",
  note =         rep-Lau,
  comment =      PRNNref,
}

% Title corrected to "minimum fill-in", as published, and the journal name
% to "SIAM Journal on ..." (SIAM journals use "on", not "of").
@Article{Yannakakis.81,
  author =       "M. Yannakakis",
  title =        "Computing the minimum fill-in is {NP}-complete",
  journal =      "SIAM Journal on Algebraic and Discrete Methods",
  volume =       "2",
  pages =        "77--79",
  year =         "1981",
  comment =      PRNNref,
}

@Article{York.92,
  author  = {J. York},
  title   = {Use of the {Gibbs} sampler in expert systems},
  journal = AI,
  year    = {1992},
  volume  = {56},
  pages   = {115--130, 397--398},
  comment = PRNNref,
}

@Book{Young.Calvert.74,
  author    = {T. Y. Young and T. W. Calvert},
  title     = {Classification, Estimation and Pattern Recognition},
  year      = {1974},
  publisher = {American Elsevier},
  address   = {New York},
  comment   = PRNNref,
}

@Article{Young.Householder.38,
  author  = {G. Young and A. S. Householder},
  title   = {Discussion of a set of points in terms of their mutual
             distances},
  journal = PSym,
  year    = {1938},
  volume  = {3},
  pages   = {19--22},
  comment = PRNNunref,
}

@Article{Zador.82,
  author  = {P. L. Zador},
  title   = {Asymptotic quantization error of continuous signals
             and the quantization dimension},
  journal = IEIT,
  year    = {1982},
  volume  = {28},
  pages   = {139--149},
  comment = PRNNref,
}

@Article{Zeger.ZZ.92,
  author  = {K. Zeger and J. Vaisey and A. Gersho},
  title   = {Globally optimal vector quantization design by
             stochastic relaxation},
  journal = {IEEE Transactions on Signal Processing},
  year    = {1992},
  volume  = {40},
  pages   = {310--322},
  comment = PRNNref,
}

% Fields not given here come from the NIPS4 parent via crossref.
@InProceedings{Zhao.Atkeson.92,
  author   = {Y. Zhao and C. G. Atkeson},
  title    = {Some approximation properties of projection pursuit
              learning networks},
  year     = {1992},
  pages    = {936--943},
  crossref = {NIPS4},
  comment  = PRNNref,
}

% cross-references -----------------------------------------------

% Crossref parent: booktitle duplicates title so that classic BibTeX entries
% which crossref this volume inherit a booktitle.
@Book{NIPS1,
  editor    = {D. S. Touretzky},
  title     = {Advances in Neural Information Processing Systems.
               Proceedings of the 1988 Conference},
  booktitle = {Advances in Neural Information Processing Systems.
               Proceedings of the 1988 Conference},
  year      = {1989},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

% Crossref parent: booktitle duplicates title so that classic BibTeX entries
% which crossref this volume inherit a booktitle.
@Book{NIPS2,
  editor    = {D. S. Touretzky},
  title     = {Advances in Neural Information Processing Systems 2.
               Proceedings of the 1989 Conference},
  booktitle = {Advances in Neural Information Processing Systems 2.
               Proceedings of the 1989 Conference},
  year      = {1990},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

% Crossref parent: booktitle duplicates title so that classic BibTeX entries
% which crossref this volume inherit a booktitle.
@Book{NIPS3,
  editor    = {R. P. Lippmann and J. E. Moody and D. S. Touretzky},
  title     = {Advances in Neural Information Processing Systems 3.
               Proceedings of the 1990 Conference},
  booktitle = {Advances in Neural Information Processing Systems 3.
               Proceedings of the 1990 Conference},
  year      = {1991},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

% Crossref parent: booktitle duplicates title so that classic BibTeX entries
% which crossref this volume inherit a booktitle.
@Book{NIPS4,
  editor    = {J. E. Moody and S. J. Hanson and R. P. Lippmann},
  title     = {Advances in Neural Information Processing Systems 4.
               Proceedings of the 1991 Conference},
  booktitle = {Advances in Neural Information Processing Systems 4.
               Proceedings of the 1991 Conference},
  year      = {1992},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

% Crossref parent: booktitle duplicates title so that classic BibTeX entries
% which crossref this volume inherit a booktitle.
@Book{NIPS5,
  editor    = {S. J. Hanson and J. D. Cowan and C. L. Giles},
  title     = {Advances in Neural Information Processing Systems 5.
               Proceedings of the 1992 Conference},
  booktitle = {Advances in Neural Information Processing Systems 5.
               Proceedings of the 1992 Conference},
  year      = {1993},
  publisher = MK,
  address   = {San Mateo, CA},
  comment   = PRNNref,
}

% Crossref parent: booktitle duplicates title so that classic BibTeX entries
% which crossref this volume inherit a booktitle.
@Book{NIPS6,
  editor    = {J. D. Cowan and G. Tesauro and J. Alspector},
  title     = {Advances in Neural Information Processing Systems 6.
               Proceedings of the 1993 Conference},
  booktitle = {Advances in Neural Information Processing Systems 6.
               Proceedings of the 1993 Conference},
  year      = {1994},
  publisher = MK,
  address   = {San Francisco, CA},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Chambers.Hastie.92,
  editor    = {J. M. Chambers and T. J. Hastie},
  title     = {Statistical Models in {S}},
  booktitle = {Statistical Models in {S}},
  year      = {1992},
  publisher = {Wadsworth and Brooks/Cole},
  address   = {Pacific Grove, CA},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Cherkassky.ZZ.94,
  editor    = {V. Cherkassky and J. H. Friedman and H. Wechsler},
  title     = {From Statistics to Neural Networks. Theory and Pattern
               Recognition Applications},
  booktitle = {From Statistics to Neural Networks. Theory and Pattern
               Recognition Applications},
  year      = {1994},
  publisher = Springer,
  address   = {Berlin},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Gammerman.95,
  editor    = {A. Gammerman},
  title     = {Probabilistic Reasoning and {Bayesian} Belief
               Networks},
  booktitle = {Probabilistic Reasoning and {Bayesian} Belief
               Networks},
  year      = {1995},
  publisher = {Alfred Waller},
  address   = {Henley-on-Thames},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Mammone.93,
  editor    = {R. J. Mammone},
  title     = {Artificial Neural Networks for Speech and Vision},
  booktitle = {Artificial Neural Networks for Speech and Vision},
  year      = {1993},
  publisher = {Chapman \& Hall},
  address   = {London},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Oliver.Smith.90,
  editor    = {R. M. Oliver and J. Q. Smith},
  title     = {Influence Diagrams, Belief Nets and Decision
               Analysis},
  booktitle = {Influence Diagrams, Belief Nets and Decision
               Analysis},
  year      = {1990},
  publisher = Wiley,
  address   = {Chichester},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Sethi.Jain.91,
  editor    = {I. K. Sethi and A. K. Jain},
  title     = {Artificial Neural Networks and Statistical Pattern
               Recognition. Old and New Connections},
  booktitle = {Artificial Neural Networks and Statistical Pattern
               Recognition. Old and New Connections},
  year      = {1991},
  publisher = {North Holland},
  address   = {Amsterdam},
  comment   = PRNNref,
}

% Edited volume; booktitle duplicates title so that classic BibTeX entries
% which crossref it inherit a booktitle.
@Book{Wolpert.95,
  editor    = {D. H. Wolpert},
  title     = {The Mathematics of Generalization},
  booktitle = {The Mathematics of Generalization},
  year      = {1995},
  publisher = {Addison-Wesley},
  address   = {Reading, MA},
  comment   = PRNNref,
}
