% Reference list in natbib author-year format.
% Each \bibitem's optional argument has the form
%   [ShortAuthors(Year)FullAuthorList]
% and is parsed by natbib; the braced argument is the cite key used by \cite.
\begin{thebibliography}{19}
% Fallback definitions, applied only when the macro is not already defined
% (or is \relax): \natexlab prints the a/b suffix that disambiguates
% same-author, same-year entries; \url typesets its argument in typewriter.
\providecommand{\natexlab}[1]{#1}
\providecommand{\url}[1]{\texttt{#1}}

\bibitem[Bernardo and Smith(1994)]{Bernardo94}
J.~M. Bernardo and A.~F.~M. Smith.
\newblock \emph{Bayesian Theory}.
\newblock Wiley Series in Probability and Mathematical Statistics. John Wiley
  and Sons, Chichester, 1994.

\bibitem[Boulton and Wallace(1970)]{Boulton70}
D.~M. Boulton and C.~S. Wallace.
\newblock A program for numerical classification.
\newblock \emph{The Computer Journal}, 13\penalty0 (1):\penalty0 63--69, 1970.

% NOTE(review): 60 was previously emitted as an issue number with no volume;
% it is now placed in the volume slot. Confirm the issue number and page range
% against the journal.
\bibitem[Denison et~al.(1998)Denison, Mallick, and Smith]{Denison98}
D.~G.~T. Denison, B.~K. Mallick, and A.~F.~M. Smith.
\newblock Automatic {B}ayesian curve fitting.
\newblock \emph{Journal of the Royal Statistical Society. Series B
  (Methodological)}, 60:\penalty0 335--350, 1998.

\bibitem[Dobson(1983)]{Dobson83}
A.~J. Dobson.
\newblock \emph{An Introduction to Statistical Modelling}.
\newblock Chapman and Hall, London, 1983.

\bibitem[Donoho and Johnstone(1994)]{Donoho94}
D.~L. Donoho and I.~M. Johnstone.
\newblock Ideal spatial adaptation by wavelet shrinkage.
\newblock \emph{Biometrika}, 81:\penalty0 425--455, 1994.

\bibitem[Dowe et~al.(1998)Dowe, Baxter, Oliver, and Wallace]{Dowe98}
D.~L. Dowe, R.~A. Baxter, J.~J. Oliver, and C.~S. Wallace.
\newblock Point estimation using the {K}ullback-{L}eibler loss function and
  {MML}.
\newblock In \emph{Pacific-Asia Conference on Knowledge Discovery and Data
  Mining (PAKDD98)}, volume 1394 of \emph{Lecture Notes in Artificial
  Intelligence}, pages 87--95. Springer-Verlag, 1998.

\bibitem[Farr and Wallace(2002)]{Farr02}
G.~E. Farr and C.~S. Wallace.
\newblock The complexity of strict minimum message length inference.
\newblock \emph{The Computer Journal}, 45\penalty0 (3):\penalty0 285--292, 2002.

\bibitem[Fitzgibbon et~al.(2002{\natexlab{a}})Fitzgibbon, Dowe, and Allison]{Fitzgibbon02c}
L.~J. Fitzgibbon, D.~L. Dowe, and L.~Allison.
\newblock Message from {M}onte {C}arlo.
\newblock Technical Report 107, School of Computer Science and Software
  Engineering, Monash University, Clayton, Victoria 3800, Australia,
  2002{\natexlab{a}}.

\bibitem[Fitzgibbon et~al.(2002{\natexlab{b}})Fitzgibbon, Dowe, and Allison]{Fitzgibbon02a}
L.~J. Fitzgibbon, D.~L. Dowe, and L.~Allison.
\newblock Univariate polynomial inference by {M}onte {C}arlo message length
  approximation.
\newblock In C.~Sammut and A.~Hoffmann, editors, \emph{Proceedings of the
  Nineteenth International Conference on Machine Learning (ICML-2002)}, pages
  147--154, San Francisco, July 2002{\natexlab{b}}. University of New South
  Wales, Sydney, Australia, Morgan Kaufmann.

% Title capitalisation and publisher spelling aligned with the other book
% entries in this list (cf. Dobson83).
\bibitem[Gilks et~al.(1996)Gilks, Richardson, and Spiegelhalter]{Gilks96}
W.~R. Gilks, S.~Richardson, and D.~J. Spiegelhalter.
\newblock \emph{{M}arkov Chain {M}onte {C}arlo in Practice}.
\newblock Chapman and Hall, London, 1996.

\bibitem[Gilks et~al.(1994)Gilks, Thomas, and Spiegelhalter]{Gilks94}
W.~R. Gilks, A.~Thomas, and D.~J. Spiegelhalter.
\newblock A language and program for complex {B}ayesian modelling.
\newblock \emph{Statistician. Special Issue: Conference on Practical
  {B}ayesian Statistics}, 43\penalty0 (1):\penalty0 169--177, 1994.

\bibitem[Green(1995)]{Green95}
P.~J. Green.
\newblock Reversible jump {M}arkov chain {M}onte {C}arlo computation and
  {B}ayesian model determination.
\newblock \emph{Biometrika}, 82:\penalty0 711--732, 1995.

\bibitem[Lindsey(1994)]{Lindsey94}
J.~K. Lindsey.
\newblock \emph{Models for Repeated Measurements}.
\newblock Oxford Statistical Science Series 10. Clarendon Press, Oxford, 1994.

% NOTE(review): this entry gives the first author as "D. M. Madigan" while
% Raftery97 gives "D. Madigan" -- presumably the same person; confirm which
% form is correct and unify in the .bib source.
\bibitem[Madigan and Raftery(1994)]{Madigan94}
D.~M. Madigan and A.~E. Raftery.
\newblock Model selection and accounting for model uncertainty in graphical
  models using {O}ccam's window.
\newblock \emph{Journal of the American Statistical Association}, 89\penalty0
  (428):\penalty0 1535--1546, December 1994.

\bibitem[Raftery et~al.(1997)Raftery, Madigan, and Hoeting]{Raftery97}
A.~E. Raftery, D.~Madigan, and J.~A. Hoeting.
\newblock Bayesian model averaging for linear regression models.
\newblock \emph{Journal of the American Statistical Association}, 92:\penalty0
  179--191, 1997.

% Journal name written as in Boulton70 and Farr02.
\bibitem[Wallace and Boulton(1968)]{Wallace68}
C.~S. Wallace and D.~M. Boulton.
\newblock An information measure for classification.
\newblock \emph{The Computer Journal}, 11\penalty0 (2):\penalty0 185--194,
  August 1968.

\bibitem[Wallace and Boulton(1975)]{Wallace75}
C.~S. Wallace and D.~M. Boulton.
\newblock An invariant {B}ayes method for point estimation.
\newblock \emph{Classification Society Bulletin}, 3\penalty0 (3):\penalty0
  11--34, 1975.

\bibitem[Wallace and Dowe(1999)]{Wallace99}
C.~S. Wallace and D.~L. Dowe.
\newblock Minimum message length and {K}olmogorov complexity.
\newblock \emph{The Computer Journal, Special Issue---Kolmogorov Complexity},
  42\penalty0 (4):\penalty0 270--283, 1999.

\bibitem[Wallace and Freeman(1987)]{Wallace87}
C.~S. Wallace and P.~R. Freeman.
\newblock Estimation and inference by compact encoding (with discussion).
\newblock \emph{Journal of the Royal Statistical Society. Series B
  (Methodological)}, 49:\penalty0 240--265, 1987.

\end{thebibliography}