% Issue number moved out of the volume field ("1(1)") into its own field.
@article{quinlan86:iodt,
  author  = {J. Ross Quinlan},
  title   = {Induction of decision trees},
  journal = {Machine Learning},
  volume  = {1},
  number  = {1},
  pages   = {81--106},
  year    = {1986},
}

% Journal name spelled out in full instead of the ad-hoc "Anns. Statist.".
@article{efron79:bmalatj,
  author  = {Bradley Efron},
  title   = {Bootstrap Methods: Another look at the jackknife},
  journal = {The Annals of Statistics},
  volume  = {7},
  number  = {1},
  pages   = {1--26},
  year    = {1979},
}

% NOTE(review): this key uses ';' where sibling keys use ':'. It is left
% unchanged so existing citations still resolve; confirm before renaming.
@article{stone74;cvcaaosp,
  author  = {M. Stone},
  title   = {Cross-validatory choice and assessment of statistical predictions},
  journal = {Journal of the Royal Statistical Society, Series B},
  volume  = {36},
  number  = {2},
  pages   = {111--147},
  year    = {1974},
}


% Title typo fixed ("Asymtotics"); issue number split out of the volume field.
@article{stone78:afaacv,
  author  = {M. Stone},
  title   = {Asymptotics for and against cross-validation},
  journal = {Biometrika},
  volume  = {64},
  number  = {1},
  pages   = {29--35},
  year    = {1977},
}

@article{schaffer93:oaab,
  author  = {C. Schaffer},
  title   = {Overfitting avoidance as bias},
  journal = {Machine Learning},
  volume  = {10},
  pages   = {153--178},
  year    = {1993},
}

% Volume moved from the booktitle into its own field.
% NOTE(review): pages were "1--26", identical to the efron79 entry and
% apparently copied from it; the chapter is normally cited as 80--203. Confirm.
@incollection{mosteller68:dais,
  author    = {F. Mosteller and J. W. Tukey},
  title     = {Data Analysis, Including Statistics},
  editor    = {G. Lindzey and E. Aronson},
  booktitle = {Handbook of Social Psychology},
  volume    = {2},
  publisher = {Addison-Wesley},
  pages     = {80--203},
  year      = {1968},
}

% Institution spelling fixed ("Sante Fe").
@techreport{wolpert93:ooaab,
  author      = {David H. Wolpert},
  title       = {On overfitting avoidance as bias},
  institution = {The Santa Fe Institute},
  number      = {SFI TR 92-03-5001},
  year        = {1992},
}


	
@inproceedings{mehta95:mbdtp,
  author    = {M. Mehta and J. Rissanen and R. Agrawal},
  title     = {{MDL}-based decision tree pruning},
  booktitle = {Proceedings of the First International Conference on Knowledge Discovery and Data Mining},
  publisher = {AAAI Press},
  pages     = {216--221},
  year      = {1995},
}

% Initials separated by spaces so each one is parsed as its own name token
% ("P.M." is otherwise a single token and abbreviates to "P.").
@article{murphy94:etdfaeiooridti,
  author  = {P. M. Murphy and M. J. Pazzani},
  title   = {Exploring the Decision Forest: An empirical investigation of {Occam's} {Razor} in decision tree induction},
  journal = {Journal of Artificial Intelligence Research},
  volume  = {1},
  pages   = {257--275},
  year    = {1994},
}

@book{miller90:ssir,
  author    = {Alan J. Miller},
  title     = {Subset Selection in Regression},
  publisher = {Chapman and Hall},
  year      = {1990},
}

%PAC  AA
@article{valiant84:dl,
  author  = {L. G. Valiant},
  title   = {Deductive Learning},
  journal = {Philosophical Transactions of the Royal Society of London A},
  volume  = {312},
  pages   = {441--446},
  year    = {1984},
}

%PAC  AA
% Volume corrected: Communications of the ACM for 1984 is volume 27 (was 25).
@article{valiant84:atotl,
  author  = {L. G. Valiant},
  title   = {A Theory of the Learnable},
  journal = {Communications of the ACM},
  volume  = {27},
  number  = {11},
  pages   = {1134--1142},
  year    = {1984},
}

% PAC AA
% NOTE(review): first page changed from 550 to 560; the paper is normally
% cited as pp. 560--566 of the IJCAI-85 proceedings. Confirm.
@inproceedings{valiant85:ldoc,
  author    = {L. G. Valiant},
  title     = {Learning Disjunctions of Conjunctions},
  booktitle = {Proceedings of the 9th International Joint Conference on Artificial Intelligence},
  pages     = {560--566},
  year      = {1985},
}

% The uniform convergence paper
@article{vapnik71:otucorfoettp,
  author  = {V. N. Vapnik and A. Y. Chervonenkis},
  title   = {On the uniform convergence of relative frequencies of events to their probabilities},
  journal = {Theory of Probability and its Applications},
  volume  = {16},
  number  = {2},
  pages   = {264--280},
  year    = {1971},
}

% This is a book, not a journal article: the journal and the year 1971 had
% been copied from the preceding vapnik71 entry. Entry type changed to book,
% the journal dropped, and the year set to 1982 to match the key.
% NOTE(review): the published title spells it "Dependences" - confirm.
@book{vapnik82:eodboed,
  author    = {V. N. Vapnik},
  title     = {Estimation of dependencies based on empirical data},
  publisher = {Springer Verlag},
  year      = {1982},
}

@article{schapire90:otsowk,
  author  = {Robert E. Schapire},
  title   = {The strength of weak learnability},
  journal = {Machine Learning},
  volume  = {5},
  number  = {2},
  pages   = {197--227},
  year    = {1990},
}

@article{rissanen78:mbsdd,
  author  = {J. Rissanen},
  title   = {Modeling by shortest data description},
  journal = {Automatica},
  volume  = {14},
  pages   = {465--471},
  year    = {1978},
}

@article{quinlan89:idtutmdlp,
  author  = {J. Ross Quinlan and Ron L. Rivest},
  title   = {Inferring decision trees using the minimum description length principle},
  journal = {Information and Computation},
  volume  = {80},
  number  = {3},
  pages   = {227--248},
  year    = {1989},
}

% Field name fixed: "PUBLISHED" is not a BibTeX field and was silently
% ignored, so the publisher never appeared in the output.
@inproceedings{freund90:bawlabm,
  author    = {Yoav Freund},
  title     = {Boosting a weak learning algorithm by majority},
  booktitle = {Proceedings of the 3rd Workshop on Computational Learning Theory},
  publisher = {Morgan Kaufmann},
  pages     = {202--216},
  year      = {1990},
}

% Field name fixed ("PUBLISHED" is ignored by BibTeX) and booktitle typo
% "Leaning" corrected to "Learning".
@inproceedings{freund92:aibaaiiolc,
  author    = {Yoav Freund},
  title     = {An improved boosting algorithm and its implications on learning complexity},
  booktitle = {Proceedings of the 5th Workshop on Computational Learning Theory},
  publisher = {ACM Press},
  pages     = {391--398},
  year      = {1992},
}

@article{board92:otnooa,
  author  = {R. Board and L. Pitt},
  title   = {On the necessity of {Occam} algorithms},
  journal = {Theoretical Computer Science},
  volume  = {100},
  pages   = {157--184},
  year    = {1992},
}

@article{baum89:wsngvg,
  author  = {E. Baum and D. Haussler},
  title   = {What size net gives valid generalization?},
  journal = {Neural Computation},
  volume  = {1},
  number  = {1},
  pages   = {151--160},
  year    = {1989},
}

@article{littlestone94:twma,
  author  = {N. Littlestone and M. Warmuth},
  title   = {The weighted majority algorithm},
  journal = {Information and Computation},
  volume  = {108},
  pages   = {212--261},
  year    = {1994},
}

@techreport{littlestone91:twma,
  author      = {N. Littlestone and M. Warmuth},
  title       = {The weighted majority algorithm},
  institution = {Univ. of California Santa Cruz, Computer Engineering and Information Sciences Dept.},
  number      = {UCSC-CRL-91-28},
  year        = {1991},
}

% Accent wrapped as a BibTeX special character ({\'e}) so sorting and label
% generation treat it as a single letter.
% NOTE(review): this book is usually cited with year 1983 - confirm the year.
@book{leadbetter80:earporsap,
  author    = {M. R. Leadbetter and Georg Lindgren and Holger Rootz{\'e}n},
  title     = {Extremes and Related Properties of Random Sequences and Processes},
  publisher = {Springer Verlag},
  year      = {1980},
}

@book{judd90:nndatcol,
  author    = {J. S. Judd},
  title     = {{Neural Network} Design and the Complexity of Learning},
  publisher = {MIT Press},
  year      = {1990},
}

% Entry type changed from article to incollection: the entry has a booktitle
% and an editor but no journal, so as an article it lost its container.
% NOTE(review): publisher added because incollection requires one; this
% volume is believed to be Chapman and Hall - confirm publisher and year.
@incollection{tukey93:tpomc,
  author    = {John W. Tukey},
  title     = {The problem of multiple comparisons},
  editor    = {Henry I. Braun},
  booktitle = {The Collected Works of John W. Tukey},
  volume    = {8},
  publisher = {Chapman and Hall},
  pages     = {1--300},
  year      = {1993},
}

@book{klockars86:mc,
  author    = {Alan J. Klockars and Gilbert Sax},
  title     = {Multiple Comparisons},
  publisher = {Sage Publications},
  year      = {1986},
}

% Hard-coded {\em ...}\/ markup removed from the note; presentation is left
% to the bibliography style.
@unpublished{tukey53:tpomc,
  author = {John W. Tukey},
  title  = {The problem of Multiple Comparisons},
  note   = {Unpublished manuscript, Princeton University},
  year   = {1953},
}

% Volume corrected: Biometrics for 1949 is volume 5 (was 9); issue 2 added.
@article{tukey49:cimitaov,
  author  = {John W. Tukey},
  title   = {Comparing individual means in the analysis of variance},
  journal = {Biometrics},
  volume  = {5},
  number  = {2},
  pages   = {99--114},
  year    = {1949},
}

@book{sarndal92:mass,
  author    = {Carl-Erik S{\"{a}}rndal and Bengt Swensson and Jan Wretman},
  title     = {Model Assisted Survey Sampling},
  series    = {Springer Series in Statistics},
  publisher = {Springer Verlag},
  year      = {1992},
}

% independent random groups 
% Title typo fixed ("gute" to "jute"); journal name given its macron.
@article{mahalanobis39:assotaujib,
  author  = {P. C. Mahalanobis},
  title   = {A sample survey of the acreage under jute in {Bengal}},
  journal = {Sankhy{\=a}},
  volume  = {4},
  pages   = {511--531},
  year    = {1939},
}

% Page range uses "--" (en dash) like every other entry, not a single hyphen.
@article{mahalanobis44:olsss,
  author  = {P. C. Mahalanobis},
  title   = {On large-scale sample surveys},
  journal = {Philosophical Transactions of the Royal Society of London B},
  volume  = {231},
  pages   = {329--451},
  year    = {1944},
}

% Page range uses "--" (en dash) like every other entry, not a single hyphen.
@article{mahalanobis46:reissitisi,
  author  = {P. C. Mahalanobis},
  title   = {Recent experiments in statistical sampling in the {Indian} {Statistical} {Institute}},
  journal = {Journal of the Royal Statistical Society},
  volume  = {109},
  pages   = {325--370},
  year    = {1946},
}

% NOTE(review): the key spells the author "demeng" while the author field
% says Deming; key kept as-is so existing citations still resolve.
@article{demeng56:ososdtrwepaws,
  author  = {W. E. Deming},
  title   = {On simplifications of sampling design through replication with equal probabilities and without stages},
  journal = {Journal of the American Statistical Association},
  volume  = {51},
  pages   = {24--53},
  year    = {1956},
}

# jackknife
@article{quenouille49:pips,
  author  = {M. H. Quenouille},
  title   = {Problems in plane sampling},
  journal = {Annals of Mathematical Statistics},
  volume  = {20},
  pages   = {355--375},
  year    = {1949},
}

# jackknife
@article{quenouille56:nobis,
  author  = {M. H. Quenouille},
  title   = {Notes on bias in estimation},
  journal = {Biometrika},
  volume  = {43},
  pages   = {353--360},
  year    = {1956},
}

# jackknife
@article{tukey58:bacisqls,
  author  = {John W. Tukey},
  title   = {Bias and confidence in not-quite large samples (abstract)},
  journal = {Annals of Mathematical Statistics},
  volume  = {29},
  pages   = {614},
  year    = {1958},
}

% Publisher city split out of the publisher field into address.
@book{efron82:bacisqls,
  author    = {Bradley Efron},
  title     = {The Jackknife, the Bootstrap, and other resampling plans},
  series    = {CBMS-NSF regional conference series in applied mathematics},
  publisher = {Society for Industrial and Applied Mathematics},
  address   = {Philadelphia},
  year      = {1982},
}

#----------------------------------------
# reinforcement learning

# awm's bib: /usr0/awm/l/papers/bib/all.bib

@techreport{gordon95:sfaidp,
  author      = {Geoffrey J. Gordon},
  title       = {Stable function approximation in dynamic programming},
  institution = {Carnegie Mellon University},
  number      = {CMU-CS-95-103},
  year        = {1995},
}

@inproceedings{gordon95:sfaidp:ml,
  author    = {Geoffrey J. Gordon},
  title     = {Stable function approximation in dynamic programming},
  booktitle = {Proceedings of 12th International Conference on Machine Learning},
  publisher = {Morgan Kaufmann},
  year      = {1995},
}

@techreport{davies97:miatffrl,
  author      = {Scott Davies},
  title       = {Multilinear Interpolation and Triangulation for Fast Reinforcement Learning},
  institution = {Carnegie Mellon University},
  number      = {(In writing)},
  year        = {1997},
}

% The placeholder author is wrapped in an extra pair of braces so BibTeX
% treats it as one indivisible name instead of splitting it into
% first/last parts ("reviews)" would otherwise become the surname).
@techreport{ng97:anatrl,
  author      = {{(Name omitted for anonymity in reviews)}},
  title       = {A new approach to {Reinforcement Learning} with function approximators},
  institution = {(Institution omitted)},
  number      = {(In writing)},
  year        = {1997},
}

% Whole-title bracing removed so the bibliography style can apply its own
% casing, as it does for the other entries in this file.
% NOTE(review): publisher changed from Morgan Kaufmann to MIT Press, which
% published the NIPS proceedings from volume 7 onwards - confirm.
@inproceedings{davies97:mtaifrl:nips,
  author    = {S. Davies},
  title     = {Multidimensional Triangulation and Interpolation for Reinforcement Learning},
  booktitle = {Advances in Neural Information Processing Systems 9},
  publisher = {MIT Press},
  year      = {1997},
}

% Redundant inner braces removed from every value; in particular the title
% is no longer fully braced, so the style can case it like the other entries.
@article{sutton88:ltpbtmotd,
  author  = {R. S. Sutton},
  title   = {Learning to Predict by the Methods of Temporal Differences},
  journal = {Machine Learning},
  volume  = {3},
  pages   = {9--44},
  year    = {1988},
}

% Publisher location split into the address field; redundant whole-value
% braces removed.
@book{bellman57:dp,
  author    = {R. E. Bellman},
  title     = {Dynamic Programming},
  publisher = {Princeton University Press},
  address   = {Princeton, NJ},
  year      = {1957},
}

% Whole-title bracing removed so the bibliography style can apply its own
% casing, consistent with the other entries in this file.
@inproceedings{boyan95:girl,
  author    = {Justin A. Boyan and Andrew W. Moore},
  title     = {Generalization in Reinforcement Learning: Safely Approximating the Value Function},
  booktitle = {Advances in Neural Information Processing Systems 7},
  year      = {1995},
}

# cite this for the "original" acrobot
% Whole-title bracing removed so the bibliography style can apply its own
% casing, consistent with the other entries in this file.
@inproceedings{sutton:girl,
  author    = {R. S. Sutton},
  title     = {Generalization in Reinforcement Learning: Successful Examples Using Sparse Coarse Coding},
  editor    = {D. Touretzky and M. Mozer and M. Hasselmo},
  booktitle = {Advances in Neural Information Processing Systems 8},
  year      = {1996},
}

% In LaTeX, backslash-doublequote is the umlaut accent, so the old number
% typeset an umlaut over the "T" instead of quotation marks. Proper
% ``...'' quotes are used now. Leading space in the institution removed.
@techreport{harmon96:ssttbe,
  author      = {M. E. Harmon and Leemon C. Baird},
  title       = {Spurious Solutions to the Bellman Equation},
  institution = {Wright-Patterson Air Force Base Ohio: Wright Laboratory},
  number      = {WL-TR-96-``To Be Assigned''},
  year        = {1996},
}

@inproceedings{baird95:ra:ml,
  author    = {Leemon C. Baird},
  title     = {Residual Algorithms: Reinforcement Learning with Function Approximation},
  booktitle = {Proceedings of 12th International Conference on Machine Learning},
  publisher = {Morgan Kaufmann},
  year      = {1995},
}

@inproceedings{baird95:ra,
  author    = {Leemon C. Baird},
  title     = {Residual Algorithms},
  editor    = {Justin A. Boyan and Andrew W. Moore and Richard S. Sutton},
  booktitle = {Proceedings of the Workshop on Value Function Approximation, Machine Learning Conference 1995},
  year      = {1995},
}

% The report identifier was stored in "type", which is meant for the report
% kind label (e.g. "Technical Report"); it now lives in "number".
% Whole-value bracing removed as well.
@techreport{tesauro91:piitdl,
  author      = {G. J. Tesauro},
  title       = {Practical Issues in Temporal Difference Learning},
  institution = {IBM T. J. Watson Research Center, NY},
  number      = {RC 17223 (76307)},
  year        = {1991},
}

% Second author fixed: "Leemon C. Baird, L. C." mixed two name forms and was
% parsed with "Leemon C. Baird" as the surname and "L. C." as the given name.
@inproceedings{williams94:tpbogpboivf,
  author    = {R. J. Williams and Leemon C. Baird},
  title     = {Tight Performance Bounds on Greedy Policies Based on Imperfect Value Functions},
  booktitle = {Proceedings of the Tenth Yale Workshop on Adaptive and Learning Systems},
  publisher = {Yale University},
  year      = {1994},
}

% NOTE(review): proceedings volume changed from 9 to 5; the 1993 NIPS volume
% is number 5 (volume 9 appeared in 1997, as in the davies97 entry). Confirm.
@inproceedings{bradtke93:rlatlqr,
  author    = {S. J. Bradtke},
  title     = {{Reinforcement Learning} applied to linear quadratic regulation},
  booktitle = {Advances in Neural Information Processing Systems 5},
  publisher = {Morgan Kaufmann},
  year      = {1993},
}

@mastersthesis{boyan92:mnnflcdgs,
  author = {Justin A. Boyan},
  title  = {Modular neural networks for learning context-dependent game strategies},
  school = {Cambridge University},
  year   = {1992},
}

@book{nric,
  author    = {William H. Press and Saul A. Teukolsky and William T. Vetterling and Brian Flannery},
  title     = {Numerical Recipes in C},
  publisher = {Cambridge University Press},
  year      = {1992},
}

% Author surname typo fixed ("Geralk" to "Gerald", matching the key); the
% edition moved out of the title into the edition field.
@book{gerald89:ana,
  author    = {Curtis F. Gerald and Patrick O. Wheatley},
  title     = {Applied Numerical Analysis},
  edition   = {Fourth},
  publisher = {Addison-Wesley},
  year      = {1989},
}

% Whole-value bracing removed from title and journal so the bibliography
% style can apply its own casing, consistent with the other entries.
@article{press89:qrn,
  author  = {William H. Press and Saul A. Teukolsky},
  title   = {Quasi- (that is, Sub-) Random Numbers},
  journal = {Computers in Physics},
  volume  = {3},
  number  = {6},
  pages   = {76--79},
  year    = {1989},
}

% NOTE(review): publisher changed from Morgan Kaufmann to MIT Press, which
% published the NIPS proceedings from volume 7 onwards - confirm.
@inproceedings{kearns96:aboteocv,
  author    = {Michael J. Kearns},
  title     = {A bound on the error of {Cross Validation} using the approximation and estimation rates, with consequences for the training-test split},
  booktitle = {Advances in Neural Information Processing Systems 8},
  publisher = {MIT Press},
  pages     = {183--189},
  year      = {1996},
}

@inproceedings{kearns95:aeatcomsm,
  author    = {Michael J. Kearns and Yishay Mansour and Andrew Y. Ng and Dana Ron},
  title     = {An experimental and theoretical comparison of model selection methods},
  booktitle = {{Proceedings of the Eighth ACM Conference on Computational Learning Theory}},
  publisher = {{ACM Press}},
  pages     = {21--30},
  year      = {1995},
}

