chapitre4.bib

@article{10.2307/2289471,
  author    = {Self, Steven G. and Liang, Kung-Yee},
  title     = {Asymptotic Properties of Maximum Likelihood Estimators and Likelihood Ratio Tests Under Nonstandard Conditions},
  journal   = {Journal of the American Statistical Association},
  volume    = {82},
  number    = {398},
  pages     = {605--610},
  year      = {1987},
  publisher = {[American Statistical Association, Taylor \& Francis, Ltd.]},
  issn      = {01621459},
  url       = {http://www.jstor.org/stable/2289471},
  abstract  = {Large sample properties of the likelihood function when the true parameter value may be on the boundary of the parameter space are described. Specifically, the asymptotic distribution of maximum likelihood estimators and likelihood ratio statistics are derived. These results generalize the work of Moran (1971), Chant (1974), and Chernoff (1954). Some of Chant's results are shown to be incorrect. The approach used in deriving these results follows from comments made by Moran and Chant. The problem is shown to be asymptotically equivalent to the problem of estimating the restricted mean of a multivariate Gaussian distribution from a sample of size 1. In this representation the Gaussian random variable corresponds to the limit of the normalized score statistic and the estimate of the mean corresponds to the limit of the normalized maximum likelihood estimator. Thus the limiting distribution of the maximum likelihood estimator is the same as the distribution of the projection of the Gaussian random variable onto the region of admissible values for the mean. A variety of examples is provided for which the limiting distributions of likelihood ratio statistics are mixtures of chi-squared distributions. One example is provided with a nuisance parameter on the boundary for which the asymptotic distribution is not a mixture of chi-squared distributions.}
}
@mastersthesis{projet_recherche,
  author = {Ehrhardt, Adrien},
  title  = {Projet recherche : optimisation non-lin{\'e}aire - application {\`a} la cr{\'e}ation d'indices boursiers},
  school = {{\'E}cole Centrale de Lille},
  year   = {2014}
}
@inproceedings{vincent_disc,
  author    = {Vandewalle, Vincent},
  title     = {How to Take into Account the Discrete Parameters in the {BIC} Criterion?},
  booktitle = {COMPStat},
  year      = {2010}
}
@inproceedings{ho1998efficient,
  author       = {Ho, KM and Scott, Paul D},
  title        = {An efficient global discretization method},
  booktitle    = {Pacific-Asia Conference on Knowledge Discovery and Data Mining},
  organization = {Springer},
  year         = {1998},
  pages        = {383--384},
}
@inproceedings{ho1997zeta,
  author    = {Ho, KM and Scott, PD},
  title     = {Zeta: a global method for discretization of continuous variables},
  booktitle = {Proceedings of the 3rd International Conference on Knowledge Discovery and Data Mining},
  pages     = {191--194},
  year      = {1997}
}
@article{liu2002discretization,
  author    = {Liu, Huan and Hussain, Farhad and Tan, Chew Lim and Dash, Manoranjan},
  title     = {Discretization: An enabling technique},
  journal   = {Data mining and knowledge discovery},
  publisher = {Springer},
  year      = {2002},
  volume    = {6},
  number    = {4},
  pages     = {393--423},
}
@incollection{dougherty1995supervised,
  author    = {Dougherty, James and Kohavi, Ron and Sahami, Mehran},
  title     = {Supervised and unsupervised discretization of continuous features},
  booktitle = {Machine Learning Proceedings 1995},
  publisher = {Elsevier},
  year      = {1995},
  pages     = {194--202},
}
@article{sun2014fast,
  author    = {Sun, Xu and Xu, Weichao},
  title     = {Fast Implementation of {DeLong's} Algorithm for Comparing the Areas Under Correlated Receiver Operating Characteristic Curves},
  journal   = {IEEE Signal Processing Letters},
  volume    = {21},
  number    = {11},
  pages     = {1389--1393},
  year      = {2014},
  publisher = {IEEE}
}
@article{anand1993improved,
  author    = {Anand, Rangachari and Mehrotra, Kishan G and Mohan, Chilukuri K and Ranka, Sanjay},
  title     = {An improved algorithm for neural network classification of imbalanced training sets},
  journal   = {IEEE Transactions on Neural Networks},
  publisher = {IEEE},
  year      = {1993},
  volume    = {4},
  number    = {6},
  pages     = {962--969},
}
@incollection{bottou2010large,
  author    = {Bottou, L{\'e}on},
  title     = {Large-scale machine learning with stochastic gradient descent},
  booktitle = {Proceedings of COMPSTAT'2010},
  publisher = {Springer},
  year      = {2010},
  pages     = {177--186},
}
@article{reverdy2016parameter,
  author    = {Reverdy, Paul and Leonard, Naomi Ehrich},
  title     = {Parameter estimation in softmax decision-making models with linear objective functions},
  journal   = {IEEE Transactions on Automation Science and Engineering},
  publisher = {IEEE},
  year      = {2016},
  volume    = {13},
  number    = {1},
  pages     = {54--67},
}
@article{same2011model,
  author    = {Sam{\'e}, Allou and Chamroukhi, Faicel and Govaert, G{\'e}rard and Aknin, Patrice},
  title     = {Model-based clustering and segmentation of time series with changes in regime},
  journal   = {Advances in Data Analysis and Classification},
  publisher = {Springer},
  year      = {2011},
  volume    = {5},
  number    = {4},
  pages     = {301--321},
}
@inproceedings{chamroukhi2009regression,
  author       = {Chamroukhi, Faicel and Sam{\'e}, Allou and Govaert, G{\'e}rard and Aknin, Patrice},
  title        = {A regression model with a hidden logistic process for feature extraction from time series},
  booktitle    = {Neural Networks, 2009. IJCNN 2009. International Joint Conference on},
  organization = {IEEE},
  year         = {2009},
  pages        = {489--496},
}
@book{o2006logistic,
  author    = {O'Connell, Ann A},
  title     = {Logistic regression models for ordinal response variables},
  series    = {Quantitative Applications in the Social Sciences},
  number    = {146},
  publisher = {Sage},
  year      = {2006}
}
@book{villani2018donner,
  author    = {Villani, C{\'e}dric and Bonnet, Yann and Berthet, Charly and Levin, Fran{\c{c}}ois and Schoenauer, Marc and Cornut, Anne-Charlotte and Rondepierre, Bertrand},
  title     = {Donner un sens {\`a} l'intelligence artificielle: pour une strat{\'e}gie nationale et europ{\'e}enne},
  publisher = {Conseil national du num{\'e}rique},
  year      = {2018},
}
@techreport{celeux_sem,
  author      = {Celeux, Gilles and Chauveau, Didier and Diebolt, Jean},
  title       = {On Stochastic Versions of the {EM} Algorithm},
  type        = {Research Report},
  number      = {RR-2514},
  institution = {{INRIA}},
  year        = {1995},
  url         = {https://hal.inria.fr/inria-00074164},
  keywords    = {MONTE-CARLO EXPERIMENTS ; MIXTURE OF DISTRIBUTION ; INCOMPLETE DATA MODELS ; STOCHASTIC ALGORITHMS},
  pdf         = {https://hal.inria.fr/inria-00074164/file/RR-2514.pdf},
  hal_id      = {inria-00074164},
  hal_version = {v1}
}
@article{casella1992explaining,
  author    = {Casella, George and George, Edward I},
  title     = {Explaining the {Gibbs} sampler},
  journal   = {The American Statistician},
  volume    = {46},
  number    = {3},
  pages     = {167--174},
  year      = {1992},
  publisher = {Taylor \& Francis}
}
@article{green1995reversible,
  author    = {Green, Peter J},
  title     = {Reversible jump {Markov} chain {Monte Carlo} computation and {Bayesian} model determination},
  journal   = {Biometrika},
  volume    = {82},
  number    = {4},
  pages     = {711--732},
  year      = {1995},
  publisher = {Oxford University Press}
}
@article{shaffer1995multiple,
  author    = {Shaffer, Juliet Popper},
  title     = {Multiple hypothesis testing},
  journal   = {Annual Review of Psychology},
  volume    = {46},
  number    = {1},
  pages     = {561--584},
  year      = {1995},
  publisher = {Annual Reviews},
  address   = {Palo Alto, CA, USA}
}
@article{chen2008extended,
  author    = {Chen, Jiahua and Chen, Zehua},
  title     = {Extended {Bayesian} information criteria for model selection with large model spaces},
  journal   = {Biometrika},
  volume    = {95},
  number    = {3},
  pages     = {759--771},
  year      = {2008},
  publisher = {Oxford University Press}
}
@article{tay2002modified,
  author    = {Tay, Francis EH and Shen, Lixiang},
  title     = {A modified {Chi2} algorithm for discretization},
  journal   = {IEEE Transactions on Knowledge and Data Engineering},
  volume    = {14},
  number    = {3},
  pages     = {666--670},
  year      = {2002},
  publisher = {IEEE}
}
@article{su2005extended,
  author    = {Su, Chao-Ton and Hsu, Jyh-Hwa},
  title     = {An extended {Chi2} algorithm for discretization of real value attributes},
  journal   = {IEEE Transactions on Knowledge and Data Engineering},
  volume    = {17},
  number    = {3},
  pages     = {437--441},
  year      = {2005},
  publisher = {IEEE}
}
@inproceedings{wang1998concurrent,
  author       = {Wang, Ke and Liu, Bing},
  title        = {Concurrent discretization of multiple attributes},
  booktitle    = {Pacific Rim International Conference on Artificial Intelligence},
  organization = {Springer},
  year         = {1998},
  pages        = {250--259},
}
@inproceedings{liu1995chi2,
  author       = {Liu, Huan and Setiono, Rudy},
  title        = {{Chi2}: Feature selection and discretization of numeric attributes},
  booktitle    = {Proceedings of the Seventh International Conference on Tools with Artificial Intelligence},
  pages        = {388--391},
  year         = {1995},
  organization = {IEEE}
}
@inproceedings{kerber1992chimerge,
  author       = {Kerber, Randy},
  title        = {{ChiMerge}: Discretization of numeric attributes},
  booktitle    = {Proceedings of the Tenth National Conference on Artificial Intelligence},
  pages        = {123--128},
  year         = {1992},
  organization = {AAAI Press}
}
% The family name is Dua (as the citation key indicates) and the given name is Dheeru.
@misc{Dua:2017,
  author      = {Dua, Dheeru and Karra Taniskidou, Efi},
  title       = {{UCI} Machine Learning Repository},
  year        = {2017},
  url         = {http://archive.ics.uci.edu/ml},
  institution = {University of California, Irvine, School of Information and Computer Sciences}
}
@article{kass1980exploratory,
  author    = {Kass, Gordon V},
  title     = {An exploratory technique for investigating large quantities of categorical data},
  journal   = {Applied Statistics},
  volume    = {29},
  number    = {2},
  pages     = {119--127},
  year      = {1980},
  publisher = {JSTOR}
}
@inproceedings{fayyad1993multi,
  author    = {Fayyad, Usama and Irani, Keki},
  title     = {Multi-interval discretization of continuous-valued attributes for classification learning},
  booktitle = {13th International Joint Conference on Artificial Intelligence},
  pages     = {1022--1029},
  year      = {1993}
}
@inproceedings{tsang2018detecting,
  author    = {Tsang, Michael and Cheng, Dehua and Liu, Yan},
  title     = {Detecting Statistical Interactions from Neural Network Weights},
  booktitle = {International Conference on Learning Representations},
  url       = {https://openreview.net/forum?id=ByOfBggRZ},
  year      = {2018},
}
@inproceedings{hahnloser2001permitted,
  author    = {Hahnloser, Richard HR and Seung, H Sebastian},
  title     = {Permitted and forbidden sets in symmetric threshold-linear networks},
  booktitle = {Advances in Neural Information Processing Systems},
  year      = {2001},
  pages     = {217--223},
}
@misc{chollet2015keras,
  author       = {Chollet, Fran{\c{c}}ois and others},
  title        = {Keras},
  year         = {2015},
  howpublished = {\url{https://keras.io}}
}
@misc{tensorflow2015-whitepaper,
  title = {{TensorFlow}: Large-Scale Machine Learning on Heterogeneous Systems},
  url = {https://www.tensorflow.org/},
  note = {Software available from tensorflow.org},
  author = {
    Mart{\'\i}n~Abadi and
    Ashish~Agarwal and
    Paul~Barham and
    Eugene~Brevdo and
    Zhifeng~Chen and
    Craig~Citro and
    Greg~S.~Corrado and
    Andy~Davis and
    Jeffrey~Dean and
    Matthieu~Devin and
    Sanjay~Ghemawat and
    Ian~Goodfellow and
    Andrew~Harp and
    Geoffrey~Irving and
    Michael~Isard and
    Yangqing Jia and
    Rafal~Jozefowicz and
    Lukasz~Kaiser and
    Manjunath~Kudlur and
    Josh~Levenberg and
    Dandelion~Man{\'e} and
    Rajat~Monga and
    Sherry~Moore and
    Derek~Murray and
    Chris~Olah and
    Mike~Schuster and
    Jonathon~Shlens and
    Benoit~Steiner and
    Ilya~Sutskever and
    Kunal~Talwar and
    Paul~Tucker and
    Vincent~Vanhoucke and
    Vijay~Vasudevan and
    Fernanda~Vi{\'e}gas and
    Oriol~Vinyals and
    Pete~Warden and
    Martin~Wattenberg and
    Martin~Wicke and
    Yuan~Yu and
    Xiaoqiang~Zheng},
  year = {2015}
}
@article{zeng2014necessary,
  author  = {Zeng, Guoping},
  title   = {A necessary condition for a good binning algorithm in credit scoring},
  journal = {Applied Mathematical Sciences},
  year    = {2014},
  volume  = {8},
  number  = {65},
  pages   = {3229--3242},
}
% Same INRIA research report as the celeux_sem entry; kept under this key for existing citations.
@techreport{celeux1995stochastic,
  author      = {Celeux, Gilles and Chauveau, Didier and Diebolt, Jean},
  title       = {On stochastic versions of the {EM} algorithm},
  type        = {Research Report},
  number      = {RR-2514},
  institution = {INRIA},
  year        = {1995}
}
@article{2013arXiv1305.2982B,
  author        = {Bengio, Yoshua},
  title         = {Estimating or Propagating Gradients Through Stochastic Neurons},
  journal       = {ArXiv e-prints},
  archiveprefix = {arXiv},
  eprint        = {1305.2982},
  keywords      = {Computer Science - Machine Learning},
  year          = 2013,
  month         = may,
  adsurl        = {http://adsabs.harvard.edu/abs/2013arXiv1305.2982B},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
% This work is a monograph, not a journal paper, so it is typed as a book.
@book{massart2007concentration,
  author    = {Massart, Pascal},
  title     = {Concentration inequalities and model selection},
  series    = {Lecture Notes in Mathematics},
  volume    = {1896},
  publisher = {Springer},
  year      = {2007}
}
@book{temme2015asymptotic,
  author    = {Temme, Nico M},
  title     = {Asymptotic methods for integrals},
  publisher = {World Scientific},
  year      = {2015},
}
@article{ramirez2016data,
  author    = {Ram{\'\i}rez-Gallego, Sergio and Garc{\'\i}a, Salvador and Mouri{\~n}o-Tal{\'\i}n, H{\'e}ctor and Mart{\'\i}nez-Rego, David and Bol{\'o}n-Canedo, Ver{\'o}nica and Alonso-Betanzos, Amparo and Ben{\'\i}tez, Jos{\'e} Manuel and Herrera, Francisco},
  title     = {Data discretization: taxonomy and big data challenge},
  journal   = {Wiley Interdisciplinary Reviews: Data Mining and Knowledge Discovery},
  publisher = {Wiley Online Library},
  year      = {2016},
  volume    = {6},
  number    = {1},
  pages     = {5--21},
}
@inproceedings{akaike1973information,
  author       = {Akaike, Hirotugu},
  title        = {Information theory and an extension of the maximum likelihood principle},
  booktitle    = {2nd International Symposium on Information Theory, 1973},
  organization = {Akademiai Kiado},
  year         = {1973},
  pages        = {267--281},
}
@article{maj2015delete,
  author    = {Maj-Ka{\'n}ska, Aleksandra and Pokarowski, Piotr and Prochenka, Agnieszka and others},
  title     = {Delete or merge regressors for linear model selection},
  journal   = {Electronic Journal of Statistics},
  publisher = {The Institute of Mathematical Statistics and the Bernoulli Society},
  year      = {2015},
  volume    = {9},
  number    = {2},
  pages     = {1749--1778},
}
@article{berry2010testing,
  author    = {Berry, William D and DeMeritt, Jacqueline HR and Esarey, Justin},
  title     = {Testing for interaction in binary logit and probit models: Is a product term essential?},
  journal   = {American Journal of Political Science},
  publisher = {Wiley Online Library},
  year      = {2010},
  volume    = {54},
  number    = {1},
  pages     = {248--266},
}
@article{yang2009discretization,
  author    = {Yang, Ying and Webb, Geoffrey I},
  title     = {Discretization for {naive-Bayes} learning: managing discretization bias and variance},
  journal   = {Machine learning},
  volume    = {74},
  number    = {1},
  pages     = {39--74},
  year      = {2009},
  publisher = {Springer}
}
@book{hosmer2013applied,
  author    = {Hosmer, Jr, David W and Lemeshow, Stanley and Sturdivant, Rodney X},
  title     = {Applied logistic regression},
  edition   = {Third},
  series    = {Wiley Series in Probability and Statistics},
  volume    = {398},
  publisher = {John Wiley \& Sons},
  year      = {2013}
}
@incollection{Bengio+chapter2007,
  title     = {Scaling Learning Algorithms Towards {AI}},
  author    = {Bengio, Yoshua and LeCun, Yann},
  year      = {2007},
  booktitle = {Large Scale Kernel Machines},
  publisher = {MIT Press},
}
@article{Hinton06,
  title   = {A Fast Learning Algorithm for Deep Belief Nets},
  author  = {Hinton, Geoffrey E. and Osindero, Simon and Teh, Yee Whye},
  year    = {2006},
  journal = {Neural Computation},
  volume  = {18},
  pages   = {1527--1554},
}

This file was generated by bibtex2html 1.96.