Skip to content

Commit

Permalink
Polishing
Browse files Browse the repository at this point in the history
  • Loading branch information
jfouret committed Oct 25, 2023
1 parent 4c8dcd9 commit 8cc67d2
Show file tree
Hide file tree
Showing 10 changed files with 487 additions and 148 deletions.
106 changes: 91 additions & 15 deletions biblio.bib
Original file line number Diff line number Diff line change
Expand Up @@ -10,22 +10,23 @@ @article{Turing1950
issn = {0026-4423},
doi = {10.1093/mind/LIX.236.433},
url = {https://doi.org/10.1093/mind/LIX.236.433},
eprint = {https://academic.oup.com/mind/article-pdf/LIX/236/433/30123314/lix-236-433.pdf},
}
@article{neyman1933,
title={On the problem of the most efficient tests of statistical hypotheses},
author={Neyman, J. and Pearson, E. S.},
journal={Philosophical Transactions of the Royal Society of London. Series A},
title={On the Problem of the Most Efficient Tests of Statistical Hypotheses},
author={Jerzy Neyman and Egon Sharpe Pearson},
journal={Philosophical Transactions of the Royal Society A},
year={1933},
volume={231},
pages={289-337},
year={1933}
url={https://api.semanticscholar.org/CorpusID:85550403}
}
@misc{
jannai2023,
title={Human or Not? A Gamified Approach to the Turing Test},
author = {Jannai, Daniel and Meron, Amos and Lenz, Barak and Levine, Yoav and Shoham, Yoav}, year={2023},
eprint={2305.20010},
archivePrefix={arXiv}
@misc{jannai2023,
title={Human or Not? A Gamified Approach to the Turing Test},
author={Daniel Jannai and Amos Meron and Barak Lenz and Yoav Levine and Yoav Shoham},
journal={ArXiv},
year={2023},
volume={abs/2305.20010},
url={https://api.semanticscholar.org/CorpusID:258987666}
}
@misc{
dartmouth1955,
Expand All @@ -34,11 +35,86 @@ @misc{
url = {https://raysolomonoff.com/dartmouth/boxa/dart564props.pdf},
}
@article{student1908,
title={The probable error of a mean},
author={Student (pseudonym for W.S. Gosset)},
title={THE PROBABLE ERROR OF A MEAN},
author={Student},
journal={Biometrika},
year={1908},
volume={6},
number={1},
pages={1-25},
year={1908}
url={https://api.semanticscholar.org/CorpusID:263778821}
}
@article{Clark2018ThinkYH,
title={Think you have Solved Question Answering? Try ARC, the AI2 Reasoning Challenge},
author={Peter Clark and Isaac Cowhey and Oren Etzioni and Tushar Khot and Ashish Sabharwal and Carissa Schoenick and Oyvind Tafjord},
journal={ArXiv},
year={2018},
volume={abs/1803.05457},
url={https://api.semanticscholar.org/CorpusID:3922816}
}
@misc{zellers2019hellaswag,
title={HellaSwag: Can a Machine Really Finish Your Sentence?},
author={Rowan Zellers and Ari Holtzman and Yonatan Bisk and Ali Farhadi and Yejin Choi},
booktitle={Annual Meeting of the Association for Computational Linguistics},
year={2019},
url={https://api.semanticscholar.org/CorpusID:159041722}
}
@misc{hendrycks2021measuring,
title={Measuring Massive Multitask Language Understanding},
author={Dan Hendrycks and Collin Burns and Steven Basart and Andy Zou and Mantas Mazeika and Dawn Xiaodong Song and Jacob Steinhardt},
journal={ArXiv},
year={2020},
volume={abs/2009.03300},
url={https://api.semanticscholar.org/CorpusID:221516475}
}
@misc{lin2022truthfulqa,
title={TruthfulQA: Measuring How Models Mimic Human Falsehoods},
author={Stephanie C. Lin and Jacob Hilton and Owain Evans},
booktitle={Annual Meeting of the Association for Computational Linguistics},
year={2021},
url={https://api.semanticscholar.org/CorpusID:237532606}
}
@book{McElreath2020,
author = {McElreath, Richard},
title = {Statistical Rethinking, A Bayesian Course with example in R and STAN},
year = 2020,
publisher = "CRC Press",
address = "New York",
url={https://xcelab.net/rm/statistical-rethinking/}
}
@article{Rosenbrock1960AnAM,
title={An Automatic Method for Finding the Greatest or Least Value of a Function},
author={Howard Rosenbrock},
journal={Comput. J.},
year={1960},
volume={3},
pages={175-184},
url={https://api.semanticscholar.org/CorpusID:62755334}
}
@article{Nelder1965ASM,
title={A Simplex Method for Function Minimization},
author={John A. Nelder and Roger Mead},
journal={Comput. J.},
year={1965},
volume={7},
pages={308-313},
url={https://api.semanticscholar.org/CorpusID:2208295}
}
@article{Broyden1967QuasiNewtonMA,
title={Quasi-Newton methods and their application to function minimisation},
author={C. G. Broyden},
journal={Mathematics of Computation},
year={1967},
volume={21},
pages={368-381},
url={https://api.semanticscholar.org/CorpusID:10793035}
}
@article{Kiefer1952StochasticEO,
title={Stochastic Estimation of the Maximum of a Regression Function},
author={J. Kiefer and Jacob Wolfowitz},
journal={Annals of Mathematical Statistics},
year={1952},
volume={23},
pages={462-466},
url={https://api.semanticscholar.org/CorpusID:122078986}
}
Binary file added docs/img/statistical_rethinking.jpg
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
109 changes: 63 additions & 46 deletions docs/part0.html
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
<link href="site_libs/quarto-html/quarto-syntax-highlighting.css" rel="stylesheet" id="quarto-text-highlighting-styles"><meta charset="utf-8">
<meta name="generator" content="quarto-1.3.450">

<meta name="author" content="Julien Fouret">
<title>ML Techniques - Machine Learning Techniques - 0</title>
<meta name="apple-mobile-web-app-capable" content="yes">
<meta name="apple-mobile-web-app-status-bar-style" content="black-translucent">
Expand Down Expand Up @@ -349,6 +350,14 @@ <h1 class="title">Machine Learning Techniques - 0</h1>
<p class="subtitle">Introduction to Artificial Intelligence and Machine Learning</p>

<div class="quarto-title-authors">
<div class="quarto-title-author">
<div class="quarto-title-author-name">
Julien Fouret
</div>
<div class="quarto-title-author-email">
<a href="mailto:[email protected]">[email protected]</a>
</div>
</div>
</div>

</section>
Expand All @@ -362,9 +371,8 @@ <h2>Table of Contents</h2>
<h1>What is Artificial Intelligence ?</h1>

</section>
<section id="can-machines-think" class="slide level2 center">
<h2>Can Machines Think ?</h2>
<p><span class="citation" data-cites="Turing1950">Turing (<a href="#/references" role="doc-biblioref" onclick="">1950</a>)</span></p>
<section id="can-machines-think-turing1950" class="slide level2 center">
<h2>Can Machines Think ?<span class="citation" data-cites="Turing1950"><sup><a href="#/references" role="doc-biblioref" onclick="">1</a></sup></span></h2>
<ul>
<li>Defining a machine</li>
<li>Understanding “thinking”</li>
Expand Down Expand Up @@ -407,7 +415,7 @@ <h2>What if A is a machine ?</h2>
</section>
<section id="a-modern-experiment-the-imitation-game-revisited" class="slide level2 center">
<h2>A Modern Experiment: The Imitation Game Revisited</h2>
<p><em>Human or Not? A Gamified Approach to the Turing Test</em> <span class="citation" data-cites="jannai2023">Jannai et al. (<a href="#/references" role="doc-biblioref" onclick="">2023</a>)</span></p>
<p><strong>Human or Not? A Gamified Approach to the Turing Test</strong><span class="citation" data-cites="jannai2023"><sup><a href="#/references" role="doc-biblioref" onclick="">2</a></sup></span></p>
<p><strong>Online 2-player game:</strong></p>
<ul>
<li>One player asks questions and must guess <strong>“Human”</strong> or <strong>“Bot”</strong></li>
Expand Down Expand Up @@ -446,9 +454,8 @@ <h2>Beyond The Turing test</h2>
</div>
</div>
</section>
<section id="pionneered-definitions-of-ai" class="slide level2 center">
<h2>Pionneered Definitions of AI</h2>
<p><span style="font-size: 75%;"> <span class="citation" data-cites="dartmouth1955">McCarthy et al. (<a href="#/references" role="doc-biblioref" onclick="">1955</a>)</span> </span></p>
<section id="pionneered-definitions-of-ai-dartmouth1955" class="slide level2 center">
<h2>Pionneered Definitions of AI<span class="citation" data-cites="dartmouth1955"><sup><a href="#/references" role="doc-biblioref" onclick="">3</a></sup></span></h2>
<p><img src="img/dartmouth_title.PNG" alt="" style="border: 2px solid black; display: block; margin: auto;"></p>
<p><img src="img/dartmouth_def.PNG" alt="" style="border: 2px solid black; display: block; margin: auto;"></p>
<div style="font-size: 70%;">
Expand Down Expand Up @@ -560,10 +567,10 @@ <h2>Measuring Artificial General intelligence</h2>
<ul>
<li><strong>General Tests</strong>:
<ul>
<li>AI2 Reasoning Challenge</li>
<li>HellaSwag</li>
<li>MMLU</li>
<li>TruthfulQA</li>
<li>AI2 Reasoning Challenge<span class="citation" data-cites="Clark2018ThinkYH"><sup><a href="#/references" role="doc-biblioref" onclick="">4</a></sup></span></li>
<li>HellaSwag<span class="citation" data-cites="zellers2019hellaswag"><sup><a href="#/references" role="doc-biblioref" onclick="">5</a></sup></span></li>
<li>MMLU<span class="citation" data-cites="hendrycks2021measuring"><sup><a href="#/references" role="doc-biblioref" onclick="">6</a></sup></span></li>
<li>TruthfulQA<span class="citation" data-cites="lin2022truthfulqa"><sup><a href="#/references" role="doc-biblioref" onclick="">7</a></sup></span></li>
</ul></li>
<li><strong>Field-specific Exams</strong>:
<ul>
Expand Down Expand Up @@ -651,33 +658,29 @@ <h2>Planning</h2>
<span>25/10 PM</span>
</p>
<ul>
<li><span class="text-box">Part 0</span> Introduction : – <em>1h30</em></li>
<li><span class="text-box">Part 1</span> Reminders and Foundations<em>1h30</em>
<li><span class="text-box">Part 0</span> <strong>Introduction to Artificial Intelligence and Machine Learning</strong> : – <em>1h30</em></li>
<li><span class="text-box">Part 1</span> <strong>Mathematical foundations to Modelling and ML</strong><em>2h30</em>
<ul>
<li>Theory of probability – <em>30min</em></li>
<li>Statistical modelling – <em>15min</em></li>
<li>Theory of probability – <em>45min</em></li>
<li>Statistical modelling – <em>30min</em></li>
<li>Model inference – <em>45min</em></li>
<li>Important definitions – <em>30min</em></li>
</ul></li>
<li><span class="text-box">TP 0</span><em>1h</em>
<ul>
<li>Fitting probability law</li>
<li>Model selection / Fixed effect (type of errors)</li>
</ul></li>
</ul>
<p class="separator">
<span>26/10 AM</span>
</p>
<ul>
<li><span class="text-box">TP 1</span><em>2h</em>
<li><span class="text-box">TP 1</span> <strong>Predict medical insurance costs</strong> <em>4h</em>
<ul>
<li>Data transformation / PCA</li>
<li>Proof: Cross-entropy from likelihood</li>
</ul></li>
<li><span class="text-box">Part 2</span> Base of Machine Learning 1/2 – <em>2h</em>
<ul>
<li>A: Typology and nomenclatures – <em>1h</em></li>
<li>B: Evaluation metrics – <em>1h</em></li>
<li>Import dataset – <em>30 min</em></li>
<li>Simple Linear Model – <em>30 min</em></li>
<li>New feature and interactions – <em>20 min</em></li>
<li>statmodels package – <em>20 min</em></li>
<li>In-sample and Out-sample errors – <em>30 min</em></li>
<li>Scikit-learn pipeline – <em>1h</em></li>
<li>Anomaly detection – <em>30 min</em></li>
<li>Conclusion/Discussion – <em>20 min</em></li>
</ul></li>
</ul>
</div>
Expand All @@ -687,52 +690,66 @@ <h2>Planning</h2>
<span>08/11 PM</span>
</p>
<ul>
<li><span class="text-box">TP 1</span><em>1h30</em>
<ul>
<li>Linear regression with few data</li>
<li>Linear (logistic) regression with multiple features</li>
<li>Bias-Variance decomposition of Loss</li>
</ul></li>
<li><span class="text-box">Part 2</span> Base of Machine Learning 1/2 – <em>30min</em>
<li><span class="text-box">Part 2</span> Base of Machine Learning 1/2 – <em>2h</em>
<ul>
<li>A: Typology and nomenclatures – <em>30min</em></li>
<li>B: Evaluation metrics – <em>1h</em></li>
<li>C: Bottlenecks and Issues – <em>30min</em></li>
</ul></li>
<li><span class="text-box">Part 3</span> Advanced Machine Learning –<em>2h</em>
<ul>
<li>A: Feature engineering – <em>1h</em></li>
<li>B: Model engineering 1/2<em>1h</em></li>
<li>B: Model engineering 1 – <em>1h</em></li>
</ul></li>
</ul>
<p class="separator">
<span>09/11 AM</span>
</p>
<ul>
<li><span class="text-box">Part 3</span> Advanced Machine Learning –<em>2h</em>
<ul>
<li>B: Model engineering 2/2 – <em>1h30</em></li>
</ul></li>
<li><span class="text-box">TP 3</span><em>2h30</em></li>
<li><span class="text-box">TP 3</span><em>4h</em></li>
</ul>
</div>
</div>
</div>
</div>
</section>
<section id="acknowledgement" class="slide level2 center">
<h2>Acknowledgement</h2>
<p><em>For fruitful discussions and corrections.</em></p>
<ul>
<li>Felix Geoffroy</li>
<li>Thomas Chaverondier</li>
<li>Grégory Morel</li>
<li>John Samuel</li>
</ul>
</section>
<section id="references" class="slide level2 smaller scrollable">
<h2>References</h2>

<div class="footer footer-default">

</div>
<div id="refs" class="references csl-bib-body hanging-indent" role="list">
<div id="refs" class="references csl-bib-body" data-line-spacing="2" role="list">
<div id="ref-Turing1950" class="csl-entry" role="listitem">
<div class="csl-left-margin">1. </div><div class="csl-right-inline">Turing, A. M. <a href="https://doi.org/10.1093/mind/LIX.236.433"><span>I.—COMPUTING MACHINERY AND INTELLIGENCE</span></a>. <em>Mind</em> <strong>LIX</strong>, 433–460 (1950).</div>
</div>
<div id="ref-jannai2023" class="csl-entry" role="listitem">
Jannai, Daniel, Amos Meron, Barak Lenz, Yoav Levine, and Yoav Shoham. 2023. <span>Human or Not? A Gamified Approach to the Turing Test.”</span> <a href="https://arxiv.org/abs/2305.20010">https://arxiv.org/abs/2305.20010</a>.
<div class="csl-left-margin">2. </div><div class="csl-right-inline">Jannai, D., Meron, A., Lenz, B., Levine, Y. &amp; Shoham, Y. <a href="https://api.semanticscholar.org/CorpusID:258987666">Human or not? A gamified approach to the turing test</a>. <em>ArXiv</em> vol. abs/2305.20010 (2023).</div>
</div>
<div id="ref-dartmouth1955" class="csl-entry" role="listitem">
McCarthy, J., M. Minsky, N. Rochester, and C. E. Shannon. 1955. <span>“A Proposal for the Dartmouth Summer Research Project on Artificial Intelligence.”</span> <a href="https://raysolomonoff.com/dartmouth/boxa/dart564props.pdf">https://raysolomonoff.com/dartmouth/boxa/dart564props.pdf</a>.
<div class="csl-left-margin">3. </div><div class="csl-right-inline">McCarthy, J., Minsky, M., Rochester, N. &amp; Shannon, C. E. <a href="https://raysolomonoff.com/dartmouth/boxa/dart564props.pdf">A proposal for the dartmouth summer research project on artificial intelligence</a>. (1955).</div>
</div>
<div id="ref-Turing1950" class="csl-entry" role="listitem">
Turing, A. M. 1950. <span><span>I.—COMPUTING MACHINERY AND INTELLIGENCE</span>.”</span> <em>Mind</em> LIX (236): 433–60. <a href="https://doi.org/10.1093/mind/LIX.236.433">https://doi.org/10.1093/mind/LIX.236.433</a>.
<div id="ref-Clark2018ThinkYH" class="csl-entry" role="listitem">
<div class="csl-left-margin">4. </div><div class="csl-right-inline">Clark, P. <em>et al.</em> <a href="https://api.semanticscholar.org/CorpusID:3922816">Think you have solved question answering? Try ARC, the AI2 reasoning challenge</a>. <em>ArXiv</em> <strong>abs/1803.05457</strong>, (2018).</div>
</div>
<div id="ref-zellers2019hellaswag" class="csl-entry" role="listitem">
<div class="csl-left-margin">5. </div><div class="csl-right-inline">Zellers, R., Holtzman, A., Bisk, Y., Farhadi, A. &amp; Choi, Y. <a href="https://api.semanticscholar.org/CorpusID:159041722">HellaSwag: Can a machine really finish your sentence?</a> (2019).</div>
</div>
<div id="ref-hendrycks2021measuring" class="csl-entry" role="listitem">
<div class="csl-left-margin">6. </div><div class="csl-right-inline">Hendrycks, D. <em>et al.</em> <a href="https://api.semanticscholar.org/CorpusID:221516475">Measuring massive multitask language understanding</a>. <em>ArXiv</em> vol. abs/2009.03300 (2020).</div>
</div>
<div id="ref-lin2022truthfulqa" class="csl-entry" role="listitem">
<div class="csl-left-margin">7. </div><div class="csl-right-inline">Lin, S. C., Hilton, J. &amp; Evans, O. <a href="https://api.semanticscholar.org/CorpusID:237532606">TruthfulQA: Measuring how models mimic human falsehoods</a>. (2021).</div>
</div>
</div>
</section></section>
Expand Down
Loading

0 comments on commit 8cc67d2

Please sign in to comment.