├── .DS_Store ├── .github └── workflows │ └── ExportPluto.yaml ├── README.md ├── hw1 ├── hints.md ├── hw1.html ├── hw1.jl └── hw1.jmd ├── hw2 ├── hints2.md ├── hw2_2023.jl ├── hw2_hint.pdf └── hw2_hint.tex ├── hw3 ├── 18_337_2023_pset3.pdf ├── parallelhistogram.jl └── patiencesort1.jl ├── hw4.pdf ├── hw4 └── hints.md ├── lecture 11 └── adjoint handwritten notes.pdf ├── lecture 12 ├── ..textClipping ├── .DS_Store ├── notebook.jl ├── reverse mode 2 (simeon).jl ├── reverse mode 3.jl ├── reverse mode 4.jl ├── reverse mode 4.jl.zip └── reverse mode 6.jl ├── lecture 14 └── adjoint equations.pdf ├── lecture 17 └── handwritten notes adjoint.pdf ├── lecture 22 ├── .DS_Store ├── HPEC-Handbook-Kepner.pdf ├── MathOfBigData-Chapter1.pdf └── Optimizing_Xeon_Phi_for_Interactive_Data_Analysis.pdf ├── lecture 24 ├── .DS_Store ├── .ipynb_checkpoints │ ├── Alan trying to understand MCMC-checkpoint.ipynb │ ├── Designing+Markov+chains-checkpoint.ipynb │ ├── Metropolis with linear algebra-checkpoint.ipynb │ └── MetropolisHastings-checkpoint.ipynb ├── Alan trying to understand MCMC.ipynb ├── Designing+Markov+chains.ipynb ├── Metropolis with linear algebra.ipynb └── MetropolisHastings.ipynb ├── lecture1 ├── AutoDiff.ipynb ├── Julia is fast.ipynb ├── fernbach 2019 power_of_language.pptx └── the_dream.ipynb ├── lecture10 ├── .DS_Store ├── prefix.pptx ├── star_and_more.pdf ├── trid.pdf └── ~$prefix.pptx ├── lecture11 └── .DS_Store ├── lecture13 └── handwritten_notes_vectors_adjoints.pdf ├── lecture2 ├── .DS_Store ├── The Julia HPC dream - Jupyter Notebook.pdf ├── allocations.jl ├── lecture2.jl ├── matrix_calculus_handwritten_notes_02_08_2023.pdf ├── optimizing.html └── optimizing.jmd ├── lecture20 └── adjointpde.pdf ├── lecture3 ├── allocation.jl └── lecture_3_handwritten_2023.pdf ├── lecture4 ├── lecture_4_handwritten_2023.pdf └── serial performance.jl ├── lecture5 ├── .DS_Store ├── 1071_230222012837_001.pdf ├── de_solver_software_comparsion.pdf ├── ode.jl ├── ode_simple.jl └── pinn.jl ├── lecture6 ├── .DS_Store ├── BACKpropagation.pdf ├── Backprop with Backslash.ipynb ├── backprop_poster.pdf ├── handwritten reverse mode.pdf ├── parallel_models.jl ├── pinn2.jl └── threads_demo.jl ├── lecture7 ├── .DS_Store ├── LorenzManyWays.jl ├── dynamics.jl ├── lecture7 handwritten notes.pdf ├── pinn.jl └── pinn2.jl ├── lecture8 ├── pi.jl └── threads.jl ├── lecture9 └── reduce_prefix.jl ├── old lecture 13 ├── .DS_Store ├── Reduce and Parallel Prefix.jl ├── firstcuda.jl └── prefix.ppt ├── old lecture10 ├── .DS_Store ├── helloworld ├── mpihelloworld.jl └── mpijl_demo │ ├── data │ ├── 1013.txt │ ├── 1059-0.txt │ ├── 159.txt │ ├── 23218-0.txt │ ├── 35.txt │ ├── 36.txt │ ├── 5230.txt │ ├── 524-0.txt │ ├── 775-0.txt │ ├── 780-0.txt │ ├── pg11696.txt │ ├── pg31547.txt │ └── pg7308.txt │ ├── helloworld.jl │ ├── mpihelloworld.jl │ ├── submit.sh │ ├── top5norm.jl │ ├── top5norm_collective.jl │ ├── top5norm_sendrecv.jl │ └── word_count_helpers.jl ├── old lecture11 ├── .DS_Store ├── .ipynb_checkpoints │ ├── intro-checkpoint.ipynb │ └── tracing-checkpoint.ipynb ├── Manifest.toml ├── Project.toml ├── intro.ipynb ├── lecture11.jl ├── tracing.ipynb └── utils.jl ├── old lecture9 ├── eigenvalue derivative.ipynb ├── gsvd derivative.ipynb ├── jacobian_example.jl ├── lecture9-1.jl ├── lecture9.jl └── svd derivative.ipynb ├── oldhw3 └── hints3.md └── threads.jl /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/.DS_Store 
-------------------------------------------------------------------------------- /.github/workflows/ExportPluto.yaml: -------------------------------------------------------------------------------- 1 | name: Export Pluto notebooks 2 | on: 3 | push: 4 | branches: 5 | - main 6 | - master 7 | workflow_dispatch: 8 | permissions: 9 | contents: write 10 | 11 | # When two jobs run in parallel, cancel the older ones, to make sure that the website is generated from the most recent commit. 12 | concurrency: 13 | group: pluto-export 14 | cancel-in-progress: true 15 | 16 | jobs: 17 | build-and-deploy: 18 | runs-on: ubuntu-latest 19 | steps: 20 | - name: Checkout this repository 21 | uses: actions/checkout@v3 22 | 23 | - name: Install Julia 24 | uses: julia-actions/setup-julia@v1 25 | with: 26 | version: "1" # This will automatically pick the latest Julia version 27 | 28 | - name: Cache Julia artifacts & such 29 | uses: julia-actions/cache@v1 30 | with: 31 | cache-registries: "true" 32 | 33 | # We set up a folder that Pluto can use to cache exported notebooks. If the notebook file did not change, then Pluto can take the exported file from cache instead of running the notebook. 34 | - name: Set up notebook state cache 35 | uses: actions/cache@v3 36 | with: 37 | path: pluto_state_cache 38 | key: ${{ runner.os }}-pluto_state_cache-v2-${{ hashFiles('**/Project.toml', '**/Manifest.toml', '.github/workflows/*' ) }}-${{ hashFiles('**/*jl') }} 39 | restore-keys: | 40 | ${{ runner.os }}-pluto_state_cache-v2-${{ hashFiles('**/Project.toml', '**/Manifest.toml', '.github/workflows/*' ) }} 41 | 42 | 43 | - name: Run & export Pluto notebooks 44 | run: | 45 | julia -e 'using Pkg 46 | Pkg.activate(mktempdir()) 47 | Pkg.add([ 48 | Pkg.PackageSpec(name="PlutoSliderServer", version="0.3.2-0.3"), 49 | ]) 50 | 51 | import PlutoSliderServer 52 | 53 | PlutoSliderServer.github_action("."; 54 | Export_cache_dir="pluto_state_cache", 55 | Export_baked_notebookfile=false, 56 | Export_baked_state=false, 57 | # more parameters can go here 58 | )' 59 | 60 | 61 | - name: Deploy to gh-pages 62 | uses: JamesIves/github-pages-deploy-action@releases/v4 63 | with: 64 | token: ${{ secrets.GITHUB_TOKEN }} 65 | branch: gh-pages 66 | folder: . 67 | single-commit: true 68 | 69 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # 18.337J/6.338J: Parallel Computing and Scientific Machine Learning (Spring 2023) 2 | ## Professor Alan Edelman (and Philip the Corgi) 3 | ## MW 3:00 to 4:30 @ Room 2-190 4 | ## TA and Office hours: (To be confirmed) 5 | ## [Piazza Link](https://piazza.com/mit/spring2023/18337) 6 | ## [Canvas](https://canvas.mit.edu/courses/18760) will only be used for homework and project (+proposal) submission + lecture videos 7 | 8 | ## Classes are recorded and will be uploaded on canvas. Another great resource is Chris Rackauckas' videos of 2021 spring class. See [SciMLBook](https://book.sciml.ai/). 
9 | 10 | 11 | ## Julia: 12 | 13 | * Really nice Julia tutorial for the fall 2022 class [Tutorial](https://mit-c25.netlify.app/notebooks/0_julia_tutorial) 14 | 15 | * [Julia cheatsheets](https://computationalthinking.mit.edu/Spring21/cheatsheets/) 16 | 17 | * Julia tutorial by Steven Johnson Wed Feb 8 18 | *Optional* Julia Tutorial: Wed Feb 8 @ 5pm [via Zoom](https://mit.zoom.us/j/96829722642?pwd=TDhhME0wbmx0SG5RcnFOS3VScTA5Zz09) 19 | 20 | * Virtually [via Zoom](https://mit.zoom.us/j/96829722642?pwd=TDhhME0wbmx0SG5RcnFOS3VScTA5Zz09). Recording will be posted. 21 | 22 | A basic overview of the Julia programming environment for numerical computations that we will use in 18.06 for simple computational exploration. This (Zoom-based) tutorial will cover what Julia is and the basics of interaction, scalar/vector/matrix arithmetic, and plotting — we'll be using it as just a "fancy calculator" and no "real programming" will be required. 23 | 24 | * [Tutorial materials](https://github.com/mitmath/julia-mit) (and links to other resources) 25 | 26 | If possible, try to install Julia on your laptop beforehand using the instructions at the above link. Failing that, you can run Julia in the cloud (see instructions above). 27 | 28 | 29 | ## Announcement: 30 | 31 | There will be homeworks, followed by the final project. 32 | Everyone needs to present their work and submit a project report. 33 | 34 | 1-page Final Project proposal due : March 24 35 | 36 | Final Project presentations : April 26 to May 15 37 | 38 | Final Project reports due: May 15 39 | 40 | # Grading: 41 | 50% problem sets, 10% for the final project proposal, and 40% for the final project. Problem sets and final projects will be submitted electronically. 42 | 43 | # HW 44 | |#| Notebook| 45 | |-|-| 46 | |1| [HW1](https://mitmath.github.io/18337/hw1/hw1.html) | 47 | (For matrix calculus problems, do not use indices) 48 | |2| [HW2](https://mitmath.github.io/18337/hw2/hw2_2023.html) Due Wednesday March 1, 2023 | 49 | |3| [HW3](https://github.com/mitmath/18337/blob/master/hw3/18_337_2023_pset3.pdf ) Due Wednesday March 15, 2023| 50 | |4| [HW4](https://github.com/mitmath/18337/blob/master/hw4.pdf) Due Wednesday April 19, 2023 | 51 | 52 | # Lecture Schedule (tentative) 53 | |#|Day| Date | Topic | [SciML](https://book.sciml.ai/) lecture | Materials | 54 | |-|-|------|------|-----|--| 55 | |1|M| 2/6 | Intro to Julia. My Two Favorite Notebooks. 
| | [[Julia is fast]](https://github.com/mitmath/18337/blob/master/lecture1/Julia%20is%20fast.ipynb), [[AutoDiff]](https://github.com/mitmath/18337/blob/master/lecture1/AutoDiff.ipynb), [[autodiff video]](https://www.youtube.com/watch?v=vAp6nUMrKYg), 56 | |2|W|2/8| Matrix Calculus I and The Parallel Dream| | See [[IAP 2023 Class on Matrix Calculus]](https://github.com/mitmath/matrixcalc),[[handwritten notes]](https://github.com/mitmath/18337/blob/master/lecture2/matrix_calculus_handwritten_notes_02_08_2023.pdf),[[The Parallel Dream]](https://github.com/mitmath/18337/blob/master/lecture1/the_dream.ipynb) 57 | |3|M|2/13| Matrix Calculus II || [[handwritten notes]](https://github.com/mitmath/18337/blob/master/lecture3/lecture_3_handwritten_2023.pdf),[[Corgi in the Washing Machine]](https://mit-c25.netlify.app/notebooks/1_hyperbolic_corgi),[[2x2 Matrix Jacobians]](https://rawcdn.githack.com/mitmath/matrixcalc/3f6758996e40c5c1070279f89f7f65e76e08003d/notes/2x2Jacobians.jl.html) 58 | |4|W|2/15| Serial Performance | [2][2] |[[handwritten notes]](https://github.com/mitmath/18337/blob/master/lecture4/lecture_4_handwritten_2023.pdf), [[Serial Performance .jl file]](https://github.com/mitmath/18337/blob/master/lecture4/serial%20performance.jl), [[Loop Fusion Blog ]](https://julialang.org/blog/2017/01/moredots/) 59 | |5|T|2/21| Intro to PINNs and Automatic differentiation I : Forward mode AD | [3][3] and [8][8] | [ode and Pinns](https://mit-18337-spring2023.netlify.app/lecture5/ode_simple.html),[intro to pinn handwritten notes](https://github.com/mitmath/18337/blob/master/lecture5/1071_230222012837_001.pdf),[autodiff handwritten notes](https://github.com/mitmath/JuliaComputation/blob/ec6861bc9396d2b577f1bbc8136683d4298d7dc8/slides/ad_handwritten.pdf) 60 | |6|W|2/22| Automatic differentiation II : Reverse mode AD |[10][10]| [pinn.jl](https://github.com/mitmath/18337/blob/master/lecture5/pinn.jl), [reverse mode ad demo](https://simeonschaub.github.io/ReverseModePluto/notebook.html),[handwritten notes](https://github.com/mitmath/18337/blob/master/lecture6/handwritten%20reverse%20mode.pdf)| 61 | |7|M|2/27 | Dynamical Systems & Serial Performance on Iterations | [4][4] | [Lorenz many ways](https://github.com/mitmath/18337/blob/master/lecture7/LorenzManyWays.jl), [Dynamical Systems](https://mitmath.github.io/18337/lecture7/dynamics.html), [handwriten notes](https://github.com/mitmath/18337/blob/master/lecture7/lecture7%20handwritten%20notes.pdf) | 62 | |8|W|3/1| HPC & Threading | [5][5] and [6][6] | [pi.jl](https://github.com/mitmath/18337/blob/master/lecture8/pi.jl), [threads.jl](https://github.com/mitmath/18337/blob/master/lecture8/threads.jl),[HPC Slides](https://docs.google.com/presentation/d/1i6w4p26r_9lu_reHYZDIVnzh-4SdERVAoSI5i42lBU8/edit#slide=id.p) | 63 | |9|M|3/6| Parallelism| | [Parallelism in Julia Slides](https://docs.google.com/presentation/d/1kBYvDedm_VGZEdjhSLXSCPLec6N7fLZswcYENqwiw3k/edit#slide=id.p),[reduce/prefix notebook](https://mitmath.github.io/18337/lecture9/reduce_prefix.html)| 64 | |10|W| 3/8| Prefix (and more) ||[ppt slides](https://github.com/mitmath/18337/blob/master/lecture10/prefix.pptx), [reduce/prefix notebook](https://mitmath.github.io/18337/lecture9/reduce_prefix.html),[ThreadedScans.jl](https://github.com/JuliaFolds/ThreadedScans.jl),[cuda blog](https://developer.nvidia.com/gpugems/gpugems3/part-vi-gpu-computing/chapter-39-parallel-prefix-sum-scan-cuda)| 65 | |11|M|3/13| Adjoint Method Example | [10][10] | [Handwritten 
Notes](https://github.com/mitmath/18337/blob/master/lecture%2011/adjoint%20handwritten%20notes.pdf)| 66 | |12|W|3/15| Guest Lecture - Chris Rackauckas | 67 | |13|M|3/21 | Vectors, Operators and Adjoints | | [Handwritten Notes](https://github.com/mitmath/18337/blob/master/lecture14/handwritten_notes_vectors_adjoints.pdf) | 68 | |14|W|3/23 | Adjoints of Linear, Nonlinear, Ode | [11][11] | [Handwritten Notes](https://github.com/mitmath/18337/blob/master/lecture%2014/adjoint%20equations.pdf), [18.335 adjoint notes (Johnson)](https://math.mit.edu/~stevenj/18.336/adjoint.pdf)| 69 | |Spring Break| 70 | |15|M|4/3| Guest Lecture, Billy Moses | | [Enzyme AD](https://enzyme.mit.edu/) | 71 | |16|W|4/5| Guest Lecture, Keaton Burns | | [Dedalus PDE Solver](https://dedalus-project.org/) | 72 | |17|M|4/10| Adjoints of ODE | | [Handwritten Notes](https://github.com/mitmath/18337/blob/master/lecture%2017/handwritten%20notes%20adjoint.pdf) | 73 | |18|W|4/12| Partitioning | | | 74 | | |M|4/17| Patriots' Day 75 | |19|W|4/19| Fast Multipole and Parallel Prefix | |[Unfinished Draft](https://math.mit.edu/~edelman/publications/fast_multipole.pdf) | 76 | |20|M|4/24| 77 | |21|W|4/26| Project Presentation I | 78 | |22|M|5/1| Project Presentation II | 79 | |23|W|5/3| Project Presentation III | 80 | |24|M|5/8| Project Presentation IV | 81 | |25|W|5/10| Project Presentation V | 82 | | |M|5/15| Class Cancelled | 83 | 84 | 85 | 86 | |8|W|3/1| GPU Parallelism I |[7][7]| [[video 1]](https://www.youtube.com/watch?v=riAbPZy9gFc),[[video2]](https://www.youtube.com/watch?v=HMmOk9GIhsw) 87 | |9|M|3/6| GPU Paralellism II | | [[video]](https://www.youtube.com/watch?v=zHPXGBiTM5A), [[Eig&SVD derivatives notebooks]](https://github.com/mitmath/18337/tree/master/lecture9), [[2022 IAP Class Matrix Calculus]](https://github.com/mitmath/matrixcalc) 88 | |10|W|3/8| MPI | | [Slides](https://github.com/SciML/SciMLBook/blob/spring21/lecture12/MPI.jl.pdf), [[video, Lauren Milichen]](https://www.youtube.com/watch?v=LCIJj0czofo),[[Performance Metrics]](https://github.com/mitmath/18337/blob/spring21/lecture12/PerformanceMetricsSoftwareArchitecture.pdf) see p317,15.6 89 | |11|M|3/13| Differential Equations I | [9][9]| 90 | |12|W|3/15| Differential Equations II |[10][10] | 91 | |13|M|3/20| Neural ODE |[11][11] | 92 | |14|W|3/22| |[13][13] | 93 | | | | | Spring Break | 94 | |15|M|4/3| | | [GPU Slides](https://docs.google.com/presentation/d/1npryMMe7JyLLCLdeAM3xSjLe5Q54eq0QQrZg5cxw-ds/edit?usp=sharing) [Prefix Materials](https://github.com/mitmath/18337/tree/master/lecture%2013) 95 | |16|W|4/5| Convolutions and PDEs | [14][14] | 96 | |17|M|4/10| Chris R on ode adjoints, PRAM Model |[11][11] | [[video]](https://www.youtube.com/watch?v=KCTfPyVIxpc)| 97 | |18|W|4/12| Linear and Nonlinear System Adjoints | [11][11] | [[video]](https://www.youtube.com/watch?v=KCTfPyVIxpc)| 98 | | |M|4/17| Patriots' Day 99 | |19|W|4/19| Lagrange Multipliers, Spectral Partitioning || [Partitioning Slides](https://github.com/alanedelman/18.337_2018/blob/master/Lectures/Lecture13_1022_SpectralPartitioning/Partitioning.ppt)| | 100 | |20|M|4/24| |[15][15]| [[video]](https://www.youtube.com/watch?v=YuaVXt--gAA),[notes on adjoint](https://github.com/mitmath/18337/blob/master/lecture20/adjointpde.pdf)| 101 | |21|W|4/26| Project Presentation I | 102 | |22|M|5/1| Project Presentation II | [Materials](https://github.com/mitmath/18337/tree/master/lecture%2022) 103 | |23|W|5/3| Project Presentation III | [16][16] | [[video](https://www.youtube.com/watch?v=32rAwtTAGdU)] 104 | 
|24|M|5/8| Project Presentation IV | 105 | |25|W|5/10| Project Presentation V | 106 | |26|M|5/15| Project Presentation VI| 107 | 108 | 109 | [1]:https://book.sciml.ai/notes/01/ 110 | [2]:https://book.sciml.ai/notes/02-Optimizing_Serial_Code/ 111 | [3]:https://book.sciml.ai/notes/03-Introduction_to_Scientific_Machine_Learning_through_Physics-Informed_Neural_Networks/ 112 | [4]:https://book.sciml.ai/notes/04-How_Loops_Work-An_Introduction_to_Discrete_Dynamics/ 113 | [5]:https://book.sciml.ai/notes/05-The_Basics_of_Single_Node_Parallel_Computing/ 114 | [6]:https://book.sciml.ai/notes/06-The_Different_Flavors_of_Parallelism/ 115 | [7]:https://book.sciml.ai/notes/07/ 116 | [8]:https://book.sciml.ai/notes/08-Forward-Mode_Automatic_Differentiation_(AD)_via_High_Dimensional_Algebras/ 117 | [9]:https://book.sciml.ai/notes/09/ 118 | [10]:https://book.sciml.ai/notes/10-Basic_Parameter_Estimation-Reverse-Mode_AD-and_Inverse_Problems/ 119 | [11]:https://book.sciml.ai/notes/11-Differentiable_Programming_and_Neural_Differential_Equations/ 120 | [13]:https://book.sciml.ai/notes/13/ 121 | [14]:https://book.sciml.ai/notes/14/ 122 | [15]:https://book.sciml.ai/notes/15/ 123 | [16]:https://book.sciml.ai/notes/16/ 124 | 125 | # Lecture Summaries and Handouts 126 | 127 | [Class Videos](https://mit.hosted.panopto.com/Panopto/Pages/Sessions/List.aspx?folderID=9e659f61-1fd4-4b98-96a0-af940143c9c7) 128 | 129 | ## Lecture 1: Syllabus, Introduction to Performance, Introduction to Automatic Differentiation 130 | 131 | Setting the stage for this course which will involve high performance computing, mathematics, and scientific machine learning, we looked 132 | at two introductory notebooks. The first [Julia is fast]](https://github.com/mitmath/18337/blob/master/lecture1/Julia%20is%20fast.ipynb) 133 | primarily reveals just how much performance languages like Python can leave on the table. Many people don't compare languages, so they 134 | are unlikely to be aware. The second [AutoDiff]](https://github.com/mitmath/18337/blob/master/lecture1/AutoDiff.ipynb) reveals the "magic" 135 | of forward mode autodifferentiation showing how a compiler can "rewrite" a program through the use of software overloading and still 136 | maintain performance. This is a whole new way to see calculus, not the way you learned it in a first year class, and not finite differences either. 137 | 138 | ## Lecture 2: The Parallel Dream and Intro to Matrix Calculus 139 | We gave an example 140 | [The Parallel Dream]](https://github.com/mitmath/18337/blob/master/lecture1/the_dream.ipynb) 141 | 142 | 143 | ### Lecture and Notes 144 | 145 | 146 | # Homeworks 147 | 148 | HW1 will be due Thursday Feb 16. This is really just a getting started homework. 149 | 150 | [Hw1](https://mitmath.github.io/18337/hw1/hw1.html) 151 | 152 | # Final Project 153 | 154 | For the second half of the class students will work on the final project. A one-page final project 155 | proposal must be sumbitted by March 24 Friday, through canvas. 156 | 157 | Last three weeks (tentative) will be student presentations. 158 | 159 | ## Possible Project Topics 160 | 161 | Here's a list of [current projects](https://github.com/JuliaLabs/julialabs.github.io/blob/master/projects.md) of interest to the julialab 162 | 163 | One possibility is to review an interesting algorithm not covered in the course 164 | and develop a high performance implementation. 
Some examples include: 165 | 166 | - High performance PDE solvers for specific PDEs like Navier-Stokes 167 | - Common high performance algorithms (Ex: Jacobian-Free Newton Krylov for PDEs) 168 | - Recreation of a parameter sensitivity study in a field like biology, 169 | pharmacology, or climate science 170 | - [Augmented Neural Ordinary Differential Equations](https://arxiv.org/abs/1904.01681) 171 | - [Neural Jump Stochastic Differential Equations](https://arxiv.org/pdf/1905.10403.pdf) 172 | - Parallelized stencil calculations 173 | - Distributed linear algebra kernels 174 | - Parallel implementations of statistical libraries, such as survival statistics 175 | or linear models for big data. Here's [one example parallel library)](https://github.com/harrelfe/rms) 176 | and a [second example](https://bioconductor.org/packages/release/data/experiment/html/RegParallel.html). 177 | - Parallelization of data analysis methods 178 | - Type-generic implementations of sparse linear algebra methods 179 | - A fast regex library 180 | - Math library primitives (exp, log, etc.) 181 | 182 | Another possibility is to work on state-of-the-art performance engineering. 183 | This would be implementing a new auto-parallelization or performance enhancement. 184 | For these types of projects, implementing an application for benchmarking is not 185 | required, and one can instead benchmark the effects on already existing code to 186 | find cases where it is beneficial (or leads to performance regressions). 187 | Possible examples are: 188 | 189 | - [Create a system for automatic multithreaded parallelism of array operations](https://github.com/JuliaLang/julia/issues/19777) and see what kinds of packages end up more efficient 190 | - [Setup BLAS with a PARTR backend](https://github.com/JuliaLang/julia/issues/32786) 191 | and investigate the downstream effects on multithreaded code like an existing 192 | PDE solver 193 | - [Investigate the effects of work-stealing in multithreaded loops](https://github.com/JuliaLang/julia/issues/21017) 194 | - Fast parallelized type-generic FFT. Starter code by Steven Johnson (creator of FFTW) 195 | and Yingbo Ma [can be found here](https://github.com/YingboMa/DFT.jl) 196 | - Type-generic BLAS. [Starter code can be found here](https://github.com/JuliaBLAS/JuliaBLAS.jl) 197 | - Implementation of parallelized map-reduce methods. For example, `pmapreduce` 198 | [extension to `pmap`](https://docs.julialang.org/en/v1/manual/parallel-computing/index.html) 199 | that adds a paralellized reduction, or a fast GPU-based map-reduce. 200 | - Investigating auto-compilation of full package codes to GPUs using tools like 201 | [CUDAnative](https://github.com/JuliaGPU/CUDAnative.jl) and/or 202 | [GPUifyLoops](https://github.com/vchuravy/GPUifyLoops.jl). 203 | - Investigating alternative implementations of databases and dataframes. 204 | [NamedTuple backends of DataFrames](https://github.com/JuliaData/DataFrames.jl/issues/1335), alternative [type-stable DataFrames](https://github.com/FugroRoames/TypedTables.jl), defaults for CSV reading and other large-table formats 205 | like [JuliaDB](https://github.com/JuliaComputing/JuliaDB.jl). 206 | 207 | Additionally, Scientific Machine Learning is a wide open field with lots of 208 | low hanging fruit. Instead of a review, a suitable research project can be 209 | used for chosen for the final project. 
Possibilities include: 210 | 211 | - Acceleration methods for adjoints of differential equations 212 | - Improved methods for Physics-Informed Neural Networks 213 | - New applications of neural differential equations 214 | - Parallelized implicit ODE solvers for large ODE systems 215 | - GPU-parallelized ODE/SDE solvers for small systems 216 | 217 | 218 | 219 | 220 | 221 | -------------------------------------------------------------------------------- /hw1/hints.md: -------------------------------------------------------------------------------- 1 | # Hints and Tricks for HW1. More will be added. 2 | # Note: any format submission (e.g. pdf, notebooks, zip) is fine 3 | 4 | ## Problem 1: 5 | 6 | **Note: g is a function from Rⁿ to Rⁿ** 7 | **Note: Understand that the goal of the problem is to understand the stability of these basic iterations as they will become critical 8 | for understanding the use of neural networks and other methods** 9 | 10 | **Reminder: Stability of x(n) = g(x(n-1)) is proved by taking the jacobian of g and showing its eigenvalues have absolute value < 1.** 11 | 12 | * Part 1: Should be straightforward. Think about x converging to the fixed point. 13 | * Part 2: Write your answer in terms of J_n the Jacobian of g at x_n and J_0 the Jacobian of g at x_0 and the Identity. 14 | 15 | **Hint:** What is the Jacobian of the function `x->x-J_0⁻¹g(x)` at x=x_n? That is the matrix you need to write down. 16 | 17 | **Hint:** You may use the fact that if `x_0 - x*` is small, then `J_0 ≈ J_n ≈ J_*`. More precisely, assume that `J_x⁻¹ J_y = I + O(|x - y|)` 18 | 19 | **Hint:** If a matrix is small then the eigenvalues of the matrix are small. 20 | 21 | * Part 4: Remember that the eigenvalues of `α * M` are α times the eigenvalues of M, and the problem says the eigenvalues are positive. 22 | 23 | * Part 4 24 | Better wording: create a new dynamical system that converges to a value x_e such that g(x_e) = 0. 25 | 26 | ## Problem 2: 27 | * Part 1: If you do part 1 as a Julia program (rather than as text), then Part 1 and Part 2 are the same. There really is no part 1. 28 | 29 | * Part 2: The prompt to make use of multiple dispatch might be a little bit misleading. You don't need to define multiple methods for `my_quantile` itself, but ideally you should take advantage of how Distributions.jl uses multiple dispatch. Distributions.jl defines methods for the functions `mean`, `pdf` and `cdf` for all `Distribution` objects, so if you implement `my_quantile` right, it should just work for any distribution. 30 | 31 | For those of you that are new to Julia, you can find a quick explanation of what multiple dispatch is [here](https://stackoverflow.com/questions/58700879/what-is-multiple-dispatch-and-how-does-one-use-it-in-julia). If you are more curious, you can also check out [this blog post explaining it in more detail](https://opensourc.es/blog/basics-multiple-dispatch/#what_is_dispatch) or [this video](https://www.youtube.com/watch?v=kc9HwsxE1OY) by Stefan explaining why this is actually so useful. 32 | 33 | **Hint:** You can get the CDF and PDF of a `Distribution` object `d` at point `x` with `cdf(d, x)` or `pdf(d, x)` respectively. You don't have to derive the PDF yourself. 
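**Hint:** If you want to see these functions in action before writing `my_quantile`, here is a minimal illustrative snippet (the particular distribution and evaluation points are arbitrary, chosen just for this example):

```julia
using Distributions

d = Normal(0, 1)       # any UnivariateDistribution works the same way
mean(d)                # 0.0  — a reasonable starting guess x₀
cdf(d, 0.0)            # 0.5  — probability that X < 0
pdf(d, 0.0)            # ≈ 0.3989, the derivative of the CDF at 0
quantile(d, 0.5)       # 0.0  — the built-in to compare your my_quantile against
```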
**Hint:** Julia allows you to compute default values for (keyword) arguments in the function signature itself, so your function definition could look like:
```julia
function my_quantile(d, y; x₀=mean(d))
    # the actual implementation
end
```

## Problem 3:

* Part 1: Some were a bit confused by the signature given for `calc_attractor!`. It's probably easiest if you write your function something like this:
```julia
function calc_attractor!(out, r, x₀; warmup=400)
    num_attract = length(out)
    # first do warmup then write each step to `out`
end
```
If you want you can generalize this to arbitrary systems given by some recurrence relation `f`, but this is not required.

**Optional Optimization** In Julia, you can get uninitialized arrays with the constructor `Array{Float64}(undef, dim1, dim2, ...)`, which will be slightly more efficient than `zeros` if you are overwriting each entry anyway.

**Optional Julia Syntax** For Parts 2-5, the functions `eachindex` and `eachcol` might be useful: `eachindex` iterates over each index of an array, and `eachcol` iterates over the columns of a matrix as views.

If a vector is 1-based there is no difference between `for i = 1:length(vector)` and `for i = eachindex(vector)`.

* Part 3: Use `@threads` to parallelize an embarrassingly parallel for loop.

Note that you cannot change the number of threads inside a Julia session, so you must start Julia with something like `julia -t 4` or use the VS Code setting like you saw in class (Code --> Preferences --> Settings --> threads; on a Mac it's Command-Comma).

* Part 4: We didn't get a chance to talk about `@distributed` in class, but here is an example. (This works on distributed memory computers, but you can also run it on your shared memory laptop. By contrast, `@threads` assumes shared memory.)

One can use `@distributed` in the same way as `@threads` (to parallelize a loop), but it also has the nice property of allowing reductions. In the following example, we use `(+)` and `hcat` as the reductions: summation, and horizontal concatenation (which packages all the results up in an array). (Note that `sum` would be wrong here; the reduction must be a binary operation.)

```julia
using Distributed
println(workers())

if nworkers()==1
    addprocs(5) # Unlike threads you can addprocs in the middle of a julia session
    println(workers())
end

@everywhere function f(i)
    return rand(10)*i
end

r = 1:10000

@distributed (+) for i in r
    f(i)
end

@distributed hcat for i in r
    f(i)
end
```

A note on `pmap` versus `@distributed`: `pmap` has a head node which sends the work to the other processors, with dynamic load balancing, while `@distributed` statically splits the loop iterations across the workers. For computations where there is a ton of data to send around, `pmap` can be very inefficient, but for this computation we expect hardly any difference, perhaps slightly different overheads. A sketch of a `pmap` version of the example above is given below.
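Not part of the required solution, but as a rough sketch mirroring the `@distributed` example: with `pmap`, the per-iteration results come back to the calling process, so the reductions happen afterwards.

```julia
using Distributed
if nworkers() == 1
    addprocs(5)
end

@everywhere f(i) = rand(10) * i

r = 1:10000

results = pmap(f, r)              # the head process farms out each i, with load balancing
total   = reduce(+, results)      # same as the @distributed (+) reduction
M       = reduce(hcat, results)   # same as the @distributed hcat reduction (10 × 10000 matrix)
```

For this problem the timings should be in the same ballpark as `@distributed`; the interesting comparison is when each iteration has a lot of data to ship around.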
108 | 109 | -------------------------------------------------------------------------------- /hw1/hw1.jl: -------------------------------------------------------------------------------- 1 | ### A Pluto.jl notebook ### 2 | # v0.19.14 3 | 4 | using Markdown 5 | using InteractiveUtils 6 | 7 | # ╔═╡ 9c384715-5bf5-4308-94ef-db4f26be45a4 8 | md"_Homework 1, version 1 -- 18.337 -- Spring 2023_" 9 | 10 | # ╔═╡ 7679b2c5-a644-4341-a7cc-d1335727aacd 11 | # edit the code below to set your name and kerberos ID (i.e. email without @mit.edu) 12 | 13 | student = (name = "Philip the Corgi", kerberos_id = "ptcorgi") 14 | 15 | # press the ▶ button in the bottom right of this cell to run your edits 16 | # or use Shift+Enter 17 | 18 | # you might need to wait until all other cells in this notebook have completed running. 19 | # scroll down the page to see what's up 20 | 21 | # ╔═╡ f8750fa4-8d49-4880-a53e-f40a653c84ea 22 | md"HW is to be submitted on Canvas in the form of a .jl file and .pdf file (use the browser print)" 23 | 24 | # ╔═╡ bec48cfd-ac3b-4dae-973f-cf529b3cdc05 25 | md""" 26 | # Homework 1: Getting up and running and Matrix Calculus 27 | 28 | HW1 release date: Thursday, Feb 9, 2023. 29 | 30 | **HW1 due date: Thursday, Feb 16, 2023, 11:59pm EST**, _but best completed before Wednesday's lecture if possible_. 31 | 32 | First of all, **_welcome to the course!_** We are excited to teach you about parallel computing and scientific machine lerning, using the same tools that we work with ourselves. 33 | 34 | 35 | Without submitting anything we'd also like you to login and try out Juliahub, which we will use later especially when we use GPUs. You might also try vscode on your own computer. 36 | """ 37 | 38 | # ╔═╡ 0da73ecd-5bda-4098-8f13-354af436d231 39 | md"## (Required) Exercise 0 - _Making a basic function_ 40 | 41 | Computing $x^2+1$ is easy -- you just multiply $x$ with itself and add 1. 42 | 43 | ##### Algorithm: 44 | 45 | Given: $x$ 46 | 47 | Output: $x^2+1$ 48 | 49 | 1. Multiply $x$ by $x$ and add 1" 50 | 51 | # ╔═╡ 963f24f5-a442-4590-b355-300703b0cf86 52 | function basic_function(x) 53 | return x*x # this is wrong, write your code here! 54 | end 55 | 56 | # ╔═╡ b6f5abbb-1c32-46d0-b92a-2d0c6c806348 57 | let 58 | result = basic_function(5) 59 | if !(result isa Number) 60 | md""" 61 | !!! warning "Not a number" 62 | `basic_square` did not return a number. Did you forget to write `return`? 63 | """ 64 | elseif abs(result - (5*5 + 1)) < 0.01 65 | md""" 66 | !!! correct 67 | Well done! 68 | """ 69 | else 70 | md""" 71 | !!! warning "Incorrect" 72 | Keep working on it! 73 | """ 74 | end 75 | end 76 | 77 | # ╔═╡ 172bd4bd-5ea9-475f-843d-abb86ffaed34 78 | 79 | 80 | # ╔═╡ 20ed1521-fb1d-43cd-8c6f-15041fc512ec 81 | if student.kerberos_id === "ptcorgi" 82 | md""" 83 | !!! danger "Oops!" 84 | **Before you submit**, remember to fill in your name and kerberos ID at the top of this notebook! 85 | """ 86 | end 87 | 88 | # ╔═╡ ceaf29f7-df04-481e-9836-68298a9f64c7 89 | md"""# Installation 90 | Before being able to run this notebook succesfully locally, you will need to [set up Julia and Pluto.](https://computationalthinking.mit.edu/Spring21/installation/) 91 | 92 | One you have Julia and Pluto installed, you can click the button at the top right of this page and follow the instructions to edit this notebook locally and submit. 
93 | """ 94 | 95 | # ╔═╡ 4ba96121-453d-400e-877a-61db02928ffb 96 | md""" 97 | # Matrix calculus 98 | """ 99 | 100 | # ╔═╡ 6996372a-0150-4522-8aa4-3fec36a0dcbb 101 | md""" 102 | For each function $f(x)$, work out the linear transformation $f'(x)$ such that $df = f'(x) dx$. 103 | Check your answers numerically using Julia by computing $f(x+e)-f(x)$ for some random $x$ and (small) $e$, and comparing with $f'(x)e$. 104 | We use lowercase $x$ for vectors and uppercase $X$ for matrices. 105 | 106 | For the written part write the answer in the form f'(x)[dx]. 107 | 108 | For the numerical part write a function that works for all $x$ and $e$ and run 109 | on a few random inputs. 110 | """ 111 | 112 | # ╔═╡ 6067b7d5-a8d4-4922-a761-210418032da5 113 | md""" 114 | ## Question 1 115 | 116 | $f \colon x \in \mathbb{R}^n \longmapsto (x^\top x)^2$. 117 | 118 | $f'(x)[dx]=?$ 119 | Note: dx is a column vector. Be sure your answer makes sense in terms 120 | of row and column vectors. 121 | """ 122 | 123 | # ╔═╡ 7b2550d6-422d-4b8b-a86c-7e49314ac6c9 124 | 125 | 126 | # ╔═╡ f95d162c-0522-4cb1-9251-7659fee4711e 127 | md""" 128 | ## Question 2 129 | 130 | $f \colon x \in \mathbb{R}^n \longmapsto \sin.(x)$, meaning the elementwise application of the $\sin$ function to each entry of the vector $x$, whose result is another vector in $\mathbb{R}^n$. 131 | """ 132 | 133 | # ╔═╡ a02e8536-0360-4043-90e7-4fb28966393d 134 | 135 | 136 | # ╔═╡ e5738862-51f5-4dde-81a8-6db7d3638270 137 | 138 | 139 | # ╔═╡ bc655179-19a3-42c7-ab8b-776d3158a8c6 140 | md""" 141 | ## Question 3 142 | 143 | $f \colon X \in \mathbb{R}^{n \times m} \longmapsto \theta^\top X$, where $\theta \in R^n$ is a vector 144 | """ 145 | 146 | # ╔═╡ 2721e816-327b-468e-8121-2dec969d2021 147 | md""" 148 | ## Question 4 149 | 150 | $f \colon X \in \mathbb{R}^{n \times n} \longmapsto X^{-2}$, where $X$ is non-singular. 
151 | """ 152 | 153 | # ╔═╡ 675fd3c3-063e-4b34-a43d-e2486ca514ae 154 | 155 | 156 | # ╔═╡ 29d955a0-0410-4d8e-89a8-81a63229126c 157 | # Your code goes here 158 | 159 | # ╔═╡ 00000000-0000-0000-0000-000000000001 160 | PLUTO_PROJECT_TOML_CONTENTS = """ 161 | [deps] 162 | """ 163 | 164 | # ╔═╡ 00000000-0000-0000-0000-000000000002 165 | PLUTO_MANIFEST_TOML_CONTENTS = """ 166 | # This file is machine-generated - editing it directly is not advised 167 | 168 | julia_version = "1.8.0-rc4" 169 | manifest_format = "2.0" 170 | project_hash = "da39a3ee5e6b4b0d3255bfef95601890afd80709" 171 | 172 | [deps] 173 | """ 174 | 175 | # ╔═╡ Cell order: 176 | # ╠═9c384715-5bf5-4308-94ef-db4f26be45a4 177 | # ╠═7679b2c5-a644-4341-a7cc-d1335727aacd 178 | # ╟─f8750fa4-8d49-4880-a53e-f40a653c84ea 179 | # ╟─bec48cfd-ac3b-4dae-973f-cf529b3cdc05 180 | # ╠═0da73ecd-5bda-4098-8f13-354af436d231 181 | # ╠═963f24f5-a442-4590-b355-300703b0cf86 182 | # ╟─b6f5abbb-1c32-46d0-b92a-2d0c6c806348 183 | # ╠═172bd4bd-5ea9-475f-843d-abb86ffaed34 184 | # ╟─20ed1521-fb1d-43cd-8c6f-15041fc512ec 185 | # ╟─ceaf29f7-df04-481e-9836-68298a9f64c7 186 | # ╟─4ba96121-453d-400e-877a-61db02928ffb 187 | # ╟─6996372a-0150-4522-8aa4-3fec36a0dcbb 188 | # ╟─6067b7d5-a8d4-4922-a761-210418032da5 189 | # ╠═7b2550d6-422d-4b8b-a86c-7e49314ac6c9 190 | # ╟─f95d162c-0522-4cb1-9251-7659fee4711e 191 | # ╠═a02e8536-0360-4043-90e7-4fb28966393d 192 | # ╠═e5738862-51f5-4dde-81a8-6db7d3638270 193 | # ╟─bc655179-19a3-42c7-ab8b-776d3158a8c6 194 | # ╟─2721e816-327b-468e-8121-2dec969d2021 195 | # ╠═675fd3c3-063e-4b34-a43d-e2486ca514ae 196 | # ╠═29d955a0-0410-4d8e-89a8-81a63229126c 197 | # ╟─00000000-0000-0000-0000-000000000001 198 | # ╟─00000000-0000-0000-0000-000000000002 199 | -------------------------------------------------------------------------------- /hw1/hw1.jmd: -------------------------------------------------------------------------------- 1 | --- 2 | title: Homework 1, Parallelized Dynamics 3 | date: February 2nd, 2022 4 | --- 5 | The problems up to Problem 3 Part 2 are 6 | due Wednesday February 16, 2022 at 11:59pm EST. 7 | We'll have the parallel parts (Problem 3, Part 3 and 4) due Tuesday February 22, 2022. 8 | 9 | At the time of assignment, we have not covered all the material yet, 10 | but I wanted to give you a headstart. 11 | 12 | Homework 1 is a chance to get some experience implementing discrete dynamical 13 | systems techniques in a way that is parallelized, and a time to understand the 14 | fundamental behavior of the bottleneck algorithms in scientific computing. 15 | 16 | Please submit the hw to canvas. Canvas will only be used for hw submission. 17 | (Original pset authored by Chris Rackauckas.) 18 | 19 | ## Problem 1: A Ton of New Facts on Newton 20 | 21 | In this problem we will look into Newton's method. Newton's method is the 22 | dynamical system defined by the update process: 23 | 24 | $$x_{n+1} = x_n - \left(\frac{dg}{dx}(x_n)\right)^{-1} g(x_n)$$ 25 | 26 | For these problems, assume that $\frac{dg}{dx}$ is non-singular. 27 | 28 | ### Part 1 29 | 30 | Show that if $x^\ast$ is a steady state of the equation, then $g(x^\ast) = 0$. 31 | 32 | ### Part 2 33 | 34 | Take a look at the Quasi-Newton approximation: 35 | 36 | $$x_{n+1} = x_n - \left(\frac{dg}{dx}(x_0)\right)^{-1} g(x_n)$$ 37 | 38 | for some fixed $x_0$. Derive the stability of the Quasi-Newton approximation 39 | in the form of a matrix whose eigenvalues need to be constrained. 
Use this 40 | to argue that if $x_0$ is sufficiently close to $x^\ast$ then the steady 41 | state is a stable (attracting) steady state. 42 | 43 | ### Part 3 44 | 45 | Relaxed Quasi-Newton is the method: 46 | 47 | $$x_{n+1} = x_n - \alpha \left(\frac{dg}{dx}(x_0)\right)^{-1} g(x_n)$$ 48 | 49 | Argue that for some sufficiently small $\alpha$ that the Quasi-Newton iterations 50 | will be stable if the eigenvalues of 51 | $(\left(\frac{dg}{dx}(x_0)\right)^{-1} g(x_n))^\prime$ are all positive for 52 | every $x$. 53 | 54 | (Technically, these assumptions can be greatly relaxed, but weird cases arise. 55 | When $x \in \mathbb{C}$, this holds except on some set of Lebesgue measure zero. 56 | Feel free to explore this.) 57 | 58 | ### Part 4 59 | 60 | Fixed point iteration is the dynamical system 61 | 62 | $$x_{n+1} = g(x_n)$$ 63 | 64 | which converges to $g(x)=x$. 65 | 66 | 1. What is a small change to the dynamical system that could be done such that 67 | $g(x)=0$ is the steady state? 68 | 2. How can you change the $\left(\frac{dg}{dx}(x_0)\right)^{-1}$ term from the 69 | Quasi-Newton iteration to get a method equivalent to fixed point iteration? 70 | What does this imply about the difference in stability between Quasi-Newton 71 | and fixed point iteration if $\frac{dg}{dx}$ has large eigenvalues? 72 | 73 | ## Problem 2: The Root of all Problems 74 | 75 | In this problem we will practice writing fast and type-generic Julia code by 76 | producing an algorithm that will compute the quantile of any probability 77 | distribution. 78 | 79 | ### Part 1 80 | 81 | Many problems can be interpreted as a rootfinding problem. For example, let's 82 | take a look at a problem in statistics. Let $X$ be a random variable with a 83 | cumulative distribution function (CDF) of $cdf(x)$. Recall that the CDF is a 84 | monotonically increasing function in $[0,1]$ which is the total probability of 85 | $X < x$. The $y$th quantile of $X$ is the value $x$ at with $X$ has a y% chance 86 | of being less than $x$. Interpret the problem of computing an arbitrary quantile 87 | $y$ as a rootfinding problem, and use Newton's method to write an algorithm 88 | for computing $x$. 89 | 90 | (Hint: Recall that $cdf^{\prime}(x) = pdf(x)$, the probability distribution 91 | function.) 92 | 93 | ### Part 2 94 | 95 | Use the types from Distributions.jl to write a function 96 | `my_quantile(y,d)` which uses multiple dispatch to compute the 97 | $y$th quantile for any `UnivariateDistribution` `d` from Distributions.jl. 98 | Test your function on `Gamma(5, 1)`, `Normal(0, 1)`, and `Beta(2, 4)` against 99 | the `Distributions.quantile` function built into the library. 100 | 101 | (Hint: Have a keyword argument for $x_0$, and let its default be the mean or 102 | median of the distribution.) 103 | 104 | ## Problem 3: Bifurcating Data for Parallelism 105 | 106 | In this problem we will write code for efficient generation of the bifurcation 107 | diagram of the logistic equation. 108 | 109 | ### Part 1 110 | 111 | The logistic equation is the dynamical system given by the update relation: 112 | 113 | $$x_{n+1} = rx_n (1-x_n)$$ 114 | 115 | where $r$ is some parameter. Write a function which iterates the equation from 116 | $x_0 = 0.25$ enough times to be sufficiently close to its long-term behavior 117 | (400 iterations) and samples 150 points from the steady state attractor 118 | (i.e. output iterations 401:550) as a function of $r$, and mutates some vector 119 | as a solution, i.e. `calc_attractor!(out,f,p,num_attract=150;warmup=400)`. 
120 | 121 | Test your function with $r = 2.9$. Double check that your function computes 122 | the correct result by calculating the analytical steady state value. 123 | 124 | ### Part 2 125 | 126 | The bifurcation plot shows how a steady state changes as a parameter changes. 127 | Compute the long-term result of the logistic equation at the values of 128 | `r = 2.9:0.001:4`, and plot the steady state values for each $r$ as an 129 | r x steady_attractor scatter plot. You should get a very bizarrely awesome 130 | picture, the bifurcation graph of the logistic equation. 131 | 132 |  133 | 134 | (Hint: Generate a single matrix for the attractor values, and use `calc_attractor!` 135 | on views of columns for calculating the output, or inline the `calc_attractor!` 136 | computation directly onto the matrix, or even give `calc_attractor!` an input 137 | for what column to modify.) 138 | 139 | ### Part 3 140 | 141 | Multithread your bifurcation graph generator by performing different steady 142 | state calcuations on different threads. Does your timing improve? Why? Be 143 | careful and check to make sure you have more than 1 thread! 144 | 145 | ### Part 4 146 | 147 | Multiprocess your bifurcation graph generator first by using `pmap`, and then 148 | by using `@distributed`. Does your timing improve? Why? Be careful to add 149 | processes before doing the distributed call. 150 | 151 | (Note: You may need to change your implementation around to be allocating 152 | differently in order for it to be compatible with multiprocessing!) 153 | 154 | ### Part 5 155 | 156 | Which method is the fastest? Why? 157 | -------------------------------------------------------------------------------- /hw2/hints2.md: -------------------------------------------------------------------------------- 1 | # Hints and Tricks for HW2. 2 | # Note: any format submission (e.g. pdf, notebooks, zip) is fine 3 | 4 | 5 | 6 | ** Motivation: In this problem you will learn to do scientific machine learning. Yay! 7 | We will generate some artificial data, and find parameters to fit a differential equation. 8 | 9 | ## Problem 1: 10 | 11 | Many people are impressed by differential equation solvers such as the ones that appear 12 | in commonly used packages. The feeling is they must be so much more 13 | complicated than the Euler methods one sees in the basic classes. 14 | Here we will demonstrate that it is remarkably simple 15 | to build these solvers yourself. Everybody should do this once in their lifetimes. 16 | 17 | All you really need is the data in [the Dormand Prince Wikipedia article ](https://en.wikipedia.org/wiki/Dormand%E2%80%93Prince_method) and the algorithm in the [the Butcher Wikipedia article](https://en.wikipedia.org/wiki/Runge%E2%80%93Kutta_methods#Explicit_Runge.E2.80.93Kutta_methods) . There is also discussion 18 | about this method in the class notes [Lecture 7](https://book.sciml.ai/notes/07/) search for Higher Order Methods 19 | towards the bottom of the page. 
20 | 21 | For the data, you can just copy and paste (and maybe use Static Vectors): 22 | ```julia 23 | const s = 7 24 | const a = @SVector[ 25 | 1/5, 26 | 3/40, 9/40, 27 | 44/45, −56/15, 32/9, 28 | 19372/6561, −25360/2187, 64448/6561, −212/729, 29 | 9017/3168, −355/33, 46732/5247, 49/176, −5103/18656, 30 | 35/384, 0, 500/1113, 125/192, −2187/6784, 11/84, 31 | ] 32 | const b = @SVector[35/384, 0, 500/1113, 125/192, −2187/6784, 11/84, 0] 33 | const c = @SVector[0, 1/5, 3/10, 4/5, 8/9, 1, 1] 34 | ``` 35 | For Part 2 of Problem 1 see [[pdf file]](https://github.com/mitmath/18337/blob/master/hw2/hw2_hint.pdf) 36 | I believe setting the initial conditions to 0 for the 8 new parameters should work just fine. 37 | 38 | Part 3: use the data from all the timesteps 39 | 40 | 41 | 42 | 43 | 44 | 45 | 46 | 47 | 48 | 49 | -------------------------------------------------------------------------------- /hw2/hw2_hint.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/hw2/hw2_hint.pdf -------------------------------------------------------------------------------- /hw2/hw2_hint.tex: -------------------------------------------------------------------------------- 1 | \documentclass{article} 2 | \usepackage[utf8]{inputenc} 3 | \usepackage{amsmath} 4 | \usepackage{physics} 5 | 6 | \begin{document} 7 | \section{HW2 Hint} 8 | \subsection{Problem 1} 9 | \subsubsection{Part 2} 10 | 11 | It is helpful to realize that $x$ and $y$ depend not only on $t$ but on the four parameters $p=(\alpha,\beta,\gamma,\delta).$ 12 | 13 | Thus it is reasonable to evolve not only $u$=[$x$, $y$] with time but also the 14 | eight variables in the 2x4 matrix: 15 | $$ 16 | \frac{\partial{u}}{\partial p}= 17 | \begin{pmatrix} 18 | \frac{\partial x}{\partial \alpha} & 19 | \frac{\partial x}{\partial \beta} & 20 | \frac{\partial x}{\partial \gamma} & 21 | \frac{\partial x}{\partial \delta} \\ 22 | \frac{\partial y}{\partial \alpha} & 23 | \frac{\partial y}{\partial \beta} & 24 | \frac{\partial y}{\partial \gamma} & 25 | \frac{\partial y}{\partial \delta} 26 | \end{pmatrix}.$$ 27 | Thus we are evolving 10 variables in 28 | total. 29 | I'm wondering if it matters 30 | if we start these eight variables 31 | at 0 at t=0 or not? 32 | 33 | Here 34 | $$f(u,p,t) = 35 | \begin{pmatrix} 36 | \alpha x - \beta x y \\ 37 | -\gamma y + \delta x y 38 | \end{pmatrix}. 39 | $$ 40 | 41 | You will need the Jacobian 42 | of $f$ with respect to $x$ and $y$: 43 | $$\frac{\partial f}{\partial u} 44 | = 45 | \begin{pmatrix} 46 | \alpha-\beta y & - \beta x \\ 47 | \delta y & -\gamma + \delta x 48 | \end{pmatrix}, 49 | $$ 50 | and also the Jacobian of $f$ with 51 | respect to $\alpha,\beta,\gamma,\delta$: 52 | 53 | $$ 54 | \frac{\partial f}{\partial p}= 55 | \begin{pmatrix} 56 | x & -xy & 0 & 0 \\ 57 | 0 & 0 & -y & xy 58 | \end{pmatrix}. 59 | $$ 60 | 61 | Note that the resulting system does not have a nice analytical solution since $x$ and $y$ are functions of 62 | $t$. Instead, use your integrator from part 1 for solving the new combined system. 63 | 64 | \subsubsection{Part 3} 65 | 66 | First you will need to write down the loss function you want to minimize. You are asked to use the L2-norm 67 | of the difference between your computed solution $u(t_i)$ and the original solution from part 1 $\hat u(t_i)$ you are trying to 68 | recreate (the training data if you will). 
The loss function $L(u)$ then looks as follows: 69 | 70 | $$ 71 | L(u) = \sum_i (u(t_i) - \hat u(t_i))^2 72 | $$ 73 | 74 | You want to minimize this function via gradient descent, so you need to find the gradient w.r.t. the parameters 75 | $p$ ($\alpha$, $\beta$, $\gamma$, and $\delta$). Use the chain rule: 76 | 77 | $$ 78 | \pdv{L}{p} = \sum_i \pdv{L}{u(t_i)} \cdot \pdv{u(t_i)}{p} 79 | $$ 80 | 81 | $\pdv{L}{u(t_i)}$ is straightforward to derive from the previous equation and $\pdv{u(t_i)}{p}$ is exactly what you were 82 | supposed to find a way to calculate numerically in part 2. 83 | 84 | 85 | \end{document} 86 | -------------------------------------------------------------------------------- /hw3/18_337_2023_pset3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/hw3/18_337_2023_pset3.pdf -------------------------------------------------------------------------------- /hw3/parallelhistogram.jl: -------------------------------------------------------------------------------- 1 | using Plots, Random, SpecialFunctions, FastGaussQuadrature, LinearAlgebra, ForwardDiff 2 | 3 | airy_kernel(x, y) = x==y ? (airyaiprime(x))^2 - x * (airyai(x))^2 : 4 | (airyai(x) * airyaiprime(y) - airyai(y) * airyaiprime(x)) / (x - y) 5 | ϕ(ξ, s) = s + 10*tan(π*(ξ+1)/4) # Transformation from [-1,1] to (s,∞) 6 | ϕ′(ξ) = (5π/2)*(sec(π*(ξ+1)/4))^2 7 | K(ξ,η,s) = sqrt(ϕ′(ξ) * ϕ′(η)) * airy_kernel(ϕ(ξ,s), ϕ(η,s)) 8 | 9 | function K(s , n=100) 10 | nodes,weights = gausslegendre(n) 11 | Symmetric( K.(nodes',nodes,s) .* (√).(weights) .* (√).(weights')) 12 | end 13 | 14 | TracyWidomPDF_via_Fredholm_Det(s) = ForwardDiff.derivative( t->det(I-K(t)),s) 15 | 16 | t = 300 # change to 10_000 slowly when ready 17 | 18 | n = 6^6 19 | dx = 1/6 20 | v = zeros(t) 21 | 22 | 23 | ## Experiment 24 | v = zeros(t) 25 | Threads.@threads for i ∈ 1:t 26 | v[i] = patiencesort1(randperm(n)) # use your fastest function here 27 | end 28 | w = (v .- 2sqrt(n+.5)) ./ (n^(1/6)) 29 | histogram(w, normalized=true, bins=-4.5:dx:2) 30 | 31 | plot!(TracyWidomPDF_via_Fredholm_Det, -5.0, 2, label="Theory", lw=3) -------------------------------------------------------------------------------- /hw3/patiencesort1.jl: -------------------------------------------------------------------------------- 1 | function patiencesort1(p) 2 | # p : Permutation 3 | # Returns length of longest increasing subsequence 4 | pile_tops = Int[] 5 | for α ∈ p 6 | whichpile = 1+sum(α.>pile_tops) # first pile where α is smaller 7 | if whichpile ≤ length(pile_tops) 8 | pile_tops[whichpile] = α # put α on top of a pile or .. 9 | else 10 | push!(pile_tops, α) # create a new pile 11 | end 12 | end 13 | return length(pile_tops) 14 | end -------------------------------------------------------------------------------- /hw4.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/hw4.pdf -------------------------------------------------------------------------------- /hw4/hints.md: -------------------------------------------------------------------------------- 1 | # Hints for https://book.sciml.ai/homework/03/ 2 | 3 | This problem has many moving parts, but should be very satisfying once you get this to work properly. 
When you reach ``the finish line" (Boston marathon is Monday after all) please 4 | stop and think how this idea can be used and adapted for many other problems. 5 | 6 | 7 | ## Problem 1 8 | 9 | * Part 1: The definition of pullback first appears in [CR Lecture 10][10]. In particular the input of the pullback B has the size of the output of f. The output value of B has the shape of the inputs to f. A scalar function f of many variables has a B with input a scalar and an output the shape of the variables. 10 | 11 | A gradient (∇) of a scalar function of a column vector is traditionally a column vector. 12 | The Jacobian of the same scalar function is the corresponding row vector. More generally 13 | the gradient of a scalar function of any combination of shapes has the same shapes as the input. 14 | 15 | 16 | For problem 1, I would have said that B(1) is the gradient not the transpose, i.e. it is a column vector. 17 | I will be completely consistent. 18 | 19 | vjp refers to vector jacobian product. (Not a great name. 20 | In part because it's not clear, and in part because we are going 21 | to more consistently compute "Jacobian transpose"*vector. 22 | ) Computationally one does not often form Jacobians these days as they are too expensive, but rather vjp's. 23 | A function from R^n to R^m has a Jacobian that is mxn. 24 | The resulting vjp then is a vector of size m. (Note Julia's vectors are not rows or columns, they are just one dimensional.) In one place in Chris' notes he treats it as a row vector, but more consistent and simpler is to think column vector. 25 | 26 | * For part 2 see https://book.sciml.ai/notes/10/, specifically equations 36-41 will be relevant to part 2 27 | 28 | Perhaps define a function with firstline `function pullback(y,u, W₁, W, b₁, b₂)` which can be called 29 | `ū, W̄₁, W̄₂, b̄₁, b̄₂ = pullback(y, u, W₁, W, b₁, b₂)`. 30 | 31 | Note the input `y` of the pullback here is a 2-vector and the output has the same shape of the five objects, u,W1,W2,b1,b2. 32 | 33 | For the ODE, in Part 3 you'll then need to flatten those into a vector. Perhaps write a function 34 | `p = flatten(u, W₁, W, b₁, b₂)` and `u, W₁, W, b₁, b₂ = unflatten(p)`. 35 | 36 | You can do `[vec.(B_NN(y))...]` to flatten and for unflattening, use slicing and perhaps reshaping (e.g. `reshape(µ[1:10], 2, 5)`) for the final µ to use in the gradient descent step to optimize the weights. 37 | 38 | Notice that equations (36) to (41) give expressions for `W̄₁, W̄₂, b̄₁, b̄₂` but while `x` serves as the `u` , in those equations it is not considered a parameter and so you will have to figure out the right expression for `ū`. 39 | Hint: `u` just appears as matrix times vector, so perhaps looking at equation (38) might help you see the right answer. 40 | 41 | ## Part 3: you can do Part 2 yourself if you like, or use ForwardDiff.jl or Zygote. jl if you like. 42 | 43 | * Part 3: Use https://diffeq.sciml.ai/stable/features/callback_library/#PresetTimeCallback for adding the jumps for $\lambda$. A nice example of difeqs with jumps and how to run the software 44 | may be found here: https://diffeq.sciml.ai/stable/features/callback_functions/#PresetTimeCallback . 45 | 46 | Part 3 consists first of a forward pass to obtain u(t). We might recommend just saving the solution, but you can also just save u(T) and then (re)compute u in reverse with the λ and μ. 
The second requirement of Part 3 is 47 | a backward pass `tspan=(1.0,0.0)` with the primary goal 48 | to obtain the final value of μ(0) which is the flattened version of the gradient that we seek. 49 | Notice that μ would be expressed on a blackboard as a simple integral, but as a memory saving trick 50 | (we don't need to store the λ's, we can use them on the fly) we express this as a differential equation. 51 | 52 | Following our convention, we might recommend (you can do it either way) thinking of λ as a column vector. 53 | So you are solving λ' = -fᵤᵀλ + (jumps when appropriate) and μ' = -f_pᵀλ . 54 | (We won't take jumps for μ because our loss function will not depend explicitly on the parameters, i.e., g_p=0 55 | .) 56 | 57 | Notice that you will not compute fᵤᵀλ but rather you will use the ū result of the pullback function that you wrote in Part 2 calling for example, `pullback(λ, u, W₁, W, b₁, b₂)`. Don't worry the 58 | `W̄₁, W̄₂, b̄₁, b̄₂` parts will not go to waste as you need them for the f_pᵀλ. 59 | 60 | 61 | To solve for λ you will need Cᵤ for the initial condition at T=1 and Cᵤ at 0:.1:.9 for the jumps. 62 | The only time you will use Cᵤ for λ is T=1, for all other λ(t) you will be solving the differential 63 | equation λ' = fᵤᵀλ + (jumps when appropriate), where the jumps which will also be Cᵤ. 64 | Anticipating part 4, we can use the explicit values Cᵤ = 2(u(t)-û(t)), where u(t) is at the forward pass and û(t) is the known theoretical solution. (Those of you who are following will note that Cᵤ plays 65 | the role of gᵤᵀ hence it is a column vector so λ' = fᵤᵀλ +gᵤᵀ at the jumps.) 66 | 67 | When going forward just use t going from 0 to 1. No need to think about the .1's just yet. 68 | u(0) is an arbitrary 2-vector for now, but in part 4 it will be [2,0]. When going backward t 69 | run from 1 to 0 (not just at the discrete time steps of multiples of .1) 70 | 71 | * Part 4: you now have the ability to maneuver around p space and train. You will need to do gradient 72 | descent with the old problem of figuring out what multiple of the gradient to take, i.e. the stepsize. 73 | If you know some fancy methods you may give it a try, but you can also take stepsizes around .1 or .01 and 74 | then if necessary reduce this until convergence seems reasonable. Plotting the loss function is recommended 75 | for this purpose. 76 | 77 | As a finale, compare the theoretical value of the known solution with the trained solution. 
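As a rough sketch of that training loop (assuming you have written a `loss(p)` that does the forward pass and evaluates the cost, and a `gradient(p)` that returns μ(0) flattened the same way as `p` — both names here are placeholders, not code we have given you):

```julia
function train(p; η=0.01, iters=500)
    losses = Float64[]
    for _ in 1:iters
        g = gradient(p)      # μ(0) from the backward pass, flattened like p
        p = p .- η .* g      # plain gradient-descent step
        push!(losses, loss(p))
    end
    return p, losses
end

# p_trained, losses = train(p₀)
# plot(losses, yscale=:log10)   # if the curve blows up, shrink η and try again
```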
78 | 79 | [10]:https://book.sciml.ai/notes/10/ 80 | -------------------------------------------------------------------------------- /lecture 11/adjoint handwritten notes.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/lecture 11/adjoint handwritten notes.pdf -------------------------------------------------------------------------------- /lecture 12/..textClipping: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/lecture 12/..textClipping -------------------------------------------------------------------------------- /lecture 12/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mitmath/18337/bd60c58e052232f6ae7ada430904de534d1c5843/lecture 12/.DS_Store -------------------------------------------------------------------------------- /lecture 12/notebook.jl: -------------------------------------------------------------------------------- 1 | ### A Pluto.jl notebook ### 2 | # v0.18.0 3 | 4 | using Markdown 5 | using InteractiveUtils 6 | 7 | # ╔═╡ d5559dba-9fe4-11ec-3744-ebd1408e7dc4 8 | using LegibleLambdas, AbstractTrees, PlutoUI, HypertextLiteral, PlutoTest 9 | 10 | # ╔═╡ 99b6ab91-a022-449c-988c-0e5c5719c910 11 | begin 12 | struct Tracked{T} <: Number 13 | # The numerical result when doing the forward pass 14 | val::T 15 | name::Symbol 16 | # The pullback map for the reverse pass 17 | df 18 | # All the other variables this variable directly depends on 19 | deps::Vector{Tracked} 20 | end 21 | Tracked{T}(x, name=gensym()) where {T} = Tracked{T}(x, name, nothing, Tracked[]) 22 | # This tells Julia to convert any number added to a `Tracked` to a `Tracked` first 23 | Base.promote_rule(::Type{Tracked{S}}, ::Type{T}) where {S<:Number, T<:Number} = Tracked{promote_type(S, T)} 24 | end 25 | 26 | # ╔═╡ 13487e65-5e48-4a37-9bea-f262dd7b6d56 27 | # calculate the sum, but also remember the pullback map and input variables for the reverse pass which we'll need to calculate the gradient 28 | # `@λ` is just for the nicer printing, we could have replaced `@λ(Δ -> (Δ, Δ))` with `Δ -> (Δ, Δ)` if we didn't care about that 29 | function Base.:+(x::Tracked, y::Tracked) 30 | Tracked(x.val + y.val, :+, @λ(Δ -> (Δ, Δ)), Tracked[x, y]) 31 | end 32 | 33 | # ╔═╡ b0cc4665-eb45-48ea-9a33-5acf56d2a283 34 | function Base.:-(x::Tracked, y::Tracked) 35 | Tracked(x.val - y.val, :-, @λ(Δ -> (Δ, -Δ)), Tracked[x, y]) 36 | end 37 | 38 | # ╔═╡ 73d638bf-30c1-4694-b3a8-4b29c5e3fa65 39 | function Base.:*(x::Tracked, y::Tracked) 40 | Tracked(x.val * y.val, :*, @λ(Δ -> (Δ * y.val, Δ * x.val)), Tracked[x, y]) 41 | end 42 | 43 | # ╔═╡ ac097299-0a31-474c-ab26-a4fb24bb9046 44 | function Base.:^(x::Tracked, n::Int) 45 | Tracked(x.val^n, Symbol("^$n"), @λ(Δ -> (Δ * n * x.val^(n-1),)), Tracked[x,]) 46 | end 47 | 48 | # ╔═╡ 2141849b-675e-406c-8df4-34b2706507af 49 | function Base.:/(x::Tracked, y::Tracked) 50 | Tracked(x.val / y.val, :/, @λ(Δ -> (Δ / y.val, -Δ * x.val / y.val^2)), Tracked[x, y]) 51 | end 52 | 53 | # ╔═╡ 7429ffcb-dcee-4090-972e-ffde8393a37a 54 | begin 55 | # `Tracked` is a tree, we just need to tell AbstractTrees.jl how to get the children for each node 56 | AbstractTrees.children(x::Tracked) = x.deps 57 | # All this is just for nicer printing 58 | function Base.show(io::IO, x::Tracked) 59 | if x.df === 
nothing 60 | print(io, Base.isgensym(x.name) ? x.val : "$(x.name)=$(x.val)") 61 | else 62 | print(io, "Tracked(") 63 | show(io, x.val) 64 | print(io, ", ") 65 | print(io, x.name) 66 | #print(io, ", ") 67 | #show(io, x.df) 68 | print(io, ")") 69 | end 70 | end 71 | Base.show(io::IO, ::MIME"text/plain", x::Tracked) = print_tree(io, x) 72 | end 73 | 74 | # ╔═╡ 0b5e6560-81fd-4182-bba5-aca702fb3048 75 | begin 76 | x = Tracked{Int}(3, :x) 77 | y = Tracked{Int}(5, :y) 78 | end 79 | 80 | # ╔═╡ 81eb8a2d-a3a9-45af-a5a5-b96aefd48712 81 | (2x + (x-1)^2).val # The regular result of `2x + (x-1)^2` 82 | 83 | # ╔═╡ e52aa672-69a9-419b-a992-e7a3d1364fb6 84 | # PreOrderDFS traverses this tree from the top down 85 | Text.(collect(PreOrderDFS(y*x+x^2))) 86 | 87 | # ╔═╡ f0814e23-6f75-4db8-b277-d21d4926f876 88 | y*x+x^2 89 | 90 | # ╔═╡ 99a3507b-ca03-429f-acde-e2d1ebb32054 91 | # produces a dict with all the intermediate gradient 92 | function grad(f::Tracked) 93 | d = Dict{Any, Any}(f => 1) 94 | for x in PreOrderDFS(f) # recursively traverse all dependents 95 | x.df === nothing && continue # ignore untracked variables like constants 96 | dy = x.df(d[x]) # evaluate pullback 97 | for (yᵢ, dyᵢ) in zip(x.deps, dy) 98 | # store the gradient in d 99 | # if we have already stored a gradient for this variable, we need to add them 100 | d[yᵢ] = get(d, yᵢ, 0) + dyᵢ 101 | end 102 | end 103 | return d 104 | end 105 | 106 | # ╔═╡ d4e9b202-242e-4420-986b-12d2ab57af93 107 | grad(f::Tracked, x::Tracked) = grad(f)[x] 108 | 109 | # ╔═╡ dc62ff81-dbb8-4416-8fc7-8878e16bdf85 110 | grad(y) 111 | 112 | # ╔═╡ fc8aeed7-2806-438a-85f7-c155b0b222e6 113 | #grad(y, x) 114 | 115 | # ╔═╡ a34a0941-6e7e-4a40-affa-7941c54a10b9 116 | y 117 | 118 | # ╔═╡ 18b1c55d-a6b5-44f6-b0b3-50bdb0aa9d96 119 | w = x*y + x 120 | 121 | # ╔═╡ 506d408e-dc2b-4e12-b917-286e3f4079a2 122 | grad(w) 123 | 124 | # ╔═╡ 1a154bb7-93a3-4973-8908-788db77ac294 125 | @htl """ 126 | 127 | 139 | 140 | 141 | 142 | 143 | 144 | """ 145 | 146 | # ╔═╡ 6b1fb808-e993-4c2b-b81b-6710f8206de7 147 | function to_json(x) 148 | d = Dict{Symbol, Any}( 149 | :text => Dict{Symbol, Any}(:name => sprint(AbstractTrees.printnode, x)), 150 | :children => Any[to_json(c) for c in children(x)], 151 | :collapsed => !isempty(children(x)), 152 | ) 153 | end 154 | 155 | # ╔═╡ 437285d4-ec53-4bb7-9966-fcfb5352e205 156 | function show_tree(x; height=400) 157 | id = gensym() 158 | @htl """ 159 |