├── .gitignore ├── Optimizers ├── NAG.py ├── accsgd.py ├── adabelief.py ├── adabound.py ├── adadelta.py ├── adafactor.py ├── adagrad.py ├── adahessian.py ├── adai.py ├── adam.py ├── adam_mini.py ├── adamax.py ├── adamod.py ├── adamp.py ├── adamw.py ├── adan.py ├── aggmo.py ├── apollo.py ├── came.py ├── diffgrad.py ├── dummy.py ├── lamb.py ├── lars.py ├── lion.py ├── lookahead.py ├── madgrad.py ├── nadam.py ├── novograd.py ├── pid.py ├── prodigy.py ├── qhadam.py ├── qhm.py ├── radam.py ├── ranger.py ├── rmsprop.py ├── rprop.py ├── sam.py ├── sgd.py ├── sgdp.py ├── sgdw.py ├── shampoo.py ├── sophia.py ├── svrg.py ├── swats.py └── yogi.py ├── README.md ├── Tutorial ├── EPFL_optML │ ├── lecture-notes.pdf │ ├── lecture01.pdf │ ├── lecture02.pdf │ ├── lecture03.pdf │ ├── lecture04.pdf │ ├── lecture05.pdf │ ├── lecture06.pdf │ ├── lecture07.pdf │ ├── lecture08.pdf │ ├── lecture09.pdf │ ├── lecture10.pdf │ ├── lecture11.pdf │ └── lecture12.pdf ├── Presentation___Data-centric_Methods__mobile.pdf ├── Presentation___Optimizer_Preconditioners__main.pdf ├── Presentation___Optimizer_Preconditioners__mobile.pdf └── slides-summer-school.pdf ├── assets ├── css │ └── styles.css ├── img │ ├── blogs │ │ ├── lora-weight-decay-2025.svg │ │ ├── lora-without-regret-2025.png │ │ ├── modular-manifolds-2025.png │ │ └── optimizer-choice-training-2024.jpg │ ├── logo.png │ ├── rastrigin.png │ ├── rosenbrock.jpg │ ├── scalingopt.png │ ├── tianshijing.png │ └── tutorials │ │ ├── cmu-convex-opt-2018.gif │ │ ├── cmu-convex-opt-2018.png │ │ ├── convex-optimization-ahmad-bazzi.png │ │ ├── data-centric-methods.png │ │ ├── epfl-optml-lecture01.png │ │ ├── epfl-optml-lecture02.png │ │ ├── epfl-optml-lecture03.png │ │ ├── epfl-optml-lecture04.png │ │ ├── epfl-optml-lecture05.png │ │ ├── epfl-optml-lecture06.png │ │ ├── epfl-optml-lecture07.png │ │ ├── epfl-optml-lecture08.png │ │ ├── epfl-optml-lecture09.png │ │ ├── epfl-optml-lecture10.png │ │ ├── epfl-optml-lecture11.png │ │ ├── epfl-optml-lecture12.png │ │ ├── epfl-optml-notes.png │ │ ├── gradient_descent.png │ │ ├── hessian_eigenvalues.png │ │ ├── loss_landscape.png │ │ ├── momentum.png │ │ ├── momentum.svg │ │ ├── nesterov.png │ │ ├── optimization-algorithms-ut-austin.png │ │ ├── optimization-machine-learning.png │ │ ├── optimization-methods-kit.png │ │ ├── optimizer-preconditioners-main.png │ │ ├── optimizer-preconditioners-mobile.png │ │ ├── quasi_newton.png │ │ ├── saddle_point.png │ │ ├── saddle_point.svg │ │ ├── stanford-ee364a.jpg │ │ └── stanford-ee364b.jpg └── js │ ├── benchmarks-complete-data.js │ ├── benchmarks-data.js │ ├── conferences-data.js │ ├── implementations-data.js │ ├── layout.js │ ├── optimizers-data.js │ ├── papers-data.js │ ├── schedulers-data.js │ └── utils.js ├── benchmark ├── tab_app_hyper_cifar.tex ├── tab_c4_pt_full.tex ├── tab_cifar100_backbone.tex ├── tab_coco.tex └── tab_in1k.tex ├── index.html ├── pages ├── about_us.html ├── benchmarks.html ├── blogs.html ├── community.html ├── conferences.html ├── experiments.html ├── implementations.html ├── optimizers.html ├── packages.html ├── papers.html ├── precision.html ├── schedulers.html ├── training_strategy.html ├── tutorials.html ├── tutorials │ └── basic_knowledge.html └── visualizations.html └── scripts └── viz_optimizers.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/.gitignore -------------------------------------------------------------------------------- /Optimizers/NAG.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/NAG.py -------------------------------------------------------------------------------- /Optimizers/accsgd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/accsgd.py -------------------------------------------------------------------------------- /Optimizers/adabelief.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adabelief.py -------------------------------------------------------------------------------- /Optimizers/adabound.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adabound.py -------------------------------------------------------------------------------- /Optimizers/adadelta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adadelta.py -------------------------------------------------------------------------------- /Optimizers/adafactor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adafactor.py -------------------------------------------------------------------------------- /Optimizers/adagrad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adagrad.py -------------------------------------------------------------------------------- /Optimizers/adahessian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adahessian.py -------------------------------------------------------------------------------- /Optimizers/adai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adai.py -------------------------------------------------------------------------------- /Optimizers/adam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adam.py -------------------------------------------------------------------------------- /Optimizers/adam_mini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adam_mini.py -------------------------------------------------------------------------------- /Optimizers/adamax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adamax.py -------------------------------------------------------------------------------- /Optimizers/adamod.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adamod.py -------------------------------------------------------------------------------- /Optimizers/adamp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adamp.py -------------------------------------------------------------------------------- /Optimizers/adamw.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adamw.py -------------------------------------------------------------------------------- /Optimizers/adan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/adan.py -------------------------------------------------------------------------------- /Optimizers/aggmo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/aggmo.py -------------------------------------------------------------------------------- /Optimizers/apollo.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Optimizers/came.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/came.py -------------------------------------------------------------------------------- /Optimizers/diffgrad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/diffgrad.py -------------------------------------------------------------------------------- /Optimizers/dummy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/dummy.py -------------------------------------------------------------------------------- /Optimizers/lamb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/lamb.py -------------------------------------------------------------------------------- /Optimizers/lars.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/lars.py -------------------------------------------------------------------------------- /Optimizers/lion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/lion.py -------------------------------------------------------------------------------- /Optimizers/lookahead.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/lookahead.py -------------------------------------------------------------------------------- /Optimizers/madgrad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/madgrad.py -------------------------------------------------------------------------------- /Optimizers/nadam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/nadam.py -------------------------------------------------------------------------------- /Optimizers/novograd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/novograd.py -------------------------------------------------------------------------------- /Optimizers/pid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/pid.py -------------------------------------------------------------------------------- /Optimizers/prodigy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/prodigy.py -------------------------------------------------------------------------------- /Optimizers/qhadam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/qhadam.py -------------------------------------------------------------------------------- /Optimizers/qhm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/qhm.py -------------------------------------------------------------------------------- /Optimizers/radam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/radam.py -------------------------------------------------------------------------------- /Optimizers/ranger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/ranger.py -------------------------------------------------------------------------------- /Optimizers/rmsprop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/rmsprop.py -------------------------------------------------------------------------------- /Optimizers/rprop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/rprop.py -------------------------------------------------------------------------------- /Optimizers/sam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/sam.py -------------------------------------------------------------------------------- /Optimizers/sgd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/sgd.py -------------------------------------------------------------------------------- /Optimizers/sgdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/sgdp.py -------------------------------------------------------------------------------- /Optimizers/sgdw.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/sgdw.py -------------------------------------------------------------------------------- /Optimizers/shampoo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/shampoo.py -------------------------------------------------------------------------------- /Optimizers/sophia.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/sophia.py -------------------------------------------------------------------------------- /Optimizers/svrg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/svrg.py -------------------------------------------------------------------------------- /Optimizers/swats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/swats.py -------------------------------------------------------------------------------- /Optimizers/yogi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Optimizers/yogi.py -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/README.md -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture-notes.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture-notes.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture01.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture01.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture02.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture02.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture03.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture03.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture04.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture04.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture05.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture05.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture06.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture06.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture07.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture07.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture08.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture08.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture09.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture09.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture10.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture10.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture11.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture11.pdf -------------------------------------------------------------------------------- /Tutorial/EPFL_optML/lecture12.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/EPFL_optML/lecture12.pdf -------------------------------------------------------------------------------- /Tutorial/Presentation___Data-centric_Methods__mobile.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/Presentation___Data-centric_Methods__mobile.pdf -------------------------------------------------------------------------------- /Tutorial/Presentation___Optimizer_Preconditioners__main.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/Presentation___Optimizer_Preconditioners__main.pdf -------------------------------------------------------------------------------- /Tutorial/Presentation___Optimizer_Preconditioners__mobile.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/Presentation___Optimizer_Preconditioners__mobile.pdf -------------------------------------------------------------------------------- /Tutorial/slides-summer-school.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/Tutorial/slides-summer-school.pdf -------------------------------------------------------------------------------- /assets/css/styles.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/css/styles.css -------------------------------------------------------------------------------- /assets/img/blogs/lora-weight-decay-2025.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/blogs/lora-weight-decay-2025.svg -------------------------------------------------------------------------------- /assets/img/blogs/lora-without-regret-2025.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/blogs/lora-without-regret-2025.png -------------------------------------------------------------------------------- /assets/img/blogs/modular-manifolds-2025.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/blogs/modular-manifolds-2025.png -------------------------------------------------------------------------------- /assets/img/blogs/optimizer-choice-training-2024.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/blogs/optimizer-choice-training-2024.jpg -------------------------------------------------------------------------------- /assets/img/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/logo.png -------------------------------------------------------------------------------- /assets/img/rastrigin.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/rastrigin.png -------------------------------------------------------------------------------- /assets/img/rosenbrock.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/rosenbrock.jpg -------------------------------------------------------------------------------- /assets/img/scalingopt.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/scalingopt.png -------------------------------------------------------------------------------- /assets/img/tianshijing.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tianshijing.png -------------------------------------------------------------------------------- /assets/img/tutorials/cmu-convex-opt-2018.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/cmu-convex-opt-2018.gif -------------------------------------------------------------------------------- /assets/img/tutorials/cmu-convex-opt-2018.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/cmu-convex-opt-2018.png -------------------------------------------------------------------------------- /assets/img/tutorials/convex-optimization-ahmad-bazzi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/convex-optimization-ahmad-bazzi.png -------------------------------------------------------------------------------- /assets/img/tutorials/data-centric-methods.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/data-centric-methods.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture01.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture01.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture02.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture02.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture03.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture03.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture04.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture04.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture05.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture05.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture06.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture06.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture07.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture07.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture08.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture08.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture09.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture09.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture10.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture10.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture11.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture11.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-lecture12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-lecture12.png -------------------------------------------------------------------------------- /assets/img/tutorials/epfl-optml-notes.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/epfl-optml-notes.png -------------------------------------------------------------------------------- /assets/img/tutorials/gradient_descent.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/gradient_descent.png -------------------------------------------------------------------------------- /assets/img/tutorials/hessian_eigenvalues.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/hessian_eigenvalues.png -------------------------------------------------------------------------------- /assets/img/tutorials/loss_landscape.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/loss_landscape.png -------------------------------------------------------------------------------- /assets/img/tutorials/momentum.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/momentum.png -------------------------------------------------------------------------------- /assets/img/tutorials/momentum.svg: -------------------------------------------------------------------------------- 1 | 404: Not Found -------------------------------------------------------------------------------- /assets/img/tutorials/nesterov.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/nesterov.png -------------------------------------------------------------------------------- /assets/img/tutorials/optimization-algorithms-ut-austin.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/optimization-algorithms-ut-austin.png -------------------------------------------------------------------------------- /assets/img/tutorials/optimization-machine-learning.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/optimization-machine-learning.png -------------------------------------------------------------------------------- /assets/img/tutorials/optimization-methods-kit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/optimization-methods-kit.png -------------------------------------------------------------------------------- /assets/img/tutorials/optimizer-preconditioners-main.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/optimizer-preconditioners-main.png -------------------------------------------------------------------------------- /assets/img/tutorials/optimizer-preconditioners-mobile.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/optimizer-preconditioners-mobile.png -------------------------------------------------------------------------------- /assets/img/tutorials/quasi_newton.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/quasi_newton.png -------------------------------------------------------------------------------- /assets/img/tutorials/saddle_point.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/saddle_point.png -------------------------------------------------------------------------------- /assets/img/tutorials/saddle_point.svg: -------------------------------------------------------------------------------- 1 | 404: Not Found -------------------------------------------------------------------------------- /assets/img/tutorials/stanford-ee364a.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/stanford-ee364a.jpg -------------------------------------------------------------------------------- /assets/img/tutorials/stanford-ee364b.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/img/tutorials/stanford-ee364b.jpg -------------------------------------------------------------------------------- /assets/js/benchmarks-complete-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/benchmarks-complete-data.js -------------------------------------------------------------------------------- /assets/js/benchmarks-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/benchmarks-data.js -------------------------------------------------------------------------------- /assets/js/conferences-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/conferences-data.js -------------------------------------------------------------------------------- /assets/js/implementations-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/implementations-data.js -------------------------------------------------------------------------------- /assets/js/layout.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/layout.js -------------------------------------------------------------------------------- /assets/js/optimizers-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/optimizers-data.js -------------------------------------------------------------------------------- /assets/js/papers-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/papers-data.js -------------------------------------------------------------------------------- /assets/js/schedulers-data.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/schedulers-data.js -------------------------------------------------------------------------------- /assets/js/utils.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/assets/js/utils.js -------------------------------------------------------------------------------- /benchmark/tab_app_hyper_cifar.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/benchmark/tab_app_hyper_cifar.tex -------------------------------------------------------------------------------- /benchmark/tab_c4_pt_full.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/benchmark/tab_c4_pt_full.tex -------------------------------------------------------------------------------- /benchmark/tab_cifar100_backbone.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/benchmark/tab_cifar100_backbone.tex -------------------------------------------------------------------------------- /benchmark/tab_coco.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/benchmark/tab_coco.tex -------------------------------------------------------------------------------- /benchmark/tab_in1k.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/benchmark/tab_in1k.tex -------------------------------------------------------------------------------- /index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/index.html -------------------------------------------------------------------------------- /pages/about_us.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/about_us.html -------------------------------------------------------------------------------- /pages/benchmarks.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/benchmarks.html -------------------------------------------------------------------------------- /pages/blogs.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/blogs.html -------------------------------------------------------------------------------- /pages/community.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/community.html -------------------------------------------------------------------------------- /pages/conferences.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/conferences.html -------------------------------------------------------------------------------- /pages/experiments.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/experiments.html -------------------------------------------------------------------------------- /pages/implementations.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/implementations.html -------------------------------------------------------------------------------- /pages/optimizers.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/optimizers.html -------------------------------------------------------------------------------- /pages/packages.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/packages.html -------------------------------------------------------------------------------- /pages/papers.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/papers.html -------------------------------------------------------------------------------- /pages/precision.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/precision.html -------------------------------------------------------------------------------- /pages/schedulers.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/schedulers.html -------------------------------------------------------------------------------- /pages/training_strategy.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/training_strategy.html -------------------------------------------------------------------------------- /pages/tutorials.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/tutorials.html -------------------------------------------------------------------------------- /pages/tutorials/basic_knowledge.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/tutorials/basic_knowledge.html -------------------------------------------------------------------------------- /pages/visualizations.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/pages/visualizations.html -------------------------------------------------------------------------------- /scripts/viz_optimizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tianshijing/ScalingOpt/HEAD/scripts/viz_optimizers.py --------------------------------------------------------------------------------