Add post on Kolmogorov-Arnold Networks
This commit is contained in:
parent
fe066d13ed
commit
681974170e
2 changed files with 127 additions and 0 deletions
|
@ -740,3 +740,49 @@
|
|||
volume = 21,
|
||||
year = 1999,
|
||||
}
|
||||
|
||||
@misc{liu2024_kan,
|
||||
author = {Liu, Ziming and Wang, Yixuan and Vaidya, Sachin and
|
||||
Ruehle, Fabian and Halverson, James and Soljačić,
|
||||
Marin and Hou, Thomas Y. and Tegmark, Max},
|
||||
title = {{KAN}: {Kolmogorov}-{Arnold} {Networks}},
|
||||
year = 2024,
|
||||
month = may,
|
||||
publisher = {arXiv},
|
||||
doi = {10.48550/arXiv.2404.19756},
|
||||
url = {http://arxiv.org/abs/2404.19756},
|
||||
note = {arXiv:2404.19756 [cond-mat, stat]},
|
||||
keywords = {Computer Science - Machine Learning, Condensed
|
||||
Matter - Disordered Systems and Neural Networks,
|
||||
Computer Science - Artificial Intelligence,
|
||||
Statistics - Machine Learning},
|
||||
}
|
||||
|
||||
@article{chenNeuralOrdinaryDifferential2018,
|
||||
archivePrefix = {arXiv},
|
||||
eprinttype = {arxiv},
|
||||
eprint = {1806.07366},
|
||||
primaryClass = {cs, stat},
|
||||
title = {Neural {{Ordinary Differential Equations}}},
|
||||
url = {http://arxiv.org/abs/1806.07366},
|
||||
abstract = {We introduce a new family of deep neural network models. Instead of specifying a discrete sequence of hidden layers, we parameterize the derivative of the hidden state using a neural network. The output of the network is computed using a black-box differential equation solver. These continuous-depth models have constant memory cost, adapt their evaluation strategy to each input, and can explicitly trade numerical precision for speed. We demonstrate these properties in continuous-depth residual networks and continuous-time latent variable models. We also construct continuous normalizing flows, a generative model that can train by maximum likelihood, without partitioning or ordering the data dimensions. For training, we show how to scalably backpropagate through any ODE solver, without access to its internal operations. This allows end-to-end training of ODEs within larger models.},
|
||||
urldate = {2019-01-05},
|
||||
date = {2018-06-19},
|
||||
keywords = {Statistics - Machine Learning,Computer Science - Artificial Intelligence,Computer Science - Machine Learning},
|
||||
author = {Chen, Ricky T. Q. and Rubanova, Yulia and Bettencourt, Jesse and Duvenaud, David},
|
||||
file = {/home/dimitri/Nextcloud/Zotero/storage/26D4Y3GG/Chen et al. - 2018 - Neural Ordinary Differential Equations.pdf;/home/dimitri/Nextcloud/Zotero/storage/RNXT4EQV/1806.html}
|
||||
}
|
||||
|
||||
@article{ruthotto2024_differ_equat,
|
||||
author = {Ruthotto, Lars},
|
||||
title = {Differential {Equations} for {Continuous}-{Time}
|
||||
{Deep} {Learning}},
|
||||
journal = {Notices of the American Mathematical Society},
|
||||
year = 2024,
|
||||
month = may,
|
||||
volume = 71,
|
||||
number = 05,
|
||||
issn = {0002-9920, 1088-9477},
|
||||
doi = {10.1090/noti2930},
|
||||
url = {https://www.ams.org/notices/202405/rnoti-p613.pdf},
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue