% Conference paper, so it is typed as inproceedings with the venue in
% booktitle rather than journal. The exported title ended in the residue
% "$\backslash$textborn" (presumably a mangled trailing symbol from the
% export); it is dropped because it would print literally.
@inproceedings{bender2021dangers,
  author    = {Bender, Emily M. and Gebru, Timnit and McMillan-Major, Angelina and Shmitchell, Shmargaret},
  title     = {On the Dangers of Stochastic Parrots: Can Language Models Be Too Big?},
  booktitle = {Proceedings of the 2021 {ACM} Conference on Fairness, Accountability, and Transparency},
  pages     = {610--623},
  year      = {2021},
}

% Paper in a conference proceedings series: typed as inproceedings with the
% series name in booktitle (it was stored in journal). Title and venue are
% entered in Title Case so styles can down-case them; the reverse is not
% possible.
@inproceedings{vaswani2017attention,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N. and Kaiser, {\L}ukasz and Polosukhin, Illia},
  title     = {Attention Is All You Need},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {30},
  year      = {2017},
}

% Journal article. The journal name is printed verbatim by standard styles,
% so its capitalisation is restored here; the title is stored in Title Case
% and left for the style to down-case if it wants to.
@article{shannon1948mathematical,
  author    = {Shannon, Claude E.},
  title     = {A Mathematical Theory of Communication},
  journal   = {The Bell System Technical Journal},
  volume    = {27},
  number    = {3},
  pages     = {379--423},
  year      = {1948},
  publisher = {Nokia Bell Labs},
}

% Book. Publisher name capitalisation corrected ("MIT press" in the export);
% the acronym is braced so no style can lower-case it. Book title stored in
% Title Case.
@book{kelso1995dynamic,
  author    = {Kelso, J. A. Scott},
  title     = {Dynamic Patterns: The Self-Organization of Brain and Behavior},
  publisher = {{MIT} Press},
  year      = {1995},
}

% Journal article. Field values are unchanged; only order and layout differ.
% NOTE(review): pages holds a single identifier rather than a range,
% presumably the journal's article number. Confirm against the publisher
% record.
@article{levin2021basal,
  author    = {Levin, Michael},
  title     = {Basal cognition: multicellular morphological networks},
  journal   = {Philosophical Transactions of the Royal Society B},
  publisher = {The Royal Society},
  year      = {2021},
  volume    = {376},
  number    = {1820},
  pages     = {20190757},
}

% Book. Field values are unchanged; only order and layout differ.
% NOTE(review): the citation key carries 2013 while the year field says 2015.
% The key is left as-is so existing citations keep resolving; confirm which
% year is intended.
@book{clark2013surfing,
  author    = {Clark, Andy},
  title     = {Surfing uncertainty: Prediction, action, and the embodied mind},
  publisher = {Oxford University Press},
  year      = {2015},
}

% Journal article. The journal name is printed verbatim by standard styles,
% so its capitalisation is restored here; the title is stored in Title Case
% and left for the style to down-case if it wants to.
@article{friston2010free,
  author    = {Friston, Karl},
  title     = {The Free-Energy Principle: A Unified Brain Theory?},
  journal   = {Nature Reviews Neuroscience},
  volume    = {11},
  number    = {2},
  pages     = {127--138},
  year      = {2010},
  publisher = {Nature Publishing Group},
}