\documentclass[preprint,review,12pt]{elsarticle} \usepackage[utf8]{inputenc} \usepackage{amsmath,amssymb,amsfonts,amsthm} \usepackage{graphicx} \usepackage{hyperref} \newtheorem{theorem}{Theorem} \newtheorem{lemma}{Lemma} \newtheorem{definition}{Definition} \journal{Journal of Theoretical Biology} \begin{document} \begin{frontmatter} \title{Information Bottlenecks and Bounded Rational Decision Making: A Mathematical Proof of Fitness Beats Truth (Rapid Communication)} \author[1]{Antigravity} \address[1]{Institute for Advanced Cybernetic Physics} \begin{abstract} Evolutionary epistemology, particularly the "Fitness Beats Truth" (FBT) theorem, asserts that biological perception is tuned strictly to utility rather than objective reality. In this Letter, we provide a formal, rigorous mathematical proof of FBT using the framework of Bounded Rational Decision Making and the Information Bottleneck method. We define the objective world as a Riemannian manifold $\mathcal{M}$ endowed with a prior probability measure $\mu(x)$. By defining biological distortion directly as the expected utility loss under an optimal action policy, we formulate perception as a joint optimization over the perceptual encoder $p(y|x)$ and the actor policy $a(y)$ subject to a strict Shannon channel capacity bound $I(X;Y) \le C$. We mathematically prove that for generic fitness landscapes where the level sets of fitness do not align with the distance balls of the metric $g$, the optimal perceptual channel must actively destroy structural isomorphism to minimize the Lagrangian cost. \end{abstract} \begin{keyword} Evolutionary Game Theory \sep Information Bottleneck \sep Perception \sep Bounded Rationality \end{keyword} \end{frontmatter} \section{Introduction} Standard Rate-Distortion theory assumes an objective distortion metric $D(x,y)$ independent of the perceptual channel. However, biological perception is a decision-theoretic problem. The true biological cost of a perception depends entirely on the action $a(y)$ the organism subsequently takes. Thus, subjective inference directly defines the biological cost. \section{Formal Definitions and The Joint Optimization Model} \begin{definition}[State Space and Measure] Let $\mathcal{M}$ be a compact Riemannian manifold representing objective world states, endowed with metric $g$ and a prior probability measure $\mu(x)$ absolutely continuous with respect to the volume form. Let $\mathcal{Y}$ be a finite set of perceptual states. Let $\mathcal{A}$ be the space of actions. \end{definition} \begin{definition}[Fitness Landscape] Let $F: \mathcal{M} \times \mathcal{A} \to \mathbb{R}$ be a smooth fitness function mapping a world state and an action to a biological payoff. \end{definition} The organism possesses a bounded channel capacity $I(X;Y) \le C$. The optimal action policy maximizes expected fitness given the perceptual posterior: \begin{equation} a^*(y) = \arg\max_{a \in \mathcal{A}} \int_{\mathcal{M}} F(x, a) p(x|y) d\mu(x) \end{equation} The organism minimizes the Lagrangian functional $\mathcal{L}$: \begin{equation} \mathcal{L}[p(y|x), a(y)] = \int_{\mathcal{M}} \sum_{y} p(y|x) [-F(x, a(y))] d\mu(x) + \frac{1}{\beta} I(X;Y) \end{equation} \section{Minimizing Distortion Destroys Isomorphism} \begin{lemma} For a generic smooth fitness landscape $F(x, a)$, the level sets of $F$ do not align with the distance balls defined by the Riemannian metric $g$. Therefore, there exist points $x_1, x_2 \in \mathcal{M}$ separated by a large geodesic distance such that $a^*(y_1) = a^*(y_2)$ maximizes fitness. \end{lemma} \begin{theorem} Given a strict capacity bound $C < H(X)$ and a generic fitness landscape $F$, the encoder $p(y|x)$ minimizing $\mathcal{L}$ must violate structural isomorphism. \end{theorem} \begin{proof} Suppose $p(y|x)$ strictly preserves structural isomorphism. By Lemma 1, if distant points $x_1$ and $x_2$ share identical optimal actions $a^*$, distinguishing them requires allocating mutual information $\Delta I > 0$. Because the actions are identical, the expected fitness $\mathbb{E}[F]$ remains constant whether they are distinguished or clustered. However, distinguishing them strictly increases the channel cost $\frac{1}{\beta} I(X;Y)$. To minimize $\mathcal{L}$, the optimal encoder must actively collapse topologically distant points in $\mathcal{M}$ that share fitness level sets, obliterating structural isomorphism. \end{proof} \bibliographystyle{elsarticle-num} \begin{thebibliography}{10} \bibitem{Hoffman2015} D. D. Hoffman, M. Singh, C. Prakash, The interface theory of perception, Psychonomic Bulletin \& Review 22 (2015) 1480-1506. \bibitem{Ortega2013} P. A. Ortega, D. A. Braun, Thermodynamics as a theory of decision-making with information-processing costs, Proceedings of the Royal Society A 469 (2013) 20120683. \end{thebibliography} \end{document}