\section{Higher Derivatives}
\label{section:higher-derivatives}

\begin{definition}[$n$-Fold Differentiability]
\label{definition:n-differentiable-sets}
    Let $E, F$ be TVSs over $K \in \RC$ with $F$ being separated, $\sigma \subset \mathfrak{B}(E)$ be a covering ideal, $\mathcal{H} \subset B_\sigma(E; F)$ be a subspace, and $\mathcal{R}_\sigma = \mathcal{R}_\sigma(E; F)$.

    Let $U \subset E$ be open, $f: U \to F$, $x_0 \in U$, and $n > 1$, then $f$ is \textbf{$n$-fold $\sigma$-differentiable at $x_0$} if
    \begin{enumerate}
        \item There exists $V \in \cn_E(x_0)$ such that $f$ is $(n-1)$-fold differentiable on $V$.
        \item The derivative $D_\sigma^{n-1}f: U \to B^{n-1}_\sigma(E; F)$ is derivative at $x_0$.
    \end{enumerate}

    In which case, $D_\sigma(D_\sigma^{n-1}f)(x_0) \in L(E; B^{n-1}_\sigma(E; F))$ is the \textbf{$n$-fold $\sigma$-derivative of $f$ at $x_0$}.

    The mapping $f: U \to F$ is \textbf{$n$-fold $\sigma$-differentiable on $U$} if it is $n$-fold $\sigma$-differentiable at every point in $U$. Under the identification $B_\sigma(E; B^{n-1}_\sigma(E; F)) = B_\sigma^{n}(E; F)$ given by \autoref{proposition:multilinear-identify},
    \[
    D_\sigma^{n}f: U \to B^{n-1}_\sigma(E; F)
    \]

    is the \textbf{$n$-fold $\sigma$-derivative of $f$ at $x_0$}.
\end{definition}

\begin{theorem}[Symmetry of Higher Derivatives]
\label{theorem:derivative-symmetric-frechet}
    Let $E, F$ be Banach spaces, $U \subset E$ be open, $n \in \natp$, and $f: U \to F$ be a function $n$-times Fréchet-differentiable at $x \in U$, then $D^nf(x) \in L^n(E; F)$ is symmetric.
\end{theorem}
\begin{proof}[Proof {{\cite[Theorem 5.1.1]{Cartan}}}. ]
    First suppose that $n = 2$. Let $r > 0$ such that $B(x, 2r) \subset U$, and define $A: B_E(0, r) \times B_E(0, r) \to F$ by
    \[
    A(h, k) = f(x + h + k) - f(x + h) - f(x + k) + f(x)
    \]

    then there exists $r_1 \in \mathcal{R}_{\mathfrak{B}(E)}$ such that
    \begin{align*}
        A(h, k) &= Df(x + h)(k) + Df(x)(k) \\
        &+ [f(x + h + k) - f(x + h) - Df(x + h)(k)] \\
        &- [f(x + k) - f(x) - Df(x)(k)] \\
        &= D^2f(x)(h, k) + r_1(h) \cdot Df(x)(k) \\
        &+ [f(x + h + k) - f(x + h) - Df(x + h)(k)] \\
        &- [f(x + k) - f(x) - Df(x)(k)] \\
    \end{align*}
    Let $B_h: B_E(0, r) \to F$ be defined by
    \begin{align*}
    B_h(k) &= f(x + h + k) - f(x + k) \\
    &- Df(x + h)(k) + Df(x)(k)
    \end{align*}
    

    then
    \begin{align*}
    B_h(k) - B_h(0) &= f(x + h + k) - f(x + k) \\
    &- Df(x + h)(k) + Df(x)(k) \\
    &-f(x + h) + f(x)
    \end{align*}
    

    Now, there exists $r_2, r_3 \in \mathcal{R}_{\mathfrak{B}(E)}$ such that for any $k \in B(0, r)$,
    \begin{align*}
    DB_h(k) &= Df(x + h + k) - Df(x + k) - Df(x + h) + Df(x) \\
    &= D^2f(x)(h + k) + Df(x) - D^2f(x)(h) \\
    &- Df(x) - D^2f(x)(k) + r_2(k) + r_3(h) \\
    &=r_2(k) + r_3(h)
    \end{align*}

    By the \hyperref[Mean Value Theorem]{theorem:mean-value-theorem},
    \[
    \norm{B_h(k) - B_h(0)}_F \le \norm{k}_E \cdot o(\norm{k}_E + \norm{h}_E)
    \]

    As the above argument is symmetric,
    \[
    \norm{D^2f(x)(h, k) - D^2f(x)(k, h)}_F \le \norm{k}_E \cdot o(\norm{k}_E + \norm{h}_E)
    \]

    so $D^2f(x)(h, k) - D^2f(x)(k, h) = 0$.

    Now suppose that the proposition holds for $n$. Identify $L^n(E; F) = L^{2}(E; L^{n-2}(E; F))$, then for any $\seqf[n]{x_j} \subset E$,
    \begin{align*}
    Df(x)(x_1, \cdots, x_n) &= Df(x)(x_1, x_2)(x_3, \cdots, x_n) \\
    &= Df(x)(x_2, x_1)(x_3, \cdots, x_n) \\
    &= Df(x)(x_2, x_1, x_3, \cdots, x_n)
    \end{align*}
    

    Since any element $\sigma \in S_n$ that does not fix $x_1$ is the composition of the transposition $(12)$ and an element that fixes $x_1$, $Df(x)$ is symmetric.
\end{proof}

\begin{theorem}[Symmetry of Higher Derivatives]
\label{theorem:derivative-symmetric}
    Let $E$ be a topological vector space over $K \in \RC$, $\sigma \subset \mathfrak{B}(E)$ be an ideal that includes all bounded sets contained in finite-dimensional spaces, $F$ be a separated locally convex space over $K$, $U \subset E$ be open, and $f: E \to F$ be $n$-fold $\sigma$-differentiable at $x_0 \in U$, then $D_\sigma^nf(x_0) \in B_\sigma^n(E; F)$ is symmetric.
\end{theorem}
\begin{proof}[Proof {{\cite[Proposition 4.5.14]{Bogachev}}}. ]
    Let $\seqf{h_j} \subset E$, $E_0$ be the subspace generated by $\seqf{h_j}$, and $g = f|_{E_0 \cap U}: E_0 \cap U \to F$. Since $\sigma$ includes all bounded sets contained in finite-dimensional spaces, for any $\phi \in F^*$, the mapping $\phi \circ g: E_0 \cap U \to K$ is $n$-times Fréchet-differentiable, with
    \[
    D_{\mathfrak{B}(E_0)}^n(\phi \circ g)(x_0) = \phi \circ D_\sigma^n g(x_0)
    \]

    by the \hyperref[chain rule]{proposition:chain-rule-sets-conditions}. By \autoref{theorem:derivative-symmetric-frechet}, $\phi \circ D_\sigma^n g(x_0) \in L^n(E_0; K)$ is symmetric. As this holds for any $\seqf{h_j} \subset E$ and $\phi \in F^*$, $D_{\sigma}^n g(x_0) \in B_\sigma^n(E; F)$ is symmetric by the \hyperref[Hahn-Banach theorem]{proposition:hahn-banach-utility}.
\end{proof}

\begin{proposition}[Power Rule]
\label{proposition:multilinear-derivative}
    Let $E$ be a topological vector space, $\sigma \subset \mathfrak{B}(E)$ be an ideal that includes all bounded sets contained in finite-dimensional spaces, $F$ be a Hausdorff locally convex space, and
    \[
    T \in \underbrace{L(E; L(E; \cdots L(E; F) \cdots ))}_{n \text{ times}} \subset B^n(E; F)
    \]

    be symmetric. For any $x \in E$ and $1 \le k \le n$, let $x^{(k)}$ denote the tuple of $x$ repeated $k$ times, then:
    \begin{enumerate}
        \item The mapping $f: E \to F \quad x \mapsto T(x^{(n)})$ is infinitely $\sigma$-differentiable on $E$.
        \item For each $1 \le k \le n$ and $x, h \in E$,
        \[
        Df(x)(h_1, \cdots, h_k) = \frac{n!}{(n-k)!} T(x^{(n-k)}, h_1, \cdots, h_k)
        \]

        In particular, $D^kf = n! \cdot T$.
        \item For each $k > n$ and $x \in E$, $Df(x) = 0$.
    \end{enumerate}
\end{proposition}
\begin{proof}
    Suppose inductively that (2) holds for $0 \le k \le n$. Let $G =  B^{k}_\sigma(E; F)$, then $D^k_\sigma f \in B^{n-k}_\sigma(E; G)$ under the identification $B^n_\sigma(E; F) = B^{n-k}_\sigma(E; B^k_\sigma(E; F))$ in \autoref{proposition:multilinear-identify}. By \autoref{theorem:derivative-symmetric}, $D^k_\sigma f$ is also symmetric, so using the Binomial formula,
    \begin{align*}
        D^k_\sigma f(x + h) &= \sum_{r = 0}^{n-k}{n - k \choose r}D^k_\sigma f(x^{(n-k-r)}, h^{(r)}) \\
        &= f(x) + (n-k)D^k_\sigma f(x^{(n-k-1)}, h) \\
        &+ \underbrace{\sum_{r = 2}^{n-k}{n - k \choose r}D^k_\sigma f(x^{(n-k-r)}, h^{(r)})}_{r(h)}
    \end{align*}

    For each $k \ge 2$, let $A \in \sigma$ and $U \in \cn_F(0)$, then since $D^k_\sigma f \in B^{n-k}_\sigma(E; F)$, there exists $t > 0$ such that
    \[
    \frac{D^k_\sigma f(x^{(n-k)}, (sA)^{(k)})}{t} = s^{k-1}D^k_\sigma f(x^{(n-k)}, A^{(k)}) \subset U
    \]

    for all $s \in (0, t)$. Hence $r \in \mathcal{R}_\sigma(E; G)$, and
    \[
    D^{k+1}_\sigma f(x + h) = f(x) + \frac{n!}{(n-k-1)!}T(x^{(n-k-1)}, h_1, \cdots, h_{k+1}) + r(h)
    \]

    by the inductive hypothesis.

    (3): Since $D^n_\sigma f$ is constant, $D^k_\sigma f = 0$ for all $k > n$.
\end{proof}