For each epoch the 60,000 training samples % were used, or for data generation 10,000 steps, each using % batches of 60 generated data points. For each configuration the % model was trained 5 times and the average accuracies at each epoch % are given in (a). As the distribution of $v$ is continuous as well, we get $\mathcal{L}(v_k) = \mathcal{L}(v \mid \xi = \delta l) \forall k \in \kappa : \xi_k \in [\delta l, \delta(l+1))$ for $\delta \leq \delta(\varepsilon, \tilde{\varepsilon})$. Thus, by the law of large numbers, we get \begin{align*} &\sum_{k \in \kappa : \xi_k < T} \varphi(\xi_k, v_k) h_{k,n} \approx\\ &\approx \sum_{\substack{l \in \mathbb{Z} \\ [\delta l, \delta (l+1)) \subseteq [C_{g_\xi}^l,\min\{C_{g_\xi}^u, T \}]}}\left(\mathbb{E}[\varphi(\xi, v)|\xi=\delta l] \stackrel{\mathbb{P}}{\pm} \tilde{\tilde{\varepsilon}}\right) \delta \left(1 \pm \frac{\tilde{\varepsilon}}{g_\xi(\delta l)}\right) \pm \varepsilon \\ &\approx \left(\sum_{\substack{l \in \mathbb{Z} \\ [\delta l, \delta (l+1)) \subseteq [C_{g_\xi}^l,\min\{C_{g_\xi}^u, T \}]}}\mathbb{E}[\varphi(\xi, v)|\xi=\delta l] \delta \stackrel{\mathbb{P}}{\pm}\tilde{\tilde{\varepsilon}} \abs{C_{g_\xi}^u - C_{g_\xi}^l} \right)\\ &\phantom{\approx}\cdot \left(1 \pm \frac{\tilde{\varepsilon}}{g_\xi(\delta l)}\right) \pm \varepsilon \end{align*} As the distribution of $v$ is continuous as well, we get $\mathcal{L}(v_k) = \mathcal{L}(v \mid \xi = \delta l) \forall k \in \kappa : \xi_k \in [\delta l, \delta(l+1))$ for $\delta \leq \delta(\varepsilon, \tilde{\varepsilon})$.
Thus, by the law of large numbers, we get
\begin{align*}
  &\sum_{k \in \kappa : \xi_k < T} \varphi(\xi_k, v_k) h_{k,n} \approx\\
  &\approx \sum_{\substack{l \in \mathbb{Z} \\ [\delta l, \delta (l+1)) \subseteq [C_{g_\xi}^l,\min\{C_{g_\xi}^u, T \}]}}\left(\mathbb{E}[\varphi(\xi, v)|\xi=\delta l] \stackrel{\mathbb{P}}{\pm} \tilde{\tilde{\varepsilon}}\right) \delta \left(1 \pm \frac{\tilde{\varepsilon}}{g_\xi(\delta l)}\right) \pm \varepsilon \\
  &\approx \left(\sum_{\substack{l \in \mathbb{Z} \\ [\delta l, \delta (l+1)) \subseteq [C_{g_\xi}^l,\min\{C_{g_\xi}^u, T \}]}}\mathbb{E}[\varphi(\xi, v)|\xi=\delta l] \delta \stackrel{\mathbb{P}}{\pm}\tilde{\tilde{\varepsilon}} \abs{C_{g_\xi}^u - C_{g_\xi}^l} \right)\\
  &\phantom{\approx}\cdot \left(1 \pm \frac{\tilde{\varepsilon}}{g_\xi(\delta l)}\right) \pm \varepsilon
\end{align*}
\newpage
\end{document}

%%% Local Variables:
%%% mode: latex
%%% TeX-master: t
%%% End: