# HG changeset patch # User Yoshua Bengio # Date 1300590677 14400 # Node ID 677d1b1d8158f0a8935e62aedd2a7c4abd06f7bd # Parent fe98896745a55952011d6cfb35116da4b202a1a3 fits diff -r fe98896745a5 -r 677d1b1d8158 writeup/aistats2011_cameraready.tex --- a/writeup/aistats2011_cameraready.tex Sat Mar 19 23:07:03 2011 -0400 +++ b/writeup/aistats2011_cameraready.tex Sat Mar 19 23:11:17 2011 -0400 @@ -435,14 +435,8 @@ \[ P({\rm class}|{\rm input}=x)={\rm softmax}(b_2+W_2\tanh(b_1+W_1 x)), \] -i.e., two layers, where -\[ - p={\rm softmax}(a) -\] -means that -\[ - p_i(x)=\exp(a_i)/\sum_j \exp(a_j) -\] +i.e., two layers, where $p={\rm softmax}(a)$ means that +$p_i(x)=\exp(a_i)/\sum_j \exp(a_j)$ representing the probability for class $i$, $\tanh$ is the element-wise hyperbolic tangent, $b_i$ are parameter vectors, and $W_i$ are