Search results for key=KrH1992 : 1 match found.

Refereed full papers (journals, book chapters, international conferences)

1992

% Krogh and Hertz (1992), weight decay and generalization. Published in the
% NIPS proceedings series, so it is recorded as a conference paper
% (inproceedings + booktitle) rather than as a journal article.
% vgclass / vgproject are local classification fields ignored by standard styles.
@inproceedings{KrH1992,
	vgclass =	{refpap},
	vgproject =	{nn},
	author =	{Krogh, Anders and Hertz, John A.},
	title =	{A Simple Weight Decay Can Improve Generalization},
	booktitle =	{Advances in Neural Information Processing Systems},
	volume =	{4},
	pages =	{950--957},
	year =	{1992},
	abstract =	{It has been observed in
	numerical simulations that a weight decay can improve generalization in
	a feed forward neural network.  This paper explains why. It is proven
	that a weight decay has two effects in a linear network. First, it
	suppresses any irrelevant components of the weight vector by choosing
	the smallest vector that solves the learning problem. Second, if the
	size is chosen right, a weight decay can suppress some of the effects
	of static noise on the targets, which improves generalization quite a
	lot. It is then shown how to extend these results to networks with
	hidden layers and non-linear units. Finally the theory is confirmed by
	some numerical simulations using the data from NetTalk.},
}