% arXiv preprint: the identifier lives in the eprint fields instead of a fake journal name.
@misc{yaras2023law,
  author        = {Yaras, Can and Wang, Peng and Hu, Wei and Zhu, Zhihui and Balzano, Laura and Qu, Qing},
  title         = {The Law of Parsimony in Gradient Descent for Learning Deep Linear Networks},
  year          = {2023},
  eprint        = {2306.01154},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2306.01154},
}