SauerkrautLM's Multi-Phase Spectrum Training: A Technical Deep Dive
•
5
@staticmethod
def marchenko_pastur_threshold(sigma, n, m):
beta = n / m if n < m else m / n
threshold = sigma * np.sqrt((1 + np.sqrt(beta))**2)
return thr