eval_loss = 1.7592002375037978 perplexity = tensor(5.8078)