eval_loss = 2.418710708618164 perplexity = tensor(11.2314)