eval_loss = 1.604232376272028 perplexity = tensor(4.9740)