eval_loss = 1.8451406680773768 perplexity = tensor(6.3290)