eval_loss = 2.4966046573928975 perplexity = tensor(12.1412)