eval_loss = 2.83157302924993 perplexity = tensor(16.9721)