eval_loss = 2.7945688366889954 perplexity = tensor(16.3556)