pub fn evaluate_dataset( tokenizer: &mut Tokenizer, dataset: &TestDataset, ) -> EvaluationResult
주어진 토크나이저로 테스트 데이터셋을 평가하고 그 결과를 `EvaluationResult`로 반환한다.
tokenizer: 평가에 사용할 토크나이저 (`&mut Tokenizer`, 가변 참조로 전달)
dataset: 평가 대상 테스트 데이터셋 (`&TestDataset`, 불변 참조로 전달)
반환값: 평가 결과 (`EvaluationResult`)