trainer = HiddenMarkovModelTrainer(tag_set, list(symbols))
print('Training (unsupervised, %d sentences)...' % unsupervised)
# it's rather slow - so only use 10 samples by default
unlabeled = _untag(sentences[test + supervised :])
print unlabeled[0]
hmm = trainer.train_unsupervised(
unlabeled, max_iterations=max_iterations
)
symbols 要和 unlabeled 裏面的字符編碼一致,不然會報 KeyError