Spaces:

Booguy
/

linguask

Build error

App Files Files Community

linguask / tests /test_text_cleaning.py

GitHub Action

refs/heads/ci-cd/hugging-face

8b414b0 almost 2 years ago

history blame contribute delete

483 Bytes

	from src.data_reader import load_train_test_df
	from src.spell_checker import SmartSpellChecker
	from src.text_preprocessings.spellcheck_preprocessing import \
	SpellcheckTextPreprocessor


	def test_text_cleaning():
	    """Check that spellcheck preprocessing yields the expected number of texts.

	    Loads the train frame with ``load_train_test_df(is_testing=True)``,
	    passes its ``full_text`` column through a ``SpellcheckTextPreprocessor``
	    built around a ``SmartSpellChecker``, and asserts on the length of the
	    result.
	    """
	    # Presumably the number of rows in the testing fixture -- confirm
	    # against the data that ``is_testing=True`` loads.
	    expected_count = 5

	    # Only the train frame is needed; the second returned value is ignored.
	    train_frame, _ = load_train_test_df(is_testing=True)

	    preprocessor = SpellcheckTextPreprocessor(SmartSpellChecker())
	    processed = preprocessor.preprocess_data(train_frame.full_text)

	    assert len(processed) == expected_count