rpmlint/test/test_spellchecking.py

88 lines
3.1 KiB
Python

import pytest
import rpmlint.spellcheck
from Testing import HAS_CZECH_DICTIONARY, HAS_ENGLISH_DICTIONARY
def get_suggestions(suggestion):
suggestion = suggestion.split(' -> ')[-1]
return sorted(suggestion.split(', '))
@pytest.mark.skipif(not rpmlint.spellcheck.ENCHANT, reason='Missing enchant bindings')
@pytest.mark.skipif(not HAS_ENGLISH_DICTIONARY, reason='Missing English dictionary')
def test_spelldict(capsys):
"""
Check we can init dictionary spellchecker
"""
spell = rpmlint.spellcheck.Spellcheck()
spell._init_checker()
out, err = capsys.readouterr()
assert not out
assert not err
assert 'unable to load spellchecking dictionary' not in err
spell._init_checker('not-existing-language')
out, err = capsys.readouterr()
assert not out
assert 'unable to load spellchecking dictionary' in err
assert 'en_US' in spell._enchant_checkers
assert spell._enchant_checkers['en_US'] is not None
assert 'not-existing-language' not in spell._enchant_checkers
@pytest.mark.skipif(not rpmlint.spellcheck.ENCHANT, reason='Missing enchant bindings')
@pytest.mark.skipif(not HAS_ENGLISH_DICTIONARY, reason='Missing English dictionary')
@pytest.mark.skipif(not HAS_CZECH_DICTIONARY, reason='Missing Czech dictionary')
def test_spellchecking():
"""
Check if we can test the spelling
"""
spell = rpmlint.spellcheck.Spellcheck()
# correct text
text = 'I swear this text is proper English'
result = spell.spell_check(text, 'Description({}):')
assert not result
# english 2 typos
text = "I don't think tihs tetx is correct English"
result = spell.spell_check(text, 'Description({}):')
assert len(result) == 2
assert result['tihs'].startswith('Description(en_US): tihs -> ')
assert get_suggestions(result['tihs']) == ['hits', 'this', 'ties']
# different language, one typo
text = 'Příčerně žluťoučký kůň'
result = spell.spell_check(text, 'Summary({}):', 'cs_CZ')
assert len(result) == 1
assert result['Příčerně'].startswith('Summary(cs_CZ): Příčerně -> ')
assert get_suggestions(result['Příčerně']) == ['Příčeně', 'Příčetně', 'Příšerně']
# non-existing language, should return nothing:
text = 'Weird english text'
result = spell.spell_check(text, 'Summary({}):', 'de_CZ')
assert not result
@pytest.mark.skipif(not rpmlint.spellcheck.ENCHANT, reason='Missing enchant bindings')
@pytest.mark.skipif(not HAS_ENGLISH_DICTIONARY, reason='Missing English dictionary')
def test_pkgname_spellchecking():
spell = rpmlint.spellcheck.Spellcheck()
pkgname = 'python-squeqe'
text = "This package is squeqe's framework helper"
result = spell.spell_check(text, 'Description({}):', 'en_US', pkgname)
assert not result
@pytest.mark.skipif(not rpmlint.spellcheck.ENCHANT, reason='Missing enchant bindings')
def test_ignorelist_spellchecking():
spell = rpmlint.spellcheck.Spellcheck()
ignore = ['wrod', 'žížala']
text = 'This package should not have any typos in wrod or žíŽala'
result = spell.spell_check(text, 'Description({}):', ignored_words=ignore)
assert not result