"""
Python API wrapper for the LanguageTool REST API.

Simple usage::

    >>> from pylanguagetool import api
    >>> api.check(
    ...     'This is a example',
    ...     api_url='https://languagetool.org/api/v2/',
    ...     lang='en-US',
    ... )
    {'software': {'name': 'LanguageTool', 'version': '4.6-SNAPSHOT', 'buildDate': '2019-05-15 19:25', 'apiVersion': 1, 'premium': False, 'premiumHint': 'You might be missing errors only the Premium version can find. Contact us at support<at>languagetoolplus.com.', 'status': ''}, 'warnings': {'incompleteResults': False}, 'language': {'name': 'English (US)', 'code': 'en-US', 'detectedLanguage': {'name': 'English (US)', 'code': 'en-US', 'confidence': 0.561}}, 'matches': [{'message': 'Use "an" instead of \'a\' if the following word starts with a vowel sound, e.g. \'an article\', \'an hour\'', 'shortMessage': 'Wrong article', 'replacements': [{'value': 'an'}], 'offset': 8, 'length': 1, 'context': {'text': 'This is a example', 'offset': 8, 'length': 1}, 'sentence': 'This is a example', 'type': {'typeName': 'Other'}, 'rule': {'id': 'EN_A_VS_AN', 'description': "Use of 'a' vs. 'an'", 'issueType': 'misspelling', 'category': {'id': 'MISC', 'name': 'Miscellaneous'}}, 'ignoreForIncompleteSentence': False, 'contextForSureMatch': 1}]}
"""
import requests
def get_languages(api_url):
    """
    Return supported languages as a list of dictionaries.

    Args:
        api_url (str): API base url. The path ``languages`` is appended to
            it verbatim, so it is expected to end with a slash.

    Returns:
        List[dict]:
            Supported languages as a list of dictionaries.

            Each dictionary contains three keys, ``name``, ``code`` and
            ``longCode``. For example::

                {
                    "name":"English (GB)",
                    "code":"en-GB",
                    "longCode":"en-GB"
                }
    """
    # Fetch the language listing and hand back the decoded JSON body as-is.
    return requests.get(api_url + "languages").json()
def _is_in_pwl(match, pwl):
start = match['context']['offset']
end = start + match['context']['length']
word = match['context']['text'][start:end]
return word in pwl
def check(input_text, api_url, lang, mother_tongue=None, preferred_variants=None,
          enabled_rules=None, disabled_rules=None,
          enabled_categories=None, disabled_categories=None,
          enabled_only=False, verbose=False,
          pwl=None,
          **kwargs):
    """
    Check given text and return API response as a dictionary.

    Args:
        input_text (str):
            Plain text that will be checked for spelling mistakes.

        api_url (str):
            API base url, e.g. ``https://languagetool.org/api/v2/``. The
            path ``check`` is appended to it verbatim.

        lang (str):
            Language of the given text as `RFC 3066`__ language code.
            For example ``en-GB`` or ``de-AT``. ``auto`` is a valid value too
            and will cause the language to be detected automatically.

            __ https://www.ietf.org/rfc/rfc3066.txt

        mother_tongue (str):
            Native language of the author as `RFC 3066`__ language code.

            __ https://www.ietf.org/rfc/rfc3066.txt

        preferred_variants (str):
            Comma-separated list of preferred language variants. The language
            detector used with ``language=auto`` can detect e.g. English, but
            it cannot decide whether British English or American English is
            used. Therefore, this parameter can be used to specify the
            preferred variants like ``en-GB`` and ``de-AT``. Only available
            with ``language=auto``.

        enabled_rules (str):
            Comma-separated list of IDs of rules to be enabled.

        disabled_rules (str):
            Comma-separated list of IDs of rules to be disabled.

        enabled_categories (str):
            Comma-separated list of IDs of categories to be enabled.

        disabled_categories (str):
            Comma-separated list of IDs of categories to be disabled.

        enabled_only (bool):
            If ``True``, only the rules and categories whose IDs are specified
            with ``enabledRules`` or ``enabledCategories`` are enabled.
            Defaults to ``False``.

        verbose (bool):
            If ``True``, a more verbose output will be printed (the request
            parameters and the decoded response). Defaults to ``False``.

        pwl (List[str]):
            Personal word list. A custom dictionary of words that should be
            excluded from spell checking errors.

        **kwargs:
            Additional keyword arguments are accepted and ignored.

    Returns:
        dict:
            A dictionary representation of the JSON API response.
            The most notable key is ``matches``, which contains a list of all
            spelling mistakes that have been found.

            E.g.::

                {
                    "language": {
                        "code": "en-US",
                        "detectedLanguage": {
                            "code": "en-US",
                            "confidence": 0.561,
                            "name": "English (US)",
                        },
                        "name": "English (US)",
                    },
                    "matches": [
                        {
                            "context": {"length": 1, "offset": 8, "text": "This is a example"},
                            "contextForSureMatch": 1,
                            "ignoreForIncompleteSentence": False,
                            "length": 1,
                            "message": "Use \"an\" instead of 'a' if the following word "
                                       "starts with a vowel sound, e.g. 'an article', 'an "
                                       "hour'",
                            "offset": 8,
                            "replacements": [{"value": "an"}],
                            "rule": {
                                "category": {"id": "MISC", "name": "Miscellaneous"},
                                "description": "Use of 'a' vs. 'an'",
                                "id": "EN_A_VS_AN",
                                "issueType": "misspelling",
                            },
                            "sentence": "This is a example",
                            "shortMessage": "Wrong article",
                            "type": {"typeName": "Other"},
                        }
                    ],
                    "software": {
                        "apiVersion": 1,
                        "buildDate": "2019-05-15 19:25",
                        "name": "LanguageTool",
                        "premium": False,
                        "premiumHint": "You might be missing errors only the Premium "
                                       "version can find. Contact us at "
                                       "support<at>languagetoolplus.com.",
                        "status": "",
                        "version": "4.6-SNAPSHOT",
                    },
                    "warnings": {"incompleteResults": False},
                }

    Raises:
        ValueError: If the API answers with a status code other than 200.
            The exception message is the raw response body.
    """
    # NOTE(review): the tail of the signature was not recoverable from the
    # damaged source. ``pwl`` is required by the body below; ``**kwargs`` is
    # kept so that callers passing a wider configuration dict keep working.
    # Confirm both against the upstream signature.
    post_parameters = {
        "text": input_text,
        "language": lang,
    }

    # Optional settings are only transmitted when they carry a truthy value,
    # so the server-side defaults apply otherwise.
    optional_parameters = (
        ("motherTongue", mother_tongue),
        ("preferredVariants", preferred_variants),
        ("enabledRules", enabled_rules),
        ("disabledRules", disabled_rules),
        ("enabledCategories", enabled_categories),
        ("disabledCategories", disabled_categories),
    )
    for name, value in optional_parameters:
        if value:
            post_parameters[name] = value
    if enabled_only:
        # Sent as the literal string 'true', not as a Python bool.
        post_parameters["enabledOnly"] = 'true'

    r = requests.post(api_url + "check", data=post_parameters)
    if r.status_code != 200:
        raise ValueError(r.text)

    # Decode the body once and reuse it for both the verbose dump and the
    # return value.
    data = r.json()
    if verbose:
        # NOTE(review): the body of this branch was missing from the damaged
        # source; printing the request and the response matches the
        # documented "more verbose output" -- confirm the exact output.
        print(post_parameters)
        print(data)

    if pwl:
        # Drop every match whose flagged text is on the personal word list.
        matches = data.pop('matches', [])
        data['matches'] = [
            match for match in matches
            if not _is_in_pwl(match, pwl)
        ]
    return data