Skip to content

Commit

Permalink
Merge pull request #171 from InsomniacSabbir/master
Browse files Browse the repository at this point in the history
Added sanskrit corpora
  • Loading branch information
kylepjohnson committed Mar 5, 2016
2 parents d057ca5 + 399a653 commit b73a581
Show file tree
Hide file tree
Showing 3 changed files with 9 additions and 2 deletions.
Empty file.
5 changes: 5 additions & 0 deletions cltk/corpus/sanskrit/corpora.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
# Registry of Sanskrit corpora. Each entry is a dict with 'name',
# 'location', and 'type' keys.
SANSKRIT_CORPORA = [
    {
        'name': 'sanskrit_text_jnu',
        'location': 'remote',
        'type': 'text',
    },
]
6 changes: 4 additions & 2 deletions cltk/corpus/utils/importer.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@
from cltk.corpus.coptic.corpora import COPTIC_CORPORA
from cltk.corpus.greek.corpora import GREEK_CORPORA
from cltk.corpus.latin.corpora import LATIN_CORPORA
from cltk.corpus.sanskrit.corpora import SANSKRIT_CORPORA
from cltk.corpus.multilingual.corpora import MULTILINGUAL_CORPORA
from cltk.corpus.pali.corpora import PALI_CORPORA
from cltk.corpus.tibetan.corpora import TIBETAN_CORPORA
Expand All @@ -22,15 +23,16 @@
from urllib.parse import urljoin


AVAILABLE_LANGUAGES = ['chinese', 'coptic', 'greek', 'latin', 'multilingual', 'pali', 'tibetan']
AVAILABLE_LANGUAGES = ['chinese', 'coptic', 'greek', 'latin', 'multilingual', 'pali', 'tibetan','sanskrit']
CLTK_DATA_DIR = '~/cltk_data'
LANGUAGE_CORPORA = {'chinese': CHINESE_CORPORA,
'coptic': COPTIC_CORPORA,
'greek': GREEK_CORPORA,
'latin': LATIN_CORPORA,
'multilingual': MULTILINGUAL_CORPORA,
'pali': PALI_CORPORA,
'tibetan': TIBETAN_CORPORA,}
'tibetan': TIBETAN_CORPORA,
'sanskrit': SANSKRIT_CORPORA,}



Expand Down

0 comments on commit b73a581

Please sign in to comment.