Unitex/GramLab C++ Core
Branch: master
Clone or download
Fetching latest commit…
Cannot retrieve the latest commit at this time.
Permalink
Type Name Latest commit message Commit time
Failed to load latest commit information.
.github
Disclaimers
Licenses
UnitexLibAndJni
UnitexNet
UnitexRuby
base
bin
build
include_tre
logger
misc/tools
vendor
win32vs2008
.appveyor.yml
.clang-format
.editorconfig
.gitattributes
.gitignore
.gitignore.in
.pullapprove.yml
.travis.yml
AbstractAllocator.cpp
AbstractAllocator.h
AbstractAllocatorPlugCallback.h
AbstractCallbackFuncModifier.h
AbstractDelaLoad.cpp
AbstractDelaLoad.h
AbstractDelaPlugCallback.h
AbstractFilePlugCallback.h
AbstractFst2Load.cpp
AbstractFst2Load.h
AbstractFst2PlugCallback.h
ActivityLogger.cpp
ActivityLogger.h
ActivityLoggerPlugCallback.h
Af_stdio.cpp
Af_stdio.h
Alphabet.cpp
Alphabet.h
Any.h
ApplyDic.cpp
ApplyDic.h
Arabic.cpp
Arabic.h
AsciiSearchTree.cpp
AsciiSearchTree.h
AutComplementation.cpp
AutComplementation.h
AutConcat.cpp
AutConcat.h
AutDeterminization.cpp
AutDeterminization.h
AutIntersection.cpp
AutIntersection.h
AutMinimization.cpp
AutMinimization.h
AutomatonDictionary2Bin.cpp
AutomatonDictionary2Bin.h
BitArray.cpp
BitArray.h
BitMasks.cpp
BitMasks.h
Buffer.cpp
Buffer.h
BuildKrMwuDic.cpp
BuildKrMwuDic.h
BuildTextAutomaton.cpp
BuildTextAutomaton.h
Cassys.cpp
Cassys.h
Cassys_concord.cpp
Cassys_concord.h
Cassys_external_program.cpp
Cassys_external_program.h
Cassys_io.cpp
Cassys_io.h
Cassys_lexical_tags.cpp
Cassys_lexical_tags.h
Cassys_main_test.cpp
Cassys_tokens.cpp
Cassys_tokens.h
Cassys_transducer.cpp
Cassys_transducer.h
Cassys_xml_output.cpp
Cassys_xml_output.h
CharNames.h
CheckDic.cpp
CheckDic.h
CodePages.cpp
CodePages.h
CompoundWordHashTable.cpp
CompoundWordHashTable.h
CompoundWordTree.cpp
CompoundWordTree.h
Compress.cpp
Compress.h
CompressedDic.cpp
CompressedDic.h
ConcorDiff.cpp
ConcorDiff.h
Concord.cpp
Concord.h
Concordance.cpp
Concordance.h
Contexts.cpp
Contexts.h
Convert.cpp
Convert.h
Copyright.cpp
Copyright.h
DELA.cpp
DELA.h
DELA_tree.cpp
DELA_tree.h
DebugMode.cpp
DebugMode.h
DicVariables.cpp
DicVariables.h
Dico.cpp
Dico.h
DictionaryTree.cpp
DictionaryTree.h
Diff.cpp
Diff.h
DirHelper.h
DirHelperPosix.cpp
DirHelperWin.cpp
DumpOffsets.cpp
DumpOffsets.h
DuplicateFile.cpp
DuplicateFile.h
DutchCompounds.cpp
DutchCompounds.h
Elag.cpp
Elag.h
ElagComp.cpp
ElagComp.h
ElagDebug.cpp
ElagDebug.h
ElagFstFilesIO.cpp
ElagFstFilesIO.h
ElagFunctions.cpp
ElagFunctions.h
ElagRulesCompilation.cpp
ElagRulesCompilation.h
ElagStateSet.cpp
ElagStateSet.h
Error.cpp
Error.h
Evamb.cpp
Evamb.h
Extract.cpp
Extract.h
ExtractUnits.cpp
ExtractUnits.h
FIFO.cpp
FIFO.h
File.cpp
File.h
FileEncoding.h
Flatten.cpp
Flatten.h
FlattenFst2.cpp
FlattenFst2.h
Fst2.cpp
Fst2.h
Fst2Automaton.cpp
Fst2Automaton.h
Fst2Check.cpp
Fst2Check.h
Fst2Check_lib.cpp
Fst2Check_lib.h
Fst2List.cpp
Fst2List.h
Fst2Txt.cpp
Fst2Txt.h
Fst2TxtAsRoutine.cpp
Fst2TxtAsRoutine.h
Fst2Txt_TokenTree.cpp
Fst2Txt_TokenTree.h
GeneralDerivation.cpp
GeneralDerivation.h
GermanCompounds.cpp
GermanCompounds.h
Grf2Fst2.cpp
Grf2Fst2.h
Grf2Fst2_lib.cpp
Grf2Fst2_lib.h
GrfBeauty.cpp
GrfBeauty.h
GrfDiff.cpp
GrfDiff.h
GrfDiff3.cpp
GrfDiff3.h
GrfSvn_lib.cpp
GrfSvn_lib.h
GrfTest.cpp
GrfTest.h
GrfTest_lib.cpp
GrfTest_lib.h
Grf_lib.cpp
Grf_lib.h
HTMLCharacters.cpp
HTMLCharacters.h
HashTable.cpp
HashTable.h
IOBuffer.cpp
IOBuffer.h
ImplodeTfst.cpp
ImplodeTfst.h
KeyWords.cpp
KeyWords.h
KeyWords_lib.cpp
KeyWords_lib.h
Keyboard.cpp
Keyboard.h
Korean.cpp
Korean.h
KrMwuDic.cpp
KrMwuDic.h
LICENSE
LanguageDefinition.cpp
LanguageDefinition.h
LemmaTree.cpp
LemmaTree.h
LinearAutomaton2Txt.cpp
LinearAutomaton2Txt.h
List_int.cpp
List_int.h
List_pointer.cpp
List_pointer.h
List_ustring.cpp
List_ustring.h
LoadInf.cpp
LoadInf.h
Locate.cpp
Locate.h
LocateCache.cpp
LocateCache.h
LocateConstants.h
LocateFst2Tags.cpp
LocateFst2Tags.h
LocateMatches.cpp
LocateMatches.h
LocatePattern.cpp
LocatePattern.h
LocateTfst.cpp
LocateTfst.h
LocateTfstMatches.cpp
LocateTfstMatches.h
LocateTfst_lib.cpp
LocateTfst_lib.h
LocateTrace.cpp
LocateTrace.h
LocateTracePlugCallback.h
MF_DLC_inflect.cpp
MF_DLC_inflect.h
MF_DicoMorpho.cpp
MF_DicoMorpho.h
MF_DicoMorphoBase.h
MF_FormMorpho.cpp
MF_FormMorpho.h
MF_Global.cpp
MF_Global.h
MF_LangMorpho.cpp
MF_LangMorpho.h
MF_LangMorphoBase.h
MF_MU_graph.cpp
MF_MU_graph.h
MF_MU_morpho.cpp
MF_MU_morpho.h
MF_MU_morphoBase.h
MF_Operators_Util.cpp
MF_Operators_Util.h
MF_SU_morpho.cpp
MF_SU_morpho.h
MF_SU_morphoBase.h
MF_Unif.cpp
MF_Unif.h
MF_UnifBase.h
MF_Util.cpp
MF_Util.h
Main_BuildKrMwuDic.cpp
Main_Cassys.cpp
Main_CheckDic.cpp
Main_Compress.cpp
Main_ConcorDiff.cpp
Main_Concord.cpp
Main_Convert.cpp
Main_Dico.cpp
Main_DumpOffsets.cpp
Main_Elag.cpp
Main_ElagComp.cpp
Main_Evamb.cpp
Main_Extract.cpp
Main_Flatten.cpp
Main_Fst2Check.cpp
Main_Fst2List.cpp
Main_Fst2Txt.cpp
Main_Grf2Fst2.cpp
Main_GrfDiff.cpp
Main_GrfDiff3.cpp
Main_GrfTest.cpp
Main_ImplodeTfst.cpp
Main_KeyWords.cpp
Main_Locate.cpp
Main_LocateTfst.cpp
Main_MultiFlex.cpp
Main_MzRepairUlp.cpp
Main_Normalize.cpp
Main_PolyLex.cpp
Main_RebuildTfst.cpp
Main_Reconstrucao.cpp
Main_Reg2Grf.cpp
Main_Seq2Grf.cpp
Main_SortTxt.cpp
Main_SpellCheck.cpp
Main_Stats.cpp
Main_TEI2Txt.cpp
Main_Table2Grf.cpp
Main_Tagger.cpp
Main_TagsetNormTfst.cpp
Main_Test.cpp
Main_Tfst2Grf.cpp
Main_Tfst2Unambig.cpp
Main_TfstTag.cpp
Main_Tokenize.cpp
Main_TrainingTagger.cpp
Main_Txt2Tfst.cpp
Main_Uncompress.cpp
Main_UnitexTool.cpp
Main_UnitexToolLogger.cpp
Main_Untokenize.cpp
Main_Unxmlize.cpp
Main_XMLizer.cpp
MappedFileHelper.h
MappedFileHelperDummy.cpp
MappedFileHelperPosix.cpp
MappedFileHelperWin.cpp
Match.cpp
Match.h
MetaSymbols.h
MorphologicalFilters.cpp
MorphologicalFilters.h
MorphologicalLocate.cpp
MorphologicalLocate.h
MultiFlex.cpp
MultiFlex.h
NewLineShifts.cpp
NewLineShifts.h
NormalizationFst2.cpp
NormalizationFst2.h
Normalize.cpp
Normalize.h
NormalizeAsRoutine.cpp
NormalizeAsRoutine.h
NorwegianCompounds.cpp
NorwegianCompounds.h
Offsets.cpp
Offsets.h
OptimizedFst2.cpp
OptimizedFst2.h
OptimizedTfstTagMatching.cpp
OptimizedTfstTagMatching.h
OutputTransductionVariables.cpp
OutputTransductionVariables.h
Overlap.cpp
Overlap.h
PRLG.cpp
PRLG.h
PackFst2.cpp
PackFst2.h
PackInf.cpp
PackInf.h
ParsingInfo.cpp
ParsingInfo.h
Pattern.cpp
Pattern.h
PatternTree.cpp
PatternTree.h
PersistResource.cpp
PersistResource.h
Persistence.cpp
Persistence.h
PersistenceInterface.cpp
PersistenceInterface.h
PolyLex.cpp
PolyLex.h
PortugueseNormalization.cpp
PortugueseNormalization.h
ProgramInvoker.cpp
ProgramInvoker.h
README.md
README.md.in
RebuildTfst.cpp
RebuildTfst.h
Reconstrucao.cpp
Reconstrucao.h
Reg2Grf.cpp
Reg2Grf.h
RegExFacade.cpp
RegExFacade.h
RegularExpressions.cpp
RegularExpressions.h
RussianCompounds.cpp
RussianCompounds.h
SelectOutput.cpp
SelectOutput.h
Sentence2Grf.cpp
Sentence2Grf.h
Seq2Grf.cpp
Seq2Grf.h
SingleGraph.cpp
SingleGraph.h
Snt.cpp
Snt.h
SortTxt.cpp
SortTxt.h
SpellCheck.cpp
SpellCheck.h
SpellChecking.cpp
SpellChecking.h
Stack_int.cpp
Stack_int.h
Stack_pointer.cpp
Stack_pointer.h
Stack_unichar.cpp
Stack_unichar.h
Stats.cpp
Stats.h
StringParsing.cpp
StringParsing.h
String_hash.cpp
String_hash.h
Symbol.cpp
Symbol.h
SymbolAlphabet.cpp
SymbolAlphabet.h
Symbol_op.cpp
Symbol_op.h
SyncTool.h
SyncToolDummy.cpp
SyncToolPosix.cpp
SyncToolWin.cpp
TEI2Txt.cpp
TEI2Txt.h
Table2Grf.cpp
Table2Grf.h
Tagger.cpp
Tagger.h
TaggingProcess.cpp
TaggingProcess.h
Tagset.cpp
Tagset.h
TagsetNormTfst.cpp
TagsetNormTfst.h
Test_lib.cpp
Text_parsing.cpp
Text_parsing.h
Text_tokens.cpp
Text_tokens.h
Tfst.cpp
Tfst.h
Tfst2Grf.cpp
Tfst2Grf.h
Tfst2Unambig.cpp
Tfst2Unambig.h
TfstStats.cpp
TfstStats.h
TfstTag.cpp
TfstTag.h
Thai.cpp
Thai.h
Token.h
Tokenization.cpp
Tokenization.h
Tokenize.cpp
Tokenize.h
TrainingProcess.cpp
TrainingProcess.h
TrainingTagger.cpp
TrainingTagger.h
TransductionStack.cpp
TransductionStack.h
TransductionStackTfst.cpp
TransductionStackTfst.h
TransductionVariables.cpp
TransductionVariables.h
Transitions.cpp
Transitions.h
Txt2Tfst.cpp
Txt2Tfst.h
Uncompress.cpp
Uncompress.h
Unicode.cpp
Unicode.h
UnitexGetOpt.cpp
UnitexGetOpt.h
UnitexLibDir.h
UnitexLibDirPosix.cpp
UnitexLibDirWin.cpp
UnitexLibIO.cpp
UnitexLibIO.h
UnitexLibIO_ICU.cpp
UnitexLibIO_ICU.h
UnitexRevisionInfo.cpp
UnitexRevisionInfo.h
UnitexString.h
UnitexTool.cpp
UnitexTool.h
Unitex_revision.h
Untokenize.cpp
Untokenize.h
UnusedParameter.h
Unxmlize.cpp
Unxmlize.h
UserCancelling.cpp
UserCancelling.h
UserCancellingPlugCallback.h
Ustring.cpp
Ustring.h
VariableUtils.cpp
VariableUtils.h
Vector.h
Version.h
Version.h.in
VersionInfo.cpp
VersionInfo.h
VirtualFiles.cpp
VirtualFiles.h
XMLizer.cpp
XMLizer.h
Xml.cpp
Xml.h
config.h
gitignore.io.sh

README.md

Unitex/GramLab Core Build Status Build status

Unitex/GramLab is an open source, cross-platform, multilingual, lexicon- and grammar-based corpus processing suite.

Unitex is the Natural Language Processing (NLP) engine of Unitex/GramLab.

How to Build

git clone https://github.com/UnitexGramLab/unitex-core
cd unitex-core/build
make DEBUG=yes UNITEXTOOLLOGGERONLY=yes

Contributing

Everyone is welcome to contribute to improving this project. See CONTRIBUTING.md for contribution guidelines and instructions.

Documentation

The User's Manual (in PDF format) is available in English and French (more translations are welcome). You can view and print it with Evince, downloadable here. The latest version of the User's Manual is accessible here.

Support

Support questions can be posted in the community support forum. Please feel free to submit any suggestions or requests for new features too. Some general advice about asking technical support questions can be found here.

Reporting Bugs

See the Bug Reporting Guide for information on how to report bugs.

Governance Model

Unitex/GramLab project decision-making is based on a community meritocratic process: anyone with an interest in the project can join the community, contribute to the project design and participate in decisions. The Unitex/GramLab Governance Model describes how this participation takes place and how to set about earning merit within the project community.

Spelling

Unitex/GramLab is spelled with a capital "U", "G" and "L", and with everything else in lower case. Except for the forward slash, do not put a space or any other character between the words. Only when the forward slash is not allowed may you write "UnitexGramLab" instead.

It's common to refer to the Unitex/GramLab Core as "Unitex", and to the Unitex Project-oriented IDE as "GramLab". If you are mentioning the distribution suite (Core, IDE, Linguistic Resources and other bundled tools), always use "Unitex/GramLab".

License

This program is licensed under the GNU Lesser General Public License version 2.1. Contact unitex-devel@univ-mlv.fr for further inquiries.

--

Copyright (C) 2019 Université Paris-Est Marne-la-Vallée