; TAF configuration: application profiles, plug-ins, stopword filters and
; annotation-type settings.
;
; Layout used in this file:
;   - every section header stands on its own line
;   - one "key = value" pair per line
;   - comments are full-line, start with ';' and sit above the key they describe
;   - list values are comma-separated on a single line
;
; NOTE(review): boolean values appear both as yes/no and as true/false. They
; are kept exactly as originally written; confirm which spellings the
; consuming parser accepts before normalising them.

[TAF]

; Application profile UPDATE.
; NOTE(review): the PlugInSequence entries presumably refer to the
; [TAF_PlugIn:*] sections below, and FilterSet to a [TAF_Filter:*] section,
; matched case-insensitively - confirm.
[TAF_Application:UPDATE]
PlugInSequence = taf_tok, taf_poe
TargetTypesSet = TAF_Token, TAF_Sentence, TAF_Paragraph
FilterSet = StwIgnAllUpCs
PreventDuplicateTargetTypes = yes
Normalize = no
NormalizeUmlauts = no
ConvertToLowerCase = yes
ConvertAllUpperCaseToLowerCase = yes
; Memory pool sizes below are given in bytes.
MemPoolInstInitial = 64000
MemPoolInstGrow = 64000
MemPoolDocBufferInitial = 96000
MemPoolDocBufferGrow = 128000
MemPoolDocMiscInitial = 128000
MemPoolDocMiscGrow = 128000

; Application profile QUERY. Compared with UPDATE it adds the taf_thes and
; taf_soundex plug-ins, requests four additional target types, and uses
; smaller document buffer / misc memory pools.
[TAF_Application:QUERY]
PlugInSequence = taf_tok, taf_poe, taf_thes, taf_soundex
TargetTypesSet = TAF_Token, TAF_Sentence, TAF_Paragraph, TAF_Synonym, TAF_TokenInflectedForms, TAF_ThesaurusEntry, TAF_TokenSoundexString
FilterSet = StwIgnAllUpCs
PreventDuplicateTargetTypes = yes
Normalize = no
NormalizeUmlauts = no
ConvertToLowerCase = yes
ConvertAllUpperCaseToLowerCase = yes
; Memory pool sizes below are given in bytes.
MemPoolInstInitial = 64000
MemPoolInstGrow = 64000
MemPoolDocBufferInitial = 8000
MemPoolDocBufferGrow = 16000
MemPoolDocMiscInitial = 64000
MemPoolDocMiscGrow = 64000

; Plug-in TAF_TOK.
[TAF_PlugIn:TAF_TOK]
Filename = /usr/lib/itetoknz
UseAlternateTerritories = yes
; Stopwords are counted as token numbers.
TokenNumbersIncludeStopwords = true
; Ignore punctuation tokens for TSE.
IgnorePunctuationTokens = true

; Plug-in TAF_POE.
[TAF_PlugIn:TAF_POE]
Filename = /usr/lib/itepoe
; Trace component id for this plug-in (200 < TraceCompId < 255).
TraceCompId = 201
; List of all languages to pre-load at init time, each in the form XX-YY
; (XX = language, YY = sublanguage/territory).
PreloadLanguages = EN-US
; Size of the POE reply buffer, in KB.
ReplyBufferSizeKB = 64
; Enable/disable the (expensive) line-search pre-processing of input.
ScanInputForLines = true
; Enable/disable counting of stopwords as tokens.
TokenNumbersIncludeStopwords = true
; Enable/disable annotation of TSE-relevant data.
SetOnlyTSERelevantAttributes = true
DelayLoad = true
GeneratedTypesForDelayedLoad = TAF_Token, TAF_Sentence, TAF_Paragraph, TAF_Lemma, TAF_Synonym, TAF_CompoundPart, TAF_TokenInflectedForms
; Comma-separated entries; each entry is a type name followed by
; colon-separated language codes.
SupportedLanguagesForDelayedLoad = TAF_Token:ar:he:ja:th:ko:zh_traditional:zh_simplified, TAF_Sentence:ar:he:ja:th:ko:zh_traditional:zh_simplified, TAF_Paragraph:ar:he:ja:th:ko:zh_traditional:zh_simplified

; Plug-in TAF_THES.
[TAF_PlugIn:TAF_THES]
Filename = /usr/lib/itethes
DelayLoad = true
GeneratedTypesForDelayedLoad = TAF_ThesaurusEntry
RequiredTypesForDelayedLoad = TAF_Token

; Plug-in TAF_SOUNDEX.
[TAF_PlugIn:TAF_SOUNDEX]
Filename = /usr/lib/itesndex
DelayLoad = true
GeneratedTypesForDelayedLoad = TAF_TokenSoundexString
RequiredTypesForDelayedLoad = TAF_Token

; Stopword filter STWUSEALLUPCS.
; NOTE(review): this section and [TAF_Filter:STWIGNALLUPCS] carry identical
; values; only the original comments on MinUpperCaseTokenLength differ.
; Presumably the differing treatment of all-uppercase tokens is selected by
; the filter name - confirm.
[TAF_Filter:STWUSEALLUPCS]
FilterType = TAF_FILTER_STW
; Anything shorter will be considered a stopword.
MinTokenLength = 1
; Same as 'MinTokenLength': all-uppercase tokens are no exceptions.
MinUpperCaseTokenLength = 1
UseAlternateTerritories = yes

; Stopword filter STWIGNALLUPCS.
[TAF_Filter:STWIGNALLUPCS]
FilterType = TAF_FILTER_STW
; Anything shorter will be considered a stopword.
MinTokenLength = 1
; All-uppercase tokens with length >= 1 are exceptions.
MinUpperCaseTokenLength = 1
UseAlternateTerritories = yes

; Settings for the TAF_ThesaurusEntry annotation type.
[TAF_AnnotationType:TAF_ThesaurusEntry]
ThesBaseName = itethes
Depth = 1

; Settings for the TAF_Token annotation type.
[TAF_AnnotationType:TAF_Token]
; Must be disabled initially.
GenerateInflectedForms = false
; Must be disabled initially.
GenerateSoundex = false

; Marker section closing the file; keep it as the final entry.
; NOTE(review): presumably required by the reader as a terminator - confirm.
[EndOfFile]