Property name CoreServer
General
license.file yes
license.database yes
endpointHost yes
endpointListenHost yes
endpointPort yes
httpDocbase yes
outputPath yes
externalBaseUrl yes
coreServerEndpointUrl no
pingInterval yes
postprocessXsltLocationUrl no
writeRequest yes
sentenceLengthStatistics no
resetAdminPassword yes
termRuleConstructionTextType no
clientPropertiesPath yes
clientPropertiesModelUser yes
output.writeDeepProcessorInput no
output.writeAnnotation no
logging.jetty yes
Language settings
language.id no
name no
rulePriorityFactor no
Linguistic resources
tokenizer no
morphology no
spellchecker no
tagger no
tagger.lexica no
tagger.theta no
compounding no
Text type settings
textTypes no
[TEXTTYPE].grammarRules no
[TEXTTYPE].styleRules no
[TEXTTYPE].harvestingRules no
[TEXTTYPE].sentenceLength no
[TEXTTYPE].ruleRelevantContexts no
[TEXTTYPE].reportRelevantContexts no
[TEXTTYPE].contextSegmentationDefinitions no
Tokenizer
tokenizer.significantInterspace no
tokenizer.formsRewrites no
CaseAdjuster
caseAdjuster.allowSentenceInitialCaseDifference no
TermChecking
canMarkKnownTerms no
terminology.sources no
terminology.pathPrefix no
terminology.helpPathPrefix no
terminology.defaultEngine no
terminology.useAsSpellingSuggestions no
terminology.illegalVariants.enableCaseVariants no
terminology.illegalVariants.flagAllUpperCase no
terminology.illegalVariants.flagAllLowerCase no
terminology.illegalVariants.flagMixedCase no
terminology.illegalVariants.flagBosFormAtMos no
terminology.illegalVariants.flagTitleCase no
terminology.significantTermElementRegex no
terminology.variantTrimmingRegex no
terminology.tokensToTreatAsDictionaryEntries no
terminology.mcatsToIncludeInVariants no
terminology.mcatsToExcludeFromVariants no
terminology.enableVariantsOfIllegal no
Built-in rule help
sentenceTooLongHelp no
sentenceTooLongPhrase no
Spellchecker settings
spellchecker.checkCapitalization no
spellchecker.disableSentenceUppercase no
spellchecker.reportUnknownWords no
spellchecker.tokensToCheck no
spellchecker.tokensNotToCheck no
spellchecker.tokensToIgnoreForCapitalisation no
spellchecker.tokensNoCaseChange no
spellchecker.tokensTransparentForCapitalisation no
spellchecker.tokensToIgnoreForDuplicates no
spellchecker.significantInterspace no
spellchecker.noCapitalAfterTokens no
spellchecker.possiblyCapitalAfterTokens no
spellchecker.maximumStringDistance no
spellchecker.doNotCheckShorterThan no
spellchecker.tryRunTogetherWords no
spellchecker.trySplitWords no
spellchecker.noDuplicatesShorterThan no
spellchecker.suggestTerms Deprecated! Use terminology.useAsSpellingSuggestions instead or specify in the termbanks' "spelling" fields.
spellchecker.derivationPrefixes no
spellchecker.truncatedTokens no
spellchecker.spellingRules no
Term design
termdesign.db.host no
termdesign.db.port no
termdesign.importPath no
termdesign.exportPath no
termdesign.handlePOS yes
Term harvesting
termharvesting.db.host no
termharvesting.db.port no
termharvesting.surroundcontext no
termharvesting.onlyServerSide no
termharvesting.spellingNewWordsConflictPreference no
termharvesting.ignoreDisabledTermbanks no
termharvesting.clustering no
XML & Context-sensitive processing settings
xml.dtdPrefixMappings.[ID] .from no
xml.dtdPrefixMappings.[ID] .to no
xml.annotationType no
Annotation type "pi"
xml.pi.flagName no
xml.pi.markedTokenBeginName no
xml.pi.markedTokenEndName no
Annotation type "element"
xml.element.namespacePrefix no
xml.element.namespaceUri no
Internal settings
processibleSentenceFilter.maxWordCount no
processibleSentenceFilter.maxTokenCount no
soapLogging yes
tagger.createTrainingData no
internal.terminologyManagementIsActivated yes
internal.preloadTerminologyManager yes
Intelligent reuse settings
[TEXTTYPE].reuse.output.writeSentenceSurfaceIndex no
[TEXTTYPE].reuse.surfaceIndexPath no
[TEXTTYPE].reuse.indexerIsAlwaysActivated no
[TEXTTYPE].reuse.normalizer.settings no
[TEXTTYPE].reuse.repository no
[TEXTTYPE].reuse.usageStatistics no
[TEXTTYPE].reuse.maxNumberOfSuggestions no
[TEXTTYPE].reuse.maxQueryTerms no
[TEXTTYPE].reuse.minPercentTermsToMatch no
[TEXTTYPE].reuse.minScore no
[TEXTTYPE].reuse.checkerIsAlwaysActivated no
[TEXTTYPE].reuse.antonymList no
[TEXTTYPE].reuse.scoringStopwordList no
[TEXTTYPE].reuse.variableSubstitution.substituteVariables no
[TEXTTYPE].reuse.showSuggestionDebugInfo no
LanguageServer Required Audience
no no admin (installation)
no no admin (installation)
yes no admin (installation)
no no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
no no admin (installation)
yes yes admin (installation)
yes no admin (installation)
yes no admin (installation)
no no admin (installation)
yes no admin (installation)
no no admin (installation)
yes no admin (lingware)
no no admin (installation)
no no admin (installation)
yes no admin (lingware)
yes no admin (lingware)
no no admin (installation)
yes yes admin (installation)
yes no admin (installation)
yes no admin (lingware)
yes no admin (installation)
yes yes admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (installation)
yes yes admin (installation)
yes yes admin (lingware)
yes yes admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (terminology)
yes no admin (lingware)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (terminology)
yes no admin (installation)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
Deprecated! Use terminology.useAsSpellingSuggestions instead or specify in the termbanks' "spelling" fields.
yes no admin (lingware)
yes no admin (lingware)
yes yes admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
no no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (installation)
yes no admin (lingware)
yes no admin (lingware)
yes no acrolinx service
yes no lingware developers
no no admin (installation)
no no admin (installation)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
yes no admin (lingware)
Type of value
String (Path)
String (Path)
String (Hostname / IP address)
String (Hostname / IP address)
Integer
String (Path)
String (Path)
String (URL)
String (URL)
Integer
String (Path)
Boolean
Boolean
String
String (TextType)
String (Path)
String (user id)
Boolean
Boolean
String (Path)
String
String
List of Pairs
String (Path)
String (Path)
String (Path)
String (Path)
List of Strings (Paths)
Integer
String (Path)
List of Strings
String (Path)
String (Path)
String (Path)
Integer
List of Strings
List of Strings
List of Strings (Paths)
List of TokenClasses
List of semicolon-separated comma-separated pairs
Boolean
Boolean
List of semicolon-separated Strings (Acrolinx URIs)
String (Path)
String (Path)
String (rule or fsa)
Boolean
Boolean
Boolean
Boolean
Boolean
Boolean
Boolean
String (Java regular expression)
String (Java regular expression)
List of TokenClasses
List of Strings
List of Strings
Boolean
String (Path)
String
Boolean
Boolean
Boolean
List of TokenClasses
List of TokenClasses
List of TokenClasses
List of TokenClasses
List of TokenClasses
List of TokenClasses
List of TokenClasses
List of TokenClasses
List of TokenClasses
Integer
Integer
Boolean
Boolean
Integer
Deprecated! Use terminology.useAsSpellingSuggestions instead or specify in the termbanks' "spelling" fields.
List of Strings (Prefixes)
List of TokenClasses
String (Path)
String (IP/Hostname)
Integer
String (Path)
String (Path)
Boolean
String (IP/Hostname)
Integer
Integer
Boolean
none|spellingError
Boolean
Boolean
String (URL)
String (URL)
String
String
String
String
String
String
Integer
Integer
Boolean
String (Path)
Boolean
Boolean
Boolean
String (Path)
Boolean
String (Path)
String (Path)
String (Path)
Integer
Integer
Float
Float
Boolean
String (Path)
String (Path)
Boolean
Boolean
Default value
acrocheck.license
acrocheck
127.0.0.1
0.0.0.0
8031 (core server), 8029 (language server)
../www
output
30
false
false
***BASE***
../../data/clients
admin
false
false
unknown
10
-1
true
true
../../data/[LANGID]/terms/
htmldata/[LANGID]/terms/defs
fsa
false
true
false
true
true
true
false
[^/\\- ]+
[/\\- ]+
false
[internal]
sentence_too_long
true
false
false
4
3
false
false
2
127.0.0.1
1527
../../data/import
../../data/export
false
spellingError
false
false
none
acrocheckFlag
acrocheckMarkedTokenBegin
acrocheckMarkedTokenEnd
a
http://www.acrolinx.com/xmlns/acrocheck
70
1.5*70
false
false
true
false
false
6
10
0.5
0.5
false
true
false
Description
Path to license file, relative to the server bin directory.
Path to license database file, relative to the server bin directory. The server will append extensions for the license
database (.ALD) and the license database backup (.ALB).
The host name or IP address under which this server is accessible for clients.
The host name or IP address on which this server should listen for client requests.
The TCP port number under which this server is accessible for clients and on which it should listen for requests.
Path to documents served by the webserver
Path prefix for output generated by server. Relative to httpDocbase.
URL of externally visible server address (e.g. for reverse proxies).
URL of the core server endpoint address that should be contacted.
Time (in seconds) between proxy / language server synchronization attempts
XSL stylesheet to render HTML report
If set to true the text and the checking options properties are stored in two separate files in the output folder.
If set to true statistics about sentence length distribution will be added to the reports.
If set, the password for the default admin user "admin" is reset to the specified value with the next server start.
The name of the text type which should be used by the client to generate term rules.
Path prefix for client (plugin) properties stored by the server. Relative to the server bin directory.
User id from which default values for client properties will be taken.
Determines whether deep processor input should be written for each file (to _deep_processor_input.dpi).
Determines whether annotated output should be written for each file (to _annotated.ala).
Path to request log file for the embedded Jetty server
Language identifier for language implemented by this server. Most commonly a two letter string.
Human readable name of the language implemented by this server.
A list of pairs with the factors for the rule priority of the grammar and style rules calculated for the score of the
report. Note that priorities are one-based, with priority one being the highest (and default) priority
Base name of main tokenizer rule file (.tok) (may include other tokenizer rule files).
Base name of file containing the morphological lexicon.
Base name of file containing spell checker lexicon.
Base name of files containing tagger model (.123), (optional) lexicon (.lex), (optional) morphology mapping (.map),
(optional) token class mapping (.tokmap), and (optional) word guesser rules (.awg).
Base names of files containing additional tagger lexica (.lex).
Threshold value for determining tag assignment reliability. Increasing this value results in fewer assignments being
classified as reliable.
Base name of files containing rules (.rul) and (optional) exceptions (.exc) for compound analysis.
List of text type names.
Name of file containing grammar rules for this text type.
Name of file containing style rules for this text type.
Name of file containing term harvesting rules for this text type. If not given, term harvesting is not available for this
text type.
Maximum sentence length for this text type.
Specifies the list of element names relevant for context-sensitive processing. Only elements mentioned here will be
available to the rule formalism.
Specifies the list of element names which should be included in the report as a flag's sourceContexts. Currently, this
includes mainly PDF page number contexts.
Specifies the list of context segmentation definition files to use for this text type.
Defines token classes that represent significant interspace, i.e. which are not allowed between multi token terms.
Defines rewrites to be performed for TOKEN.FORMS
Determines whether a case difference at the beginning of a sentence is allowed. (Original description unreadable in the source; reconstructed from the property name, to be confirmed.)
Determines whether the server allows the marking of known terms.
Files or directories containing files with term rules. All given files/all files from given directories are loaded. The
names are relative to the pathprefix.
Path prefix to term resources, currently only used for acroterm termbanks. Relative to server bin directory.
Path prefix to term definitions, relative to web server root.
Determines the standard engine (term rules or term fsa) to be used for termbanks. This can be overridden for each
termbank individually by specifying the "engine=rule" or "engine=fsa" property in the termbank's acrolinx URI.
Determines whether terms should be used as spelling suggestions. This value can be set individually for each
termbank by adding a "spelling=true" (or false) in the termbank's acrolinx URI specification.
Determines whether case variants should be checked at all; if set to false, no case variants are flagged.
Determines whether the all upper case variant of a legal term should be flagged as illegal by default.
Determines whether the all lower case variant of a legal term should be flagged as illegal by default.
Determines whether the mixed case variants of a legal term should be flagged as illegal by default.
Determines whether the BOS form of a legal term should be flagged as illegal by default when encountered in MOS
position.
Determines whether the Title Case Form of a legal term should be flagged as illegal by default.
Determines the parts of term surfaces which must not be normalized. To turn off term variant detection completely,
you can use the expression '.+' (without the quotes). See also variantTrimmingRegex.
Determines the leading and terminating parts of term surfaces which are ignored for variant detection. Use '$^'
(without the quotes) to turn off variant detection completely. See also significantTermElementRegex.
Defines token classes that are treated as dictionary entries, when the token itself is not in the dictionary (e.g. Unit)
Defines the mcats for which term variants should always be found. If all parts of a candidate term variant have any
one of these mcats, it is considered to be a term variant.
Defines the mcats for which no term variants should be found. If any one part of a candidate term variant has any
one of these mcats, it is not considered to be a term variant.
Iff false, no variants of illegal terms are flagged.
Name of file containing help for the sentence too long rule.
Label used for sentence too long errors.
If set to false, capitalization will not be checked.
If set to true, the check for sentence initial upper case is disabled.
If set to true, words which are not found in the lexicon are flagged (report only). Otherwise, they are silently ignored.
List of token classes to consider for spell checking.
List of token classes to exclude from spell checking. (Original description unreadable in the source; reconstructed from the property name, to be confirmed.)
List of token classes to ignore when case checking.
List of token classes where case never changes
List of token classes which do not affect capitalisation
List of token classes to ignore when checking for repeated words.
Defines token classes that represent significant interspace, i.e. that may separate two occurrences of a string without
raising a duplicate flag.
Sentences that follow a sentence whose last token is one of these, should not be capitalised.
Sentences that follow a sentence whose last token is one of these, may be capitalised (i.e. both spellings are
possible).
Maximum distance between a string and its spelling suggestions. Suggestions that are farther away are not
presented to the user.
Do not check strings which are shorter than this value.
Check if a string consists of two words that have been accidentally written together.
Check if a word has been accidentally split into two by inserting a space.
Do not check if strings shorter than this might be duplicates.
Comma-separated list of prefixes. Spell checker suggestions are combined with these prefixes and if that gives the
word in the text, the suggestion is removed from the list.
List of token classes that are to be considered as truncated (typically beginning or ending with a hyphen)
Name of file containing spell checking rules.
Host for the term database connection
Port for the term database connection
Import directory for Term Design Client. Relative to the server bin directory.
Export directory for Term Design Client. Relative to the server bin directory.
If set to true, the POS of a term is compared, while importing an OLIF file, with the possible POS of this
word according to the morphology. If set to false, the POS is ignored.
Host for the term harvesting results database connection
Port for the term harvesting results database connection
Number of surrounding contexts of an extracted term
This property is set if the termharvester should not be available for clients.
If you set it to "spellingError", a spelling error will not be marked as a new term (unless the spelling mistake only
concerns case distinctions). If you set it to anything else, spelling errors may also be marked as term candidates.
If it is set to "true", words in included but not enabled termbanks can be extracted as terms.
If it is set to "false", clustering will not be performed on the harvested terms. Disabling clustering speeds up
term harvesting.
The URL or path prefix where DTDs are looked up by XML documents.
The URL or path prefix to which an encountered "from" prefix should be mapped on the server side.
The type of XML annotation to use. Currently supported types are "none", "pi", and "element".
The name of the processing instruction to use for inserting an acrocheck flag in the XML annotation.
The name of the processing instruction to use for annotating the begin of a marked token.
The name of the processing instruction to use for annotating the end of a marked token.
The namespace prefix to use for acrocheck annotation elements.
The namespace URI to use for acrocheck annotation elements.
Maximum number of words in a processible sentence. Sentences with more words will be excluded from linguistic
processing.
Maximum number of tokens in a processible sentence. Sentences with more tokens will be excluded from linguistic
processing.
If set to true, the names of all incoming and outgoing SOAP messages will be logged.
Name of file where tagger training material will be written to.
Activate the new Terminology Management component in server releases not officially supporting it
Load and initialize the persistence layer of the Terminology Manager on startup of the server instead of on the first
access to the Terminology Manager through the Dashboard.
Determines whether the surface for each sentence should be written to a sentence surface index
If this parameter is set, the sentence surfaces are written to the specified index, otherwise a new index is created for
each checked document in the default output folder
Determines whether the surface index should always be written regardless of what the client property says
Name of the file containing the normalizer settings for the normalization of sentences in the intelligent reuse
component
Name of the directory containing the intelligent reuse repository cluster index
Name of the directory containing the intelligent reuse repository usage statistics index
Maximum number of suggestions to generate from the reuse repository for a specific sentence being checked.
Maximum number of query terms which are generated from a sentence for the query against the reuse repository.
Minimum percentage of the query terms which must match a sentence from the reuse repository.
Minimum query and minimum jaccard score of a sentence from the reuse repository to qualify as suggestion.
Determines whether the reuse checker should always be run regardless of what the client property says
Name of the antonym list file, used to decide if two similar sentences are semantically different
Name of the stopword file, which contains tokens that are ignored when computing the similarity score of a
sentence
Determines whether variable substitution should be activated
Determines whether suggestions should be displayed together with their score and the ID of their respective cluster.
Example value
d:/secure/acrocheck/license
10.10.10.10
10.10.10.10
9000
../www
acrocheckoutput
http://reverse.proxy.company.com/acrolinx/acrocheck
http://127.0.0.1:8031/acrolinx/services/core?wsdl
300
../../xsl/ur2html.xsl
true
true
newPasswd345
Service
d:/acrocheck/clientProperties
lingadmin
true
true
../logs/coreserver.jetty.log
EN
English
1, 2.;2, 1.;2, 0.5;3, 0.;
tokenRulesEN
english
english
taggerDE
taggerProductNames,taggerCustomerSpecific
100
german-compounding.rul
User,Service
rules/sampleGrammar.rul
rules/sampleStyle.rul
rules/sampleTH.rul
40
H1,LIST
PAGE, ACROLINX
docbook.csd,html.csd,default.csd
Tabulator
ae,ä;oe,ö;ue,ü
termfinder.allowSentenceInitialCaseDifference=false
false
atd:file:jura.atd;axt:db:localhost:1527:bank1,bank2;axt:file:e:/customer/
terms/
htmldata/EN/terms/defs/
true - for a given termbank: axt:db:localhost:1527:products[spelling=true]
false
true
true
true
true
true
(\\p{Lu}|\\p{Ll}|\\p{Lt}|\\p{Lm}|\\p{Lo}|\\p{Nd}|\\p{Nl}|\\p{No}|\\p{Sm}|\\p{Sc}|\\p{Sk}|\\p{So})+
[/\\- ]+
Unit
Noun
Apd
true
../bin/sentence_too_long.xml
sentence too long
false
true
true
FirstLowerWord,FirstCapitalWord,LowerWord,LowerCaseWordWithHyphen,MixedWordWithHyphen
Colon,Number
CapitalWord
DoubleQuote
VersionNumber,HtmlEntity,Multiple,NumberWithSpace
Tabulator
Semicolon,ParenthesisOpen
Colon
6
3
true
true
2
un,pre,post
rules/spelling.rul
d:/terminology/import
x:/terms/export
localhost
1527
2
true
none
true
true
../../dtd/
../../data/DE/my_dtd
pi
acroFlag
acroTokenBegin
acroTokenEnd
30
60
true
true
true
false
true
true
resources/EN.ans
reuse/clusterIndex
reuse/usageIndex
8
15
0.7
0.7
true
resources/antonyms.aal
resources/scoringStopwordList.txt
false
true
Comment
If used for a specific term bank, only on the axt:db URL, not
on axt:file.
{Sm}|\\p{Sc}|\\p{Sk}|\\p{So})+
This may disappear with the integration of caseAdjuster.
xedWordWithHyphen
This may disappear with the integration of caseAdjuster.
The ace file is the equivalent for strings.
This may disappear with the integration of caseAdjuster.
Use tokenizer.significantInterspace instead.
This may disappear with the integration of caseAdjuster.
This may disappear with the integration of caseAdjuster.
Used by abb-based spelling suggester.
Only useful for the OLIF import.
It is not possible for the time being to ignore spelling errors
in favour of term candidates.
This setting will disappear with release 4.0
This property and the next two properties must always be
configured, if intelligent reuse is to be used.
The availability of Intelligent reuse component is triggered
by the existence of this property
This property should always be configured together with the
property just above.