;
; Word classification rules.
;
; The following commands are available:
;   - delete 'word'          : delete 'word' from the mail word-list
;   - set 'variable' 'value' : set 'variable' to 'value'
;       The following variables are available:
;         - counter          : number of classified words
;         - group            : group of the classified words
;         - begin            : start pattern of the word of the desired group
;         - variablePart     : pattern of the variable (middle) part of the
;                              word of the desired group
;         - ending           : end pattern of the word of the desired group
;         - baseRule         : rule to convert the found word to the base word
;         - endings          : rules to convert the base word to the derived
;                              words
;         - allEndings       : flag to add all forms to the base word
;         - withBasewordOnly : flag to accept only words with an existing
;                              base word
;   - add 'variable' 'value' : add 'value' to 'variable'
;   - extract                : search the next base word and extract all
;                              derived words from the list
;
; NOTE(review): this script also uses the 'message' command and the
; 'maxLineCnt' variable, neither of which is described in the list above.
; Their exact semantics should be confirmed against the interpreter.
;

;
; Constant (function) words that are removed from the word-list up front.
; The entries follow the German paradigm order, which is why some words
; ("ein", "sie", "sein", "ihr") are listed more than once.
;

; articles
delete "der"
delete "die"
delete "das"
delete "ein"
delete "eine"
delete "ein"

; personal pronouns
delete "ich"
delete "du"
delete "er"
delete "sie"
delete "es"
delete "wir"
delete "ihr"
delete "sie"

; possessive pronouns
delete "mein"
delete "dein"
delete "sein"
delete "ihr"
delete "sein"
delete "unser"
delete "euer"
delete "ihr"

; interrogatives
delete "wer"
delete "wie"
delete "was"
delete "warum"
delete "wieso"
delete "weshalb"
delete "weswegen"

set allEndings false
set withBasewordOnly true

message "constant words extracted"

;
; Every rule below sets begin / variablePart / ending / baseRule / endings
; and then runs 'extract'. The statements are order-dependent: 'extract'
; uses whatever values were set most recently.
;

; ----------------------------------------------------------------------
; Nouns derived from verbs (-ung, -ungen, -ungs)
; ----------------------------------------------------------------------
set group "nouns, based on verbs"
set counter 0

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "ungen"
set baseRule "-5en"
set endings " -, -2ung, -2ungen,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "ung"
set baseRule "-3en"
set endings " -, -2ung, -2ungen,"
extract

;
; Is deleted again at the end.
; NOTE(review): the corresponding clean-up is not visible in this part of
; the script; presumably it refers to the "-ungs" forms - confirm.
;
set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "ungs"
set baseRule "-4en"
set endings " -, -2ungs, -2ungen,"
extract

; ----------------------------------------------------------------------
; Nouns derived from adjectives (-keit, -keiten, -heit, -keits)
; ----------------------------------------------------------------------
set group "nouns, based on adjectives"

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "keiten"
set baseRule "-6"
set endings " -, -keit, -keiten,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "keit"
set baseRule "-4"
set endings " -, -keit, -keiten,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "heit"
set baseRule "-4"
set endings " -, -heit, -heiten,"
extract

;
; Is deleted again at the end.
; NOTE(review): the corresponding clean-up is not visible in this part of
; the script; presumably it refers to the "-keits" forms - confirm.
;
set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "keits"
set baseRule "-5"
set endings " -, -keits, -keiten,"
extract

; ----------------------------------------------------------------------
; Plain nouns (diminutives, feminine forms, plural / case endings)
; ----------------------------------------------------------------------
set group "nouns"

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "chen"
set baseRule "-4"
set endings " -, -chen,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "innen"
set baseRule "-5"
set endings " -, -in, -innen, -n, -s,"
extract

; "en" is tried twice with different base rules ("-1", then "-2").
set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "en"
set baseRule "-1"
set endings " -, -n,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "en"
set baseRule "-2"
set endings " -, -e, -en, -es, -er, -s,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "rn"
set baseRule "-1"
set endings " -, -n, -s,"
extract

set begin "[ABCDEFGHIJKLMNOPQRSTUVWXYZÄÖÜ]"
set variablePart ""
set ending "es"
set baseRule "-2"
set endings " -, -e, -en, -es, -er, -s,"
extract

; ----------------------------------------------------------------------
; Verbs
; ----------------------------------------------------------------------
set group "verbs"
set counter 0
set maxLineCnt 10

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
;
; All words that end in '[^iuw]e[lr]test'.
;
; Since negated search masks apparently cause problems (the '^' cannot be
; read in directly, and not all exceptions are found), in general only
; positive pattern definitions are used.
;
; The '^' of this one negated class is therefore assembled via '&chr 94'
; (94 is the character code of '^') instead of being written literally.
;
set variablePart "[" &chr 94 "iuw]e[lr]"
set ending "test"
set baseRule "-4n"
set endings " -1e, -1st, -1t, -, -1t, -, -1e, ge-1t, -1te, ge-1t, -, ge-1t, -1e, -1test, -d, -de, -den, -der, -des, an-, ab-, auf-, be-, durch-, ein-, er-, fort-, her-, mit-, um-, unter-, ver-, wider-, wieder-, zer-, zu-, zurück-, zusammen-, über-,"
extract

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart "[bfghiklmnprsuxz]"
set ending "test"
set baseRule "-4en"
set endings " -1, -2st, -2t, -, -2t, -, -1, ge-2t, -2te, ge-2t, -, ge-2t, -1, -2, -2test, -d, -de, -den, -der, -des, an-, ab-, auf-, be-, durch-, ein-, er-, fort-, her-, mit-, um-, unter-, ver-, wider-, wieder-, zer-, zu-, zurück-, zusammen-, über-,"
extract

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart ""
set ending "etest"
set baseRule "-5en"
set endings " -1, -1st, -1t, -, -1t, -, -1, ge-1t, -1te, ge-1t, -, ge-1t, -1, -2, -1test, -d, -de, -den, -der, -des, an-, ab-, auf-, be-, durch-, ein-, er-, fort-, her-, mit-, um-, unter-, ver-, wider-, wieder-, zer-, zu-, zurück-, zusammen-, über-,"
extract

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart ""
set ending "des"
set baseRule "-3"
set endings " -1, -1st, -1t, -, -1t, -, -1, ge-1t, -1te, ge-1t, -, ge-1t, -1, -2, -d, -de, -den, -der, -des, an-, ab-, auf-, be-, durch-, ein-, er-, fort-, her-, mit-, um-, unter-, ver-, wider-, wieder-, zer-, zu-, zurück-, zusammen-, über-,"
extract

; ----------------------------------------------------------------------
; Adjectives (comparative / superlative forms)
; ----------------------------------------------------------------------
set group "adjectives"
set counter 0
set maxLineCnt 10

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart "[chgr]"
set ending "sten"
set baseRule "-4"
set endings " -, -er, -em, -en, -eren, -erer, -eres, -ste, -stem, -sten, -ster, -stes,"
extract

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart "[tdu]"
set ending "esten"
set baseRule "-5"
set endings " -, -er, -em, -en, -eren, -erer, -eres, -este, -estem, -esten, -ester, -estes,"
extract

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart "[gmhsl]"
set ending "ste"
set baseRule "-3"
set endings " -, -er, -em, -en, -eren, -erer, -eres, -ste, -stem, -sten, -ster, -stes,"
extract

set begin "[abcdefghijklmnopqrstuvwxyzäöü]"
set variablePart "[ut]"
set ending "este"
set baseRule "-4"
set endings " -, -er, -em, -en, -eren, -erer, -eres, -este, -estem, -esten, -ester, -estes,"
extract