# Alvis-NLPPlatform -- etc/alvis-nlpplatform/nlpplatform-test.rc
# (Listing as displayed on MetaCPAN.)
# definition of the linguistic annotation steps
# Top-level variables. Later entries in this file reference them as $NAME.
# NOTE(review): $HOME is presumably taken from the environment -- confirm
# that the loader enables environment interpolation.
# Scratch directory; reused further down as the YATEAOUTPUT value.
ALVISTMP = $HOME/tmp
# Root of the platform installation; the resource, tool and stylesheet
# paths further down are built from it.
PLATFORM_ROOT = $HOME/Recherche/Projets/ALVIS/Programs/WP5/Platform
# awk interpreter used by the WORDSEG_EN / WORDSEG_FR commands.
AWK = /bin/awk
# Ports, hosts and directories for the document flow around the platform.
# NOTE(review): the per-key descriptions below are inferred from the key
# names -- confirm against the platform documentation.
<alvis_connection>
# Port used for the harvester connection.
HARVESTER_PORT = 6234
# 0/1 flag; presumably enables forwarding to a following pipeline step
# reachable at NEXTSTEP_HOST:NEXTSTEP_PORT.
NEXTSTEP = 0
NEXTSTEP_HOST = localhost
NEXTSTEP_PORT = 7345
# Spool directory (presumably for incoming documents).
SPOOLDIR = $HOME/tmp/spool
# Output directory; presumably used when SAVE_IN_OUTDIR (in <NLP_misc>) is set.
OUTDIR = $HOME/tmp/Outdir
</alvis_connection>
# Address of the NLP server.
# NOTE(review): key meanings are inferred from their names -- confirm.
<NLP_connection>
SERVER = localhost
PORT = 1510
# Presumably the number of connection attempts before giving up.
RETRY_CONNECTION = 10
</NLP_connection>
# Options applied when reading the input XML documents; both are switched
# off (0) in this test configuration.
# NOTE(review): key meanings are inferred from their names -- confirm.
<XML_INPUT>
# Presumably: keep whitespace found in the input as-is.
PRESERVEWHITESPACE = 0
# Presumably: load linguistic annotations already present in the input.
LINGUISTIC_ANNOTATION_LOADING = 0
</XML_INPUT>
# 0/1 switches for the XML output. Every switch is on (1) here except
# NO_STD_XML_OUTPUT.
# NOTE(review): presumably each *_LEVEL key selects whether that annotation
# level is written to the output -- confirm against the consumer.
<XML_OUTPUT>
FORM = 1
ID = 1
TOKEN_LEVEL = 1
SEMANTIC_UNIT_NAMED_ENTITY_LEVEL = 1
WORD_LEVEL = 1
SENTENCE_LEVEL = 1
MORPHOSYNTACTIC_FEATURE_LEVEL = 1
LEMMA_LEVEL = 1
SEMANTIC_UNIT_TERM_LEVEL = 1
SEMANTIC_UNIT_LEVEL = 1
SYNTACTIC_RELATION_LEVEL = 1
NO_STD_XML_OUTPUT = 0
YATEA = 1
</XML_OUTPUT>
# 0/1 switches, one per linguistic annotation step.
# In this test configuration only ENABLE_TOKEN is set to 1; every other
# step is set to 0.
<linguistic_annotation>
ENABLE_TOKEN = 1
ENABLE_NER = 0
ENABLE_WORD = 0
ENABLE_SENTENCE = 0
ENABLE_POS = 0
ENABLE_LEMMA = 0
ENABLE_TERM_TAG = 0
ENABLE_SYNTAX = 0
</linguistic_annotation>
<NLP_misc>
NLP_resources = $PLATFORM_ROOT/res
SAVE_IN_OUTDIR = 1
TERM_LIST_EN = $NLP_resources/terms.txt.sav
TERM_LIST_FR = $NLP_resources/terms_FR.txt
# valid tags for each language
<POSTAG_LIST>
<EN>
CC = 1
CD = 1
DT = 1
EX = 1
FW = 1
IN = 1
JJ = 1
JJR = 1
JJS = 1
LS = 1
MD = 1
NN = 1
NNS = 1
NP = 1
NPS = 1
PDT = 1
POS = 1
PP = 1
PP$ = 1
RB = 1
RBR = 1
RBS = 1
RP = 1
SYM = 1
TO = 1
UH = 1
VB = 1
VBD = 1
VBG = 1
VBN = 1
VBP = 1
VBZ = 1
VV = 1
VVD = 1
VVG = 1
VVN = 1
VVP = 1
VVZ = 1
WDT = 1
WP = 1
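# [MetaCPAN listing break: etc/alvis-nlpplatform/nlpplatform-test.rc]
# NOTE: lines between "WP = 1" and "<FR>" are not shown in this listing;
# the <EN> block opened above has no visible closing </EN> tag here.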
# Valid part-of-speech tags for French, one entry per tag.
# Most tags carry the value 1; PUN, PUN:cit and SENT carry 2.
# NOTE(review): the value 2 presumably marks punctuation / sentence-boundary
# tags as distinct from word tags -- confirm against the code that reads
# POSTAG_LIST.
<FR>
ABR = 1
ADJ = 1
ADV = 1
DET:ART = 1
DET:POS = 1
INT = 1
KON = 1
NAM = 1
NOM = 1
NUM = 1
PRO = 1
PRO:DEM = 1
PRO:IND = 1
PRO:PER = 1
PRO:POS = 1
PRO:REL = 1
PRP = 1
PRP:det = 1
PUN = 2
PUN:cit = 2
SENT = 2
SYM = 1
VER:cond = 1
VER:futu = 1
VER:impe = 1
VER:impf = 1
VER:infi = 1
VER:pper = 1
VER:ppre = 1
VER:pres = 1
VER:simp = 1
VER:subi = 1
VER:subp = 1
</FR>
</POSTAG_LIST>
</NLP_misc>
# Directory holding the external NLP tools; every command below is built
# from it.
NLP_tools_root = $PLATFORM_ROOT/tools
# Command lines (or paths) of the external tools, suffixed by language
# (_EN / _FR). An empty string means no command is configured for that entry.
<NLP_tools>
# Named-entity tagging commands (TagEN).
NETAG_EN = "$NLP_tools_root/TagEN/tagen -t :bio"
NETAG_FR = "$NLP_tools_root/TagEN/tagen -t :equer"
# Word segmentation: awk scripts run with the interpreter set in $AWK.
WORDSEG_EN = "$AWK -f $NLP_tools_root/WordSeg/words-en.awk"
# Disabled alternative for English word segmentation:
# WORDSEG_EN = "$NLP_tools_root/WordSeg/sentences.pl"
WORDSEG_FR = "$AWK -f $NLP_tools_root/WordSeg/words-fr.awk"
# Part-of-speech tagging commands (TreeTagger with the language parameter file).
POSTAG_EN = "$NLP_tools_root/TreeTagger/bin/tree-tagger $NLP_tools_root/TreeTagger/lib/english.par -token -lemma -sgml -no-unknown"
# Disabled alternative for English POS tagging (geniatagger pipeline):
#POSTAG_EN = "(cd $NLP_tools_root/geniatagger-2.0.1; sed 's/ /___/g' | tr '\n' ' '| ./geniatagger -nt | cut -f 1,2,3|sed 's/\([^\t]*\t\)\([^\t]*\)\t\([^\t]*\)/\1\3\t\2/g' | sed 's/___/ /g' | grep -v '^$')"
POSTAG_FR = "$NLP_tools_root/TreeTagger/bin/tree-tagger $NLP_tools_root/TreeTagger/lib/french.par -token -lemma -sgml -no-unknown"
# Syntactic parser directory. The active English value points at biolg;
# the link-4.1b path is kept as a disabled alternative.
# SYNTACTIC_PATH_EN = "$NLP_tools_root/link-4.1b"
SYNTACTIC_PATH_EN = "$NLP_tools_root/biolgForAlvis/biolg-1.1.7b"
SYNTACTIC_PATH_FR = ""
# Parser command: changes into the parser directory, then runs `parse`.
# The active variant adds the -xmlin option.
# SYNTACTIC_ANALYSIS_EN = "cd $SYNTACTIC_PATH_EN ; $SYNTACTIC_PATH_EN/parse"
SYNTACTIC_ANALYSIS_EN = "cd $SYNTACTIC_PATH_EN ; $SYNTACTIC_PATH_EN/parse -xmlin"
SYNTACTIC_ANALYSIS_FR = ""
# Term tagging commands: none configured.
TERM_TAG_FR = ""
TERM_TAG_EN = ""
# YaTeA settings: path of its rc file, and its output location (the
# directory set in $ALVISTMP).
YATEARC = "/etc/yatea/yatea-devTH.rc"
YATEAOUTPUT = "$ALVISTMP"
</NLP_tools>
# Maps a MIME type (key) to the external command used to convert documents
# of that type (value).
# NOTE(review): an empty value presumably means no conversion is needed, and
# a trailing "<" presumably means the input file is fed to the command on
# stdin -- confirm against the code that runs the converters.
# NOTE(review): the commented-out entries using ";" separators look like an
# older entry format kept for reference -- confirm before removing.
<CONVERTERS>
text/plain = text2xhtml <
text/html =
www/unknown =
#text/plain ; ; GuessText
text/x-tex = tth -g -w1 -r <
application/x-tex = tth -g -w1 -r <
#text/x-tex ; untex -a -e -giso ; TeXText
#application/x-tex ; untex -a -e -giso ; TeXText
#text/x-tex ; ; TeX
#application/x-tex ; ; TeX
application/pdf = pdftohtml -i -noframes -nomerge -stdout
#application/pdf ; pstotext ; Text
application/postscript = pstotext
application/msword = antiword -t
application/vnd.ms-excel = xlhtml -fw
application/vnd.ms-powerpoint = ppthtml
application/powerpoint = ppthtml
application/rtf = unrtf --nopict --html
# image/gif ; ; Image
# image/jpeg ; ; Image
# image/tiff ; ; Image
application/xml =
# XSLT command per stylesheet name; only "default" is defined.
<STYLESHEET>
default = xsltproc $PLATFORM_ROOT/etc/alvis-nlpplatform/xsl/Default.xsl
</STYLESHEET>
# Supplementary magic file (TeX).
# NOTE(review): this path is under .../WP5/CPAN/..., not under $PLATFORM_ROOT
# (.../WP5/Platform) -- confirm that this is intended.
SupplMagicFile = "$HOME/Recherche/Projets/ALVIS/Programs/WP5/CPAN/Alvis-NLPPlatform/etc/alvis-nlpplatform/mime/magic.TeX"
# 0/1 flag; presumably controls whether the original input files are kept.
StoreInputFiles = 0
</CONVERTERS>
# ( run in 1.147 second using v1.01-cache-2.11-cpan-98e64b0badf )