ctakes-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From spmurph...@apache.org
Subject svn commit: r1423090 - in /incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine: ./ SentenceDetectorAnnotator.xml TokenizerAnnotator.xml
Date Mon, 17 Dec 2012 18:40:18 GMT
Author: spmurphy50
Date: Mon Dec 17 18:40:18 2012
New Revision: 1423090

URL: http://svn.apache.org/viewvc?rev=1423090&view=rev
Log:
CTAKES-101

Added:
    incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/
    incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/SentenceDetectorAnnotator.xml
  (with props)
    incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/TokenizerAnnotator.xml
  (with props)

Added: incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/SentenceDetectorAnnotator.xml
URL: http://svn.apache.org/viewvc/incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/SentenceDetectorAnnotator.xml?rev=1423090&view=auto
==============================================================================
--- incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/SentenceDetectorAnnotator.xml (added)
+++ incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/SentenceDetectorAnnotator.xml Mon Dec 17 18:40:18 2012
@@ -0,0 +1,93 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+
+    Licensed to the Apache Software Foundation (ASF) under one
+    or more contributor license agreements.  See the NOTICE file
+    distributed with this work for additional information
+    regarding copyright ownership.  The ASF licenses this file
+    to you under the Apache License, Version 2.0 (the
+    "License"); you may not use this file except in compliance
+    with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+    Unless required by applicable law or agreed to in writing,
+    software distributed under the License is distributed on an
+    "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+    KIND, either express or implied.  See the License for the
+    specific language governing permissions and limitations
+    under the License.
+
+-->
+<taeDescription xmlns="http://uima.apache.org/resourceSpecifier">
+<frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+<primitive>true</primitive>
+<annotatorImplementationName>org.apache.ctakes.core.ae.SentenceDetector</annotatorImplementationName>
+<analysisEngineMetaData>
+<name>Sentence Detector annotator</name>
+<description>Discovers sentence boundaries.</description>
+<version>2.1</version>
+<vendor>Mayo Clinic</vendor>
+<configurationParameters>
+<configurationParameter>
+<name>SegmentsToSkip</name>
+<type>String</type>
+<multiValued>true</multiValued>
+<mandatory>false</mandatory>
+</configurationParameter>
+</configurationParameters>
+<configurationParameterSettings>
+<nameValuePair>
+<name>SegmentsToSkip</name>
+<value>
+<array/>
+</value>
+</nameValuePair>
+</configurationParameterSettings>
+<typeSystemDescription/>
+<typePriorities/>
+<fsIndexCollection/>
+<capabilities>
+<capability>
+<inputs>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
+</inputs>
+<outputs>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.textspan.Sentence</type>
+</outputs>
+<languagesSupported/>
+</capability>
+</capabilities>
+<operationalProperties>
+<modifiesCas>true</modifiesCas>
+<multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+<outputsNewCASes>false</outputsNewCASes>
+</operationalProperties>
+</analysisEngineMetaData>
+<externalResourceDependencies>
+<externalResourceDependency>
+<key>MaxentModel</key>
+<description></description>
+<interfaceName>org.apache.ctakes.core.resource.MaxentModelResource</interfaceName>
+<optional>false</optional>
+</externalResourceDependency>
+</externalResourceDependencies>
+<resourceManagerConfiguration>
+<externalResources>
+<externalResource>
+<name>MaxentModelFile</name>
+<description></description>
+<fileResourceSpecifier>
+<fileUrl>file:org/apache/ctakes/core/sentdetect/sdmed.mod</fileUrl>
+</fileResourceSpecifier>
+<implementationName>org.apache.ctakes.core.resource.SuffixMaxentModelResourceImpl</implementationName>
+</externalResource>
+</externalResources>
+<externalResourceBindings>
+<externalResourceBinding>
+<key>MaxentModel</key>
+<resourceName>MaxentModelFile</resourceName>
+</externalResourceBinding>
+</externalResourceBindings>
+</resourceManagerConfiguration>
+</taeDescription>

Propchange: incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/SentenceDetectorAnnotator.xml
------------------------------------------------------------------------------
    svn:mime-type = text/plain

Added: incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/TokenizerAnnotator.xml
URL: http://svn.apache.org/viewvc/incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/TokenizerAnnotator.xml?rev=1423090&view=auto
==============================================================================
--- incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/TokenizerAnnotator.xml (added)
+++ incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/TokenizerAnnotator.xml Mon Dec 17 18:40:18 2012
@@ -0,0 +1,76 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+
+    Licensed to the Apache Software Foundation (ASF) under one
+    or more contributor license agreements.  See the NOTICE file
+    distributed with this work for additional information
+    regarding copyright ownership.  The ASF licenses this file
+    to you under the Apache License, Version 2.0 (the
+    "License"); you may not use this file except in compliance
+    with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+    Unless required by applicable law or agreed to in writing,
+    software distributed under the License is distributed on an
+    "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+    KIND, either express or implied.  See the License for the
+    specific language governing permissions and limitations
+    under the License.
+
+-->
+<taeDescription xmlns="http://uima.apache.org/resourceSpecifier">
+<frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+<primitive>true</primitive>
+<annotatorImplementationName>org.apache.ctakes.core.ae.TokenizerAnnotatorPTB</annotatorImplementationName>
+<analysisEngineMetaData>
+<name>TokenizerAnnotatorPTB</name>
+<description>Discovers tokens in the given text, following Penn TreeBank tokenization rules.  These tokens consist of words, punctuation, etc...</description>
+<version>2.3</version>
+<vendor>Mayo Clinic</vendor>
+<configurationParameters>
+<configurationParameter>
+<name>SegmentsToSkip</name>
+<description>Segments to skip.</description>
+<type>String</type>
+<multiValued>true</multiValued>
+<mandatory>false</mandatory>
+</configurationParameter>
+</configurationParameters>
+<configurationParameterSettings>
+<nameValuePair>
+<name>SegmentsToSkip</name>
+<value>
+<array/>
+</value>
+</nameValuePair>
+</configurationParameterSettings>
+<typeSystemDescription>
+<imports>
+<import name="org.apache.ctakes.typesystem.types.TypeSystem"/>
+</imports>
+</typeSystemDescription>
+<typePriorities/>
+<fsIndexCollection/>
+<capabilities>
+<capability>
+<inputs>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.textspan.Segment</type>
+</inputs>
+<outputs>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
+</outputs>
+<languagesSupported/>
+</capability>
+</capabilities>
+<operationalProperties>
+<modifiesCas>true</modifiesCas>
+<multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+<outputsNewCASes>false</outputsNewCASes>
+</operationalProperties>
+</analysisEngineMetaData>
+<externalResourceDependencies>
+</externalResourceDependencies>
+<resourceManagerConfiguration>
+</resourceManagerConfiguration>
+</taeDescription>

Propchange: incubator/ctakes/trunk/ctakes-core/src/main/resources/org/apache/ctakes/core/analysis_engine/TokenizerAnnotator.xml
------------------------------------------------------------------------------
    svn:mime-type = text/plain



Mime
View raw message