incubator-ctakes-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From tm...@apache.org
Subject svn commit: r1404798 - /incubator/ctakes/trunk/ctakes-pos-tagger/desc/POSTagger.xml
Date Thu, 01 Nov 2012 22:09:27 GMT
Author: tmill
Date: Thu Nov  1 22:09:26 2012
New Revision: 1404798

URL: http://svn.apache.org/viewvc?rev=1404798&view=rev
Log:
Fix for cTAKES-60.  The subiterator call was failing for single-token sentences because no
type priority was defined.  Added a type priority list that places Sentence above BaseToken.

Modified:
    incubator/ctakes/trunk/ctakes-pos-tagger/desc/POSTagger.xml

Modified: incubator/ctakes/trunk/ctakes-pos-tagger/desc/POSTagger.xml
URL: http://svn.apache.org/viewvc/incubator/ctakes/trunk/ctakes-pos-tagger/desc/POSTagger.xml?rev=1404798&r1=1404797&r2=1404798&view=diff
==============================================================================
--- incubator/ctakes/trunk/ctakes-pos-tagger/desc/POSTagger.xml (original)
+++ incubator/ctakes/trunk/ctakes-pos-tagger/desc/POSTagger.xml Thu Nov  1 22:09:26 2012
@@ -1,98 +1,105 @@
-<?xml version="1.0" encoding="UTF-8"?>
-<!--
-
-    Licensed to the Apache Software Foundation (ASF) under one
-    or more contributor license agreements.  See the NOTICE file
-    distributed with this work for additional information
-    regarding copyright ownership.  The ASF licenses this file
-    to you under the Apache License, Version 2.0 (the
-    "License"); you may not use this file except in compliance
-    with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing,
-    software distributed under the License is distributed on an
-    "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-    KIND, either express or implied.  See the License for the
-    specific language governing permissions and limitations
-    under the License.
-
--->
-<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
-<frameworkImplementation>org.apache.uima.java</frameworkImplementation>
-<primitive>true</primitive>
-<annotatorImplementationName>org.apache.ctakes.postagger.POSTagger</annotatorImplementationName>
-<analysisEngineMetaData>
-<name>POSTagger</name>
-<description></description>
-<version>1.0</version>
-<vendor></vendor>
-<configurationParameters>
-<configurationParameter>
-<name>PosModelFile</name>
-<description>The file that contains the MaxEnt model used by the part of speech (POS) tagger</description>
-<type>String</type>
-<multiValued>false</multiValued>
-<mandatory>true</mandatory>
-</configurationParameter>
-<configurationParameter>
-<name>TagDictionary</name>
-<description>The file contains a list of words, and for each word, the set of part of speech tags to be considered for that word. For words in the tag dictionary, only the corresponding tags in the tag dictionary are considered when tagging the word with a part of speech.</description>
-<type>String</type>
-<multiValued>false</multiValued>
-<mandatory>false</mandatory>
-</configurationParameter>
-<configurationParameter>
-<name>CaseSensitive</name>
-<type>Boolean</type>
-<multiValued>false</multiValued>
-<mandatory>false</mandatory>
-</configurationParameter>
-</configurationParameters>
-<configurationParameterSettings>
-<nameValuePair>
-<name>PosModelFile</name>
-<value>
-<string>org/apache/ctakes/postagger/models/mayo-pos.zip</string>
-</value>
-</nameValuePair>
-<nameValuePair>
-<name>CaseSensitive</name>
-<value>
-<boolean>true</boolean>
-</value>
-</nameValuePair>
-<nameValuePair>
-<name>TagDictionary</name>
-<value>
-<string>org/apache/ctakes/postagger/models/tag.dictionary.txt</string>
-</value>
-</nameValuePair>
-</configurationParameterSettings>
-<typeSystemDescription>
-<imports>
-</imports>
-</typeSystemDescription>
-<typePriorities/>
-<fsIndexCollection/>
-<capabilities>
-<capability>
-<inputs>
-<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.textspan.Sentence</type>
-<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
-</inputs>
-<outputs>
-<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
-</outputs>
-<languagesSupported/>
-</capability>
-</capabilities>
-<operationalProperties>
-<modifiesCas>true</modifiesCas>
-<multipleDeploymentAllowed>true</multipleDeploymentAllowed>
-<outputsNewCASes>false</outputsNewCASes>
-</operationalProperties>
-</analysisEngineMetaData>
-<resourceManagerConfiguration/>
-</analysisEngineDescription>
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+
+    Licensed to the Apache Software Foundation (ASF) under one
+    or more contributor license agreements.  See the NOTICE file
+    distributed with this work for additional information
+    regarding copyright ownership.  The ASF licenses this file
+    to you under the Apache License, Version 2.0 (the
+    "License"); you may not use this file except in compliance
+    with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+    Unless required by applicable law or agreed to in writing,
+    software distributed under the License is distributed on an
+    "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+    KIND, either express or implied.  See the License for the
+    specific language governing permissions and limitations
+    under the License.
+
+-->
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+<frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+<primitive>true</primitive>
+<annotatorImplementationName>org.apache.ctakes.postagger.POSTagger</annotatorImplementationName>
+<analysisEngineMetaData>
+<name>POSTagger</name>
+<description/>
+<version>1.0</version>
+<vendor/>
+<configurationParameters>
+<configurationParameter>
+<name>PosModelFile</name>
+<description>The file that contains the MaxEnt model used by the part of speech (POS) tagger</description>
+<type>String</type>
+<multiValued>false</multiValued>
+<mandatory>true</mandatory>
+</configurationParameter>
+<configurationParameter>
+<name>TagDictionary</name>
+<description>The file contains a list of words, and for each word, the set of part of speech tags to be considered for that word. For words in the tag dictionary, only the corresponding tags in the tag dictionary are considered when tagging the word with a part of speech.</description>
+<type>String</type>
+<multiValued>false</multiValued>
+<mandatory>false</mandatory>
+</configurationParameter>
+<configurationParameter>
+<name>CaseSensitive</name>
+<type>Boolean</type>
+<multiValued>false</multiValued>
+<mandatory>false</mandatory>
+</configurationParameter>
+</configurationParameters>
+<configurationParameterSettings>
+<nameValuePair>
+<name>PosModelFile</name>
+<value>
+<string>org/apache/ctakes/postagger/models/mayo-pos.zip</string>
+</value>
+</nameValuePair>
+<nameValuePair>
+<name>CaseSensitive</name>
+<value>
+<boolean>true</boolean>
+</value>
+</nameValuePair>
+<nameValuePair>
+<name>TagDictionary</name>
+<value>
+<string>org/apache/ctakes/postagger/models/tag.dictionary.txt</string>
+</value>
+</nameValuePair>
+</configurationParameterSettings>
+<typeSystemDescription>
+<imports>
+<import name="org.apache.ctakes.typesystem.types.TypeSystem"/>
+</imports>
+</typeSystemDescription>
+<typePriorities>
+<priorityList>
+<type>org.apache.ctakes.typesystem.type.textspan.Segment</type>
+<type>org.apache.ctakes.typesystem.type.textspan.Sentence</type>
+<type>org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
+</priorityList>
+</typePriorities>
+<fsIndexCollection/>
+<capabilities>
+<capability>
+<inputs>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.textspan.Sentence</type>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
+</inputs>
+<outputs>
+<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.BaseToken</type>
+</outputs>
+<languagesSupported/>
+</capability>
+</capabilities>
+<operationalProperties>
+<modifiesCas>true</modifiesCas>
+<multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+<outputsNewCASes>false</outputsNewCASes>
+</operationalProperties>
+</analysisEngineMetaData>
+<resourceManagerConfiguration/>
+</analysisEngineDescription>



Mime
View raw message