Return-Path: X-Original-To: apmail-ctakes-commits-archive@www.apache.org Delivered-To: apmail-ctakes-commits-archive@www.apache.org Received: from mail.apache.org (hermes.apache.org [140.211.11.3]) by minotaur.apache.org (Postfix) with SMTP id 5230D10BD0 for ; Thu, 27 Mar 2014 17:47:40 +0000 (UTC) Received: (qmail 80838 invoked by uid 500); 27 Mar 2014 17:47:38 -0000 Delivered-To: apmail-ctakes-commits-archive@ctakes.apache.org Received: (qmail 79827 invoked by uid 500); 27 Mar 2014 17:47:31 -0000 Mailing-List: contact commits-help@ctakes.apache.org; run by ezmlm Precedence: bulk List-Help: List-Unsubscribe: List-Post: List-Id: Reply-To: dev@ctakes.apache.org Delivered-To: mailing list commits@ctakes.apache.org Received: (qmail 79500 invoked by uid 99); 27 Mar 2014 17:47:28 -0000 Received: from nike.apache.org (HELO nike.apache.org) (192.87.106.230) by apache.org (qpsmtpd/0.29) with ESMTP; Thu, 27 Mar 2014 17:47:28 +0000 X-ASF-Spam-Status: No, hits=-2000.0 required=5.0 tests=ALL_TRUSTED X-Spam-Check-By: apache.org Received: from [140.211.11.4] (HELO eris.apache.org) (140.211.11.4) by apache.org (qpsmtpd/0.29) with ESMTP; Thu, 27 Mar 2014 17:47:26 +0000 Received: from eris.apache.org (localhost [127.0.0.1]) by eris.apache.org (Postfix) with ESMTP id AD27B23889CB; Thu, 27 Mar 2014 17:47:04 +0000 (UTC) Content-Type: text/plain; charset="utf-8" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit Subject: svn commit: r1582425 - /ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/DocTimeRelAnnotator.java Date: Thu, 27 Mar 2014 17:47:04 -0000 To: commits@ctakes.apache.org From: clin@apache.org X-Mailer: svnmailer-1.0.9 Message-Id: <20140327174704.AD27B23889CB@eris.apache.org> X-Virus-Checked: Checked by ClamAV on apache.org Author: clin Date: Thu Mar 27 17:47:04 2014 New Revision: 1582425 URL: http://svn.apache.org/r1582425 Log: Current DocTimeRel annotator with UMLS feature extractor. Modified: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/DocTimeRelAnnotator.java Modified: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/DocTimeRelAnnotator.java URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/DocTimeRelAnnotator.java?rev=1582425&r1=1582424&r2=1582425&view=diff ============================================================================== --- ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/DocTimeRelAnnotator.java (original) +++ ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/DocTimeRelAnnotator.java Thu Mar 27 17:47:04 2014 @@ -19,14 +19,19 @@ package org.apache.ctakes.temporal.ae; import java.io.File; +//import java.io.IOException; import java.util.List; +//import java.util.Map; import org.apache.ctakes.temporal.ae.feature.ClosestVerbExtractor; +//import org.apache.ctakes.temporal.ae.feature.CoveredTextToValuesExtractor; import org.apache.ctakes.temporal.ae.feature.DateAndMeasurementExtractor; import org.apache.ctakes.temporal.ae.feature.EventPropertyExtractor; import org.apache.ctakes.temporal.ae.feature.NearbyVerbTenseXExtractor; import org.apache.ctakes.temporal.ae.feature.SectionHeaderExtractor; import org.apache.ctakes.temporal.ae.feature.TimeXExtractor; +import org.apache.ctakes.temporal.ae.feature.UmlsSingleFeatureExtractor; +//import org.apache.ctakes.temporal.ae.feature.duration.DurationExpectationFeatureExtractor; import org.apache.ctakes.typesystem.type.syntax.BaseToken; import org.apache.ctakes.typesystem.type.textsem.EventMention; import org.apache.uima.UimaContext; @@ -51,6 +56,8 @@ import org.cleartk.classifier.jar.Generi import org.uimafit.factory.AnalysisEngineFactory; import org.uimafit.util.JCasUtil; +//import com.google.common.base.Charsets; + public class DocTimeRelAnnotator extends CleartkAnnotator { public static AnalysisEngineDescription createDataWriterDescription( @@ -83,7 +90,10 @@ public class DocTimeRelAnnotator extends private TimeXExtractor timeXExtractor; private EventPropertyExtractor genericExtractor; private DateAndMeasurementExtractor dateExtractor; - + private UmlsSingleFeatureExtractor umlsExtractor; +// private CoveredTextToValuesExtractor disSemExtractor; +// private DurationExpectationFeatureExtractor durationExtractor; + @Override public void initialize(UimaContext context) throws ResourceInitializationException { super.initialize(context); @@ -102,6 +112,14 @@ public class DocTimeRelAnnotator extends this.timeXExtractor = new TimeXExtractor(); this.genericExtractor = new EventPropertyExtractor(); this.dateExtractor = new DateAndMeasurementExtractor(); + this.umlsExtractor = new UmlsSingleFeatureExtractor(); +// try { +// Map word_disSem = CoveredTextToValuesExtractor.parseTextDoublesMap(new File("src/main/resources/embeddings.size25.txt"), Charsets.UTF_8); +// this.disSemExtractor = new CoveredTextToValuesExtractor("DisSemFeat", word_disSem); +// } catch (IOException e) { +// e.printStackTrace(); +// } +// this.durationExtractor = new DurationExpectationFeatureExtractor(); } @Override @@ -115,6 +133,9 @@ public class DocTimeRelAnnotator extends features.addAll(this.timeXExtractor.extract(jCas, eventMention)); //add the closest time expression types features.addAll(this.genericExtractor.extract(jCas, eventMention)); //add the closest time expression types features.addAll(this.dateExtractor.extract(jCas, eventMention)); //add the closest NE type + features.addAll(this.umlsExtractor.extract(jCas, eventMention)); //add umls features +// features.addAll(this.durationExtractor.extract(jCas, eventMention)); //add duration feature +// features.addAll(this.disSemExtractor.extract(jCas, eventMention)); //add distributional semantic features if (this.isTraining()) { String outcome = eventMention.getEvent().getProperties().getDocTimeRel(); this.dataWriter.write(new Instance(outcome, features));