incubator-connectors-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From kwri...@apache.org
Subject svn commit: r1139294 - in /incubator/lcf/trunk/framework: agents/src/main/java/org/apache/manifoldcf/agents/incrementalingest/ agents/src/main/java/org/apache/manifoldcf/agents/interfaces/ agents/src/main/java/org/apache/manifoldcf/agents/output/ pull-...
Date Fri, 24 Jun 2011 13:18:03 GMT
Author: kwright
Date: Fri Jun 24 13:18:03 2011
New Revision: 1139294

URL: http://svn.apache.org/viewvc?rev=1139294&view=rev
Log:
Add infrastructure necessary to make output connectors more capable of filtering documents
using a wide variety of criteria.  Part of CONNECTORS-214.

Modified:
    incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/incrementalingest/IncrementalIngester.java
    incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IIncrementalIngester.java
    incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IOutputConnector.java
    incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/output/BaseOutputConnector.java
    incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/interfaces/IFingerprintActivity.java
    incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/system/WorkerThread.java

Modified: incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/incrementalingest/IncrementalIngester.java
URL: http://svn.apache.org/viewvc/incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/incrementalingest/IncrementalIngester.java?rev=1139294&r1=1139293&r2=1139294&view=diff
==============================================================================
--- incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/incrementalingest/IncrementalIngester.java
(original)
+++ incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/incrementalingest/IncrementalIngester.java
Fri Jun 24 13:18:03 2011
@@ -178,10 +178,11 @@ public class IncrementalIngester extends
 
   /** Check if a mime type is indexable.
   *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
   *@param mimeType is the mime type to check.
   *@return true if the mimeType is indexable.
   */
-  public boolean checkMimeTypeIndexable(String outputConnectionName, String mimeType)
+  public boolean checkMimeTypeIndexable(String outputConnectionName, String outputDescription, String mimeType)
     throws ManifoldCFException, ServiceInterruption
   {
     IOutputConnection connection = connectionManager.load(outputConnectionName);
@@ -191,7 +192,7 @@ public class IncrementalIngester extends
       throw new ServiceInterruption("Output connector not installed",0L);
     try
     {
-      return connector.checkMimeTypeIndexable(mimeType);
+      return connector.checkMimeTypeIndexable(outputDescription,mimeType);
     }
     finally
     {
@@ -201,10 +202,11 @@ public class IncrementalIngester extends
 
   /** Check if a file is indexable.
   *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
   *@param localFile is the local file to check.
   *@return true if the local file is indexable.
   */
-  public boolean checkDocumentIndexable(String outputConnectionName, File localFile)
+  public boolean checkDocumentIndexable(String outputConnectionName, String outputDescription, File localFile)
     throws ManifoldCFException, ServiceInterruption
   {
     IOutputConnection connection = connectionManager.load(outputConnectionName);
@@ -214,7 +216,57 @@ public class IncrementalIngester extends
       throw new ServiceInterruption("Output connector not installed",0L);
     try
     {
-      return connector.checkDocumentIndexable(localFile);
+      return connector.checkDocumentIndexable(outputDescription,localFile);
+    }
+    finally
+    {
+      OutputConnectorFactory.release(connector);
+    }
+  }
+
+  /** Pre-determine whether a document's length is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are too long to be indexable.
+  *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
+  *@param length is the length of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkLengthIndexable(String outputConnectionName, String outputDescription, long length)
+    throws ManifoldCFException, ServiceInterruption
+  {
+    IOutputConnection connection = connectionManager.load(outputConnectionName);
+    IOutputConnector connector = OutputConnectorFactory.grab(threadContext,connection.getClassName(),connection.getConfigParams(),connection.getMaxConnections());
+    if (connector == null)
+      // The connector is not installed; treat this as a service interruption.
+      throw new ServiceInterruption("Output connector not installed",0L);
+    try
+    {
+      return connector.checkLengthIndexable(outputDescription,length);
+    }
+    finally
+    {
+      OutputConnectorFactory.release(connector);
+    }
+  }
+
+  /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are not indexable.
+  *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
+  *@param url is the url of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkURLIndexable(String outputConnectionName, String outputDescription, String url)
+    throws ManifoldCFException, ServiceInterruption
+  {
+    IOutputConnection connection = connectionManager.load(outputConnectionName);
+    IOutputConnector connector = OutputConnectorFactory.grab(threadContext,connection.getClassName(),connection.getConfigParams(),connection.getMaxConnections());
+    if (connector == null)
+      // The connector is not installed; treat this as a service interruption.
+      throw new ServiceInterruption("Output connector not installed",0L);
+    try
+    {
+      return connector.checkURLIndexable(outputDescription,url);
     }
     finally
     {

Modified: incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IIncrementalIngester.java
URL: http://svn.apache.org/viewvc/incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IIncrementalIngester.java?rev=1139294&r1=1139293&r2=1139294&view=diff
==============================================================================
--- incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IIncrementalIngester.java
(original)
+++ incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IIncrementalIngester.java
Fri Jun 24 13:18:03 2011
@@ -58,30 +58,53 @@ public interface IIncrementalIngester
   public void clearAll()
     throws ManifoldCFException;
 
+
+  /** Get an output version string for a document.
+  *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param spec is the output specification.
+  *@return the description string.
+  */
+  public String getOutputDescription(String outputConnectionName, OutputSpecification spec)
+    throws ManifoldCFException, ServiceInterruption;
+
   /** Check if a mime type is indexable.
   *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
   *@param mimeType is the mime type to check.
   *@return true if the mimeType is indexable.
   */
-  public boolean checkMimeTypeIndexable(String outputConnectionName, String mimeType)
+  public boolean checkMimeTypeIndexable(String outputConnectionName, String outputDescription, String mimeType)
     throws ManifoldCFException, ServiceInterruption;
 
   /** Check if a file is indexable.
   *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
   *@param localFile is the local file to check.
   *@return true if the local file is indexable.
   */
-  public boolean checkDocumentIndexable(String outputConnectionName, File localFile)
+  public boolean checkDocumentIndexable(String outputConnectionName, String outputDescription, File localFile)
     throws ManifoldCFException, ServiceInterruption;
 
-  /** Get an output version string for a document.
+  /** Pre-determine whether a document's length is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are too long to be indexable.
   *@param outputConnectionName is the name of the output connection associated with this
action.
-  *@param spec is the output specification.
-  *@return the description string.
+  *@param outputDescription is the output description string.
+  *@param length is the length of the document.
+  *@return true if the file is indexable.
   */
-  public String getOutputDescription(String outputConnectionName, OutputSpecification spec)
+  public boolean checkLengthIndexable(String outputConnectionName, String outputDescription, long length)
     throws ManifoldCFException, ServiceInterruption;
-    
+
+  /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are not indexable.
+  *@param outputConnectionName is the name of the output connection associated with this
action.
+  *@param outputDescription is the output description string.
+  *@param url is the url of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkURLIndexable(String outputConnectionName, String outputDescription, String url)
+    throws ManifoldCFException, ServiceInterruption;
+
   /** Record a document version, but don't ingest it.
   * The purpose of this method is to keep track of the frequency at which ingestion "attempts"
take place.
   * ServiceInterruption is thrown if this action must be rescheduled.

Modified: incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IOutputConnector.java
URL: http://svn.apache.org/viewvc/incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IOutputConnector.java?rev=1139294&r1=1139293&r2=1139294&view=diff
==============================================================================
--- incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IOutputConnector.java
(original)
+++ incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/interfaces/IOutputConnector.java
Fri Jun 24 13:18:03 2011
@@ -73,35 +73,56 @@ public interface IOutputConnector extend
   public boolean requestInfo(Configuration output, String command)
     throws ManifoldCFException;
     
+    
+  /** Get an output version string, given an output specification.  The output version string
is used to uniquely describe the pertinent details of
+  * the output specification and the configuration, to allow the Connector Framework to determine
whether a document will need to be output again.
+  * Note that the contents of the document cannot be considered by this method, and that
a different version string (defined in IRepositoryConnector)
+  * is used to describe the version of the actual document.
+  *
+  * This method presumes that the connector object has been configured, and it is thus able
to communicate with the output data store should that be
+  * necessary.
+  *@param spec is the current output specification for the job that is doing the crawling.
+  *@return a string, of unlimited length, which uniquely describes output configuration and
specification in such a way that if two such strings are equal,
+  * the document will not need to be sent again to the output data store.
+  */
+  public String getOutputDescription(OutputSpecification spec)
+    throws ManifoldCFException, ServiceInterruption;
+
   /** Detect if a mime type is indexable or not.  This method is used by participating repository
connectors to pre-filter the number of
   * unusable documents that will be passed to this output connector.
+  *@param outputDescription is the document's output version.
   *@param mimeType is the mime type of the document.
   *@return true if the mime type is indexable by this connector.
   */
-  public boolean checkMimeTypeIndexable(String mimeType)
+  public boolean checkMimeTypeIndexable(String outputDescription, String mimeType)
     throws ManifoldCFException, ServiceInterruption;
 
   /** Pre-determine whether a document (passed here as a File object) is indexable by this
connector.  This method is used by participating
   * repository connectors to help reduce the number of unmanageable documents that are passed
to this output connector in advance of an
   * actual transfer.  This hook is provided mainly to support search engines that only handle
a small set of accepted file types.
+  *@param outputDescription is the document's output version.
   *@param localFile is the local file to check.
   *@return true if the file is indexable.
   */
-  public boolean checkDocumentIndexable(File localFile)
+  public boolean checkDocumentIndexable(String outputDescription, File localFile)
     throws ManifoldCFException, ServiceInterruption;
 
-  /** Get an output version string, given an output specification.  The output version string
is used to uniquely describe the pertinent details of
-  * the output specification and the configuration, to allow the Connector Framework to determine
whether a document will need to be output again.
-  * Note that the contents of the document cannot be considered by this method, and that
a different version string (defined in IRepositoryConnector)
-  * is used to describe the version of the actual document.
-  *
-  * This method presumes that the connector object has been configured, and it is thus able
to communicate with the output data store should that be
-  * necessary.
-  *@param spec is the current output specification for the job that is doing the crawling.
-  *@return a string, of unlimited length, which uniquely describes output configuration and
specification in such a way that if two such strings are equal,
-  * the document will not need to be sent again to the output data store.
+  /** Pre-determine whether a document's length is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are too long to be indexable.
+  *@param outputDescription is the document's output version.
+  *@param length is the length of the document.
+  *@return true if the file is indexable.
   */
-  public String getOutputDescription(OutputSpecification spec)
+  public boolean checkLengthIndexable(String outputDescription, long length)
+    throws ManifoldCFException, ServiceInterruption;
+
+  /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are not worth indexing.
+  *@param outputDescription is the document's output version.
+  *@param url is the URL of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkURLIndexable(String outputDescription, String url)
     throws ManifoldCFException, ServiceInterruption;
 
   /** Add (or replace) a document in the output data store using the connector.

Modified: incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/output/BaseOutputConnector.java
URL: http://svn.apache.org/viewvc/incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/output/BaseOutputConnector.java?rev=1139294&r1=1139293&r2=1139294&view=diff
==============================================================================
--- incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/output/BaseOutputConnector.java
(original)
+++ incubator/lcf/trunk/framework/agents/src/main/java/org/apache/manifoldcf/agents/output/BaseOutputConnector.java
Fri Jun 24 13:18:03 2011
@@ -80,6 +80,18 @@ public abstract class BaseOutputConnecto
 
   /** Detect if a mime type is indexable or not.  This method is used by participating repository
connectors to pre-filter the number of
   * unusable documents that will be passed to this output connector.
+  *@param outputDescription is the document's output version.
+  *@param mimeType is the mime type of the document.
+  *@return true if the mime type is indexable by this connector.
+  */
+  public boolean checkMimeTypeIndexable(String outputDescription, String mimeType)
+    throws ManifoldCFException, ServiceInterruption
+  {
+    return checkMimeTypeIndexable(mimeType);
+  }
+
+  /** Detect if a mime type is indexable or not.  This method is used by participating repository
connectors to pre-filter the number of
+  * unusable documents that will be passed to this output connector.
   *@param mimeType is the mime type of the document.
   *@return true if the mime type is indexable by this connector.
   */
@@ -92,6 +104,19 @@ public abstract class BaseOutputConnecto
   /** Pre-determine whether a document (passed here as a File object) is indexable by this
connector.  This method is used by participating
   * repository connectors to help reduce the number of unmanageable documents that are passed
to this output connector in advance of an
   * actual transfer.  This hook is provided mainly to support search engines that only handle
a small set of accepted file types.
+  *@param outputDescription is the document's output version.
+  *@param localFile is the local file to check.
+  *@return true if the file is indexable.
+  */
+  public boolean checkDocumentIndexable(String outputDescription, File localFile)
+    throws ManifoldCFException, ServiceInterruption
+  {
+    return checkDocumentIndexable(localFile);
+  }
+
+  /** Pre-determine whether a document (passed here as a File object) is indexable by this
connector.  This method is used by participating
+  * repository connectors to help reduce the number of unmanageable documents that are passed
to this output connector in advance of an
+  * actual transfer.  This hook is provided mainly to support search engines that only handle
a small set of accepted file types.
   *@param localFile is the local file to check.
   *@return true if the file is indexable.
   */
@@ -101,6 +126,30 @@ public abstract class BaseOutputConnecto
     return true;
   }
 
+  /** Pre-determine whether a document's length is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are too long to be indexable.
+  *@param outputDescription is the document's output version.
+  *@param length is the length of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkLengthIndexable(String outputDescription, long length)
+    throws ManifoldCFException, ServiceInterruption
+  {
+    return true;
+  }
+
+  /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are not worth indexing.
+  *@param outputDescription is the document's output version.
+  *@param url is the URL of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkURLIndexable(String outputDescription, String url)
+    throws ManifoldCFException, ServiceInterruption
+  {
+    return true;
+  }
+
   /** Get an output version string, given an output specification.  The output version string
is used to uniquely describe the pertinent details of
   * the output specification and the configuration, to allow the Connector Framework to determine
whether a document will need to be output again.
   * Note that the contents of the document cannot be considered by this method, and that
a different version string (defined in IRepositoryConnector)

Modified: incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/interfaces/IFingerprintActivity.java
URL: http://svn.apache.org/viewvc/incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/interfaces/IFingerprintActivity.java?rev=1139294&r1=1139293&r2=1139294&view=diff
==============================================================================
--- incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/interfaces/IFingerprintActivity.java
(original)
+++ incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/interfaces/IFingerprintActivity.java
Fri Jun 24 13:18:03 2011
@@ -43,4 +43,19 @@ public interface IFingerprintActivity
   public boolean checkDocumentIndexable(File localFile)
     throws ManifoldCFException, ServiceInterruption;
 
+  /** Check whether a document of a specific length is indexable by the currently specified
output connector.
+  *@param length is the document length.
+  *@return true if the document is indexable.
+  */
+  public boolean checkLengthIndexable(long length)
+    throws ManifoldCFException, ServiceInterruption;
+
+  /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+  * to help filter out documents that are not worth indexing.
+  *@param url is the URL of the document.
+  *@return true if the file is indexable.
+  */
+  public boolean checkURLIndexable(String url)
+    throws ManifoldCFException, ServiceInterruption;
+
 }

Modified: incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/system/WorkerThread.java
URL: http://svn.apache.org/viewvc/incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/system/WorkerThread.java?rev=1139294&r1=1139293&r2=1139294&view=diff
==============================================================================
--- incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/system/WorkerThread.java
(original)
+++ incubator/lcf/trunk/framework/pull-agent/src/main/java/org/apache/manifoldcf/crawler/system/WorkerThread.java
Fri Jun 24 13:18:03 2011
@@ -307,7 +307,7 @@ public class WorkerThread extends Thread
                       
                       HashMap abortSet = new HashMap();
                       ProcessActivity activity;
-                      VersionActivity versionActivity = new VersionActivity(connectionName,connMgr,jobManager,job,ingester,abortSet);
+                      VersionActivity versionActivity = new VersionActivity(connectionName,connMgr,jobManager,job,ingester,abortSet,outputVersion);
 
                       String aclAuthority = connection.getACLAuthority();
                       boolean isDefaultAuthority = (aclAuthority == null || aclAuthority.length() == 0);
@@ -1119,11 +1119,13 @@ public class WorkerThread extends Thread
     protected IJobDescription job;
     protected IIncrementalIngester ingester;
     protected HashMap abortSet;
+    protected String outputVersion;
 
     /** Constructor.
     */
     public VersionActivity(String connectionName, IRepositoryConnectionManager connMgr,
-      IJobManager jobManager, IJobDescription job, IIncrementalIngester ingester, HashMap abortSet)
+      IJobManager jobManager, IJobDescription job, IIncrementalIngester ingester, HashMap abortSet,
+      String outputVersion)
     {
       this.connectionName = connectionName;
       this.connMgr = connMgr;
@@ -1131,6 +1133,7 @@ public class WorkerThread extends Thread
       this.job = job;
       this.ingester = ingester;
       this.abortSet = abortSet;
+      this.outputVersion = outputVersion;
     }
 
     /** Check whether a mime type is indexable by the currently specified output connector.
@@ -1140,7 +1143,7 @@ public class WorkerThread extends Thread
     public boolean checkMimeTypeIndexable(String mimeType)
       throws ManifoldCFException, ServiceInterruption
     {
-      return ingester.checkMimeTypeIndexable(job.getOutputConnectionName(),mimeType);
+      return ingester.checkMimeTypeIndexable(job.getOutputConnectionName(),outputVersion,mimeType);
     }
 
     /** Check whether a document is indexable by the currently specified output connector.
@@ -1150,7 +1153,28 @@ public class WorkerThread extends Thread
     public boolean checkDocumentIndexable(File localFile)
       throws ManifoldCFException, ServiceInterruption
     {
-      return ingester.checkDocumentIndexable(job.getOutputConnectionName(),localFile);
+      return ingester.checkDocumentIndexable(job.getOutputConnectionName(),outputVersion,localFile);
+    }
+
+    /** Check whether a document of a specified length is indexable by the currently specified
output connector.
+    *@param length is the length to check.
+    *@return true if the document is indexable.
+    */
+    public boolean checkLengthIndexable(long length)
+      throws ManifoldCFException, ServiceInterruption
+    {
+      return ingester.checkLengthIndexable(job.getOutputConnectionName(),outputVersion,length);
+    }
+
+    /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+    * to help filter out documents that are not worth indexing.
+    *@param url is the URL of the document.
+    *@return true if the file is indexable.
+    */
+    public boolean checkURLIndexable(String url)
+      throws ManifoldCFException, ServiceInterruption
+    {
+      return ingester.checkURLIndexable(job.getOutputConnectionName(),outputVersion,url);
     }
 
     /** Record time-stamped information about the activity of the connector.
@@ -1902,7 +1926,7 @@ public class WorkerThread extends Thread
     public boolean checkMimeTypeIndexable(String mimeType)
       throws ManifoldCFException, ServiceInterruption
     {
-      return ingester.checkMimeTypeIndexable(job.getOutputConnectionName(),mimeType);
+      return ingester.checkMimeTypeIndexable(job.getOutputConnectionName(),outputVersion,mimeType);
     }
 
     /** Check whether a document is indexable by the currently specified output connector.
@@ -1912,7 +1936,28 @@ public class WorkerThread extends Thread
     public boolean checkDocumentIndexable(File localFile)
       throws ManifoldCFException, ServiceInterruption
     {
-      return ingester.checkDocumentIndexable(job.getOutputConnectionName(),localFile);
+      return ingester.checkDocumentIndexable(job.getOutputConnectionName(),outputVersion,localFile);
+    }
+
+    /** Check whether a document of a specified length is indexable by the currently specified
output connector.
+    *@param length is the length to check.
+    *@return true if the document is indexable.
+    */
+    public boolean checkLengthIndexable(long length)
+      throws ManifoldCFException, ServiceInterruption
+    {
+      return ingester.checkLengthIndexable(job.getOutputConnectionName(),outputVersion,length);
+    }
+
+    /** Pre-determine whether a document's URL is indexable by this connector.  This method
is used by participating repository connectors
+    * to help filter out documents that are not worth indexing.
+    *@param url is the URL of the document.
+    *@return true if the file is indexable.
+    */
+    public boolean checkURLIndexable(String url)
+      throws ManifoldCFException, ServiceInterruption
+    {
+      return ingester.checkURLIndexable(job.getOutputConnectionName(),outputVersion,url);
     }
 
     /** Create a global string from a simple string.



Mime
View raw message