Return-Path: X-Original-To: archive-asf-public-internal@cust-asf2.ponee.io Delivered-To: archive-asf-public-internal@cust-asf2.ponee.io Received: from cust-asf.ponee.io (cust-asf.ponee.io [163.172.22.183]) by cust-asf2.ponee.io (Postfix) with ESMTP id 0BDCF200B25 for ; Wed, 8 Jun 2016 23:59:02 +0200 (CEST) Received: by cust-asf.ponee.io (Postfix) id 05820160A2E; Wed, 8 Jun 2016 21:59:02 +0000 (UTC) Delivered-To: archive-asf-public@cust-asf.ponee.io Received: from mail.apache.org (hermes.apache.org [140.211.11.3]) by cust-asf.ponee.io (Postfix) with SMTP id 23C51160A0E for ; Wed, 8 Jun 2016 23:59:00 +0200 (CEST) Received: (qmail 37818 invoked by uid 500); 8 Jun 2016 21:59:00 -0000 Mailing-List: contact dev-help@apex.apache.org; run by ezmlm Precedence: bulk List-Help: List-Unsubscribe: List-Post: List-Id: Reply-To: dev@apex.apache.org Delivered-To: mailing list dev@apex.apache.org Received: (qmail 37804 invoked by uid 99); 8 Jun 2016 21:59:00 -0000 Received: from pnap-us-west-generic-nat.apache.org (HELO spamd3-us-west.apache.org) (209.188.14.142) by apache.org (qpsmtpd/0.29) with ESMTP; Wed, 08 Jun 2016 21:59:00 +0000 Received: from localhost (localhost [127.0.0.1]) by spamd3-us-west.apache.org (ASF Mail Server at spamd3-us-west.apache.org) with ESMTP id A30DA1805A8 for ; Wed, 8 Jun 2016 21:58:59 +0000 (UTC) X-Virus-Scanned: Debian amavisd-new at spamd3-us-west.apache.org X-Spam-Flag: NO X-Spam-Score: -5.446 X-Spam-Level: X-Spam-Status: No, score=-5.446 tagged_above=-999 required=6.31 tests=[KAM_LAZY_DOMAIN_SECURITY=1, RCVD_IN_DNSWL_HI=-5, RCVD_IN_MSPIKE_H3=-0.01, RCVD_IN_MSPIKE_WL=-0.01, RP_MATCHES_RCVD=-1.426] autolearn=disabled Received: from mx1-lw-eu.apache.org ([10.40.0.8]) by localhost (spamd3-us-west.apache.org [10.40.0.10]) (amavisd-new, port 10024) with ESMTP id igEywh9P5T0W for ; Wed, 8 Jun 2016 21:58:58 +0000 (UTC) Received: from mail.apache.org (hermes.apache.org [140.211.11.3]) by mx1-lw-eu.apache.org (ASF Mail Server at mx1-lw-eu.apache.org) with 
SMTP id 471A45F23E for ; Wed, 8 Jun 2016 21:58:57 +0000 (UTC) Received: (qmail 37795 invoked by uid 99); 8 Jun 2016 21:58:56 -0000 Received: from git1-us-west.apache.org (HELO git1-us-west.apache.org) (140.211.11.23) by apache.org (qpsmtpd/0.29) with ESMTP; Wed, 08 Jun 2016 21:58:56 +0000 Received: by git1-us-west.apache.org (ASF Mail Server at git1-us-west.apache.org, from userid 33) id 6A96DE00A7; Wed, 8 Jun 2016 21:58:56 +0000 (UTC) From: brennonyork To: dev@apex.incubator.apache.org Reply-To: dev@apex.incubator.apache.org References: In-Reply-To: Subject: [GitHub] apex-malhar pull request #315: [APEXMALHAR-2102] Support clone partitioner Content-Type: text/plain Message-Id: <20160608215856.6A96DE00A7@git1-us-west.apache.org> Date: Wed, 8 Jun 2016 21:58:56 +0000 (UTC) archived-at: Wed, 08 Jun 2016 21:59:02 -0000 Github user brennonyork commented on a diff in the pull request: https://github.com/apache/apex-malhar/pull/315#discussion_r66348405 --- Diff: library/src/main/java/com/datatorrent/lib/partitioner/ClonePartitioner.java --- @@ -0,0 +1,143 @@ +/** + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. 
+ */ +package com.datatorrent.lib.partitioner; + +import java.io.Serializable; +import java.util.ArrayList; +import java.util.Collection; +import java.util.List; +import java.util.Map; +import java.util.Set; + +import javax.validation.constraints.Min; + +import org.slf4j.Logger; +import org.slf4j.LoggerFactory; + +import com.google.common.collect.Lists; +import com.google.common.collect.Sets; + +import com.datatorrent.api.DefaultPartition; +import com.datatorrent.api.Operator; +import com.datatorrent.api.Operator.InputPort; +import com.datatorrent.api.Partitioner; + +/** + * This is a simple partitioner, which replicates data across all partitions of an operator. + * + * @param The type of the operator + * @since 2.0.0 + */ +public class ClonePartitioner implements Partitioner, Serializable +{ + private static final Logger logger = LoggerFactory.getLogger(ClonePartitioner.class); + + private static final long serialVersionUID = 201462371710L; + /** + * The number of partitions for the default partitioner to create. + */ + @Min(1) + private int partitionCount = 1; + + /** + * This creates a partitioner which creates only one partition. + */ + public ClonePartitioner() + { + } + + /** + * This constructor is used to create the partitioner from a property. + * @param value A string which is an integer of the number of partitions to create + */ + public ClonePartitioner(String value) + { + this(Integer.parseInt(value)); + } + + /** + * This creates a partitioner which creates partitonCount partitions. + * @param partitionCount The number of partitions to create. + */ + public ClonePartitioner(int partitionCount) + { + this.partitionCount = partitionCount; + } + + /** + * This method sets the number of partitions for the ClonePartitioner to create. + * @param partitionCount The number of partitions to create. 
+ */ + public void setPartitionCount(int partitionCount) + { + this.partitionCount = partitionCount; + } + + /** + * This method gets the number of partitions for the ClonePartitioner to create. + * @return The number of partitions to create. + */ + public int getPartitionCount() + { + return partitionCount; + } + + @Override + public Collection> definePartitions(Collection> partitions, PartitioningContext context) + { + final int newPartitionCount = DefaultPartition.getRequiredPartitionCount(context, this.partitionCount); + logger.debug("define partitions, partitionCount current {} requested {}", partitions.size(), newPartitionCount); + + //Get a partition + DefaultPartition partition = (DefaultPartition)partitions.iterator().next(); + ArrayList> newPartitions; + + // first call to define partitions + newPartitions = Lists.newArrayList(); + + Set partSet = Sets.newHashSet(); + + // Add as many partitions as we wish to have + for (int partitionCounter = 0; partitionCounter < newPartitionCount; partitionCounter++) { + DefaultPartition partitionToAdd = new DefaultPartition(partition.getPartitionedInstance()); + newPartitions.add(partitionToAdd); + partSet.add(partitionCounter); + } + + // For every partition, accept all data from all the input ports by defining a mask that accepts the data for + // every partitionId for every allocated partition and associate all partitions with every port. + List> inputPortList = context.getInputPorts(); + if (inputPortList != null) { + for (InputPort port : inputPortList) { + for (int i = 0; i < newPartitions.size(); i++) { + newPartitions.get(i).getPartitionKeys().put(port, new PartitionKeys(i, partSet)); + } + } + } + + logger.debug("new partition size {}", newPartitions.size()); + return newPartitions; + } + + @Override + public void partitioned(Map> partitions) + { + //Do nothing --- End diff -- nit: space after `//` --- If your project is set up for it, you can reply to this email and have your reply appear on GitHub as well. 
If your project does not have this feature enabled and would like it, or if the feature is enabled but not working, please contact infrastructure at infrastructure@apache.org or file a JIRA ticket with INFRA. ---