apex-dev mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From "ASF GitHub Bot (JIRA)" <j...@apache.org>
Subject [jira] [Commented] (APEXMALHAR-2011) POJO to Avro record converter
Date Wed, 16 Mar 2016 07:31:33 GMT

    [ https://issues.apache.org/jira/browse/APEXMALHAR-2011?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15196946#comment-15196946 ]

ASF GitHub Bot commented on APEXMALHAR-2011:
--------------------------------------------

Github user chinmaykolhatkar commented on a diff in the pull request:

    https://github.com/apache/incubator-apex-malhar/pull/211#discussion_r56291316
  
    --- Diff: contrib/src/main/java/com/datatorrent/contrib/avro/AvroToPojo.java ---
    @@ -0,0 +1,428 @@
    +/**
    + * Licensed to the Apache Software Foundation (ASF) under one
    + * or more contributor license agreements.  See the NOTICE file
    + * distributed with this work for additional information
    + * regarding copyright ownership.  The ASF licenses this file
    + * to you under the Apache License, Version 2.0 (the
    + * "License"); you may not use this file except in compliance
    + * with the License.  You may obtain a copy of the License at
    + *
    + *   http://www.apache.org/licenses/LICENSE-2.0
    + *
    + * Unless required by applicable law or agreed to in writing,
    + * software distributed under the License is distributed on an
    + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
    + * KIND, either express or implied.  See the License for the
    + * specific language governing permissions and limitations
    + * under the License.
    + */
    +
    +package com.datatorrent.contrib.avro;
    +
    +import java.io.ByteArrayOutputStream;
    +import java.io.IOException;
    +import java.io.ObjectOutputStream;
    +import java.util.ArrayList;
    +import java.util.List;
    +import java.util.StringTokenizer;
    +
    +import org.slf4j.Logger;
    +import org.slf4j.LoggerFactory;
    +
    +import org.apache.avro.AvroRuntimeException;
    +import org.apache.avro.Schema;
    +import org.apache.avro.Schema.Field;
    +import org.apache.avro.generic.GenericRecord;
    +import org.apache.commons.lang3.ClassUtils;
    +import org.apache.hadoop.classification.InterfaceStability;
    +
    +import com.google.common.collect.Lists;
    +
    +import com.datatorrent.api.AutoMetric;
    +import com.datatorrent.api.Context;
    +import com.datatorrent.api.Context.OperatorContext;
    +import com.datatorrent.api.Context.PortContext;
    +import com.datatorrent.api.DefaultInputPort;
    +import com.datatorrent.api.DefaultOutputPort;
    +import com.datatorrent.api.Operator;
    +import com.datatorrent.api.annotation.InputPortFieldAnnotation;
    +import com.datatorrent.api.annotation.OutputPortFieldAnnotation;
    +import com.datatorrent.lib.util.FieldInfo;
    +import com.datatorrent.lib.util.FieldInfo.SupportType;
    +import com.datatorrent.lib.util.PojoUtils;
    +
    +/**
    + * <p>
    + * AvroToPojo
    + * </p>
    + * A generic implementation for conversion from Avro to POJO. The POJO class
    + * name & field mapping should be provided by the user. If this mapping is not
    + * provided then reflection is used to determine this mapping. As of now only
    + * primitive types are supported.
    + *
    + * @displayName Avro To Pojo
    + * @category Converter
    + * @tags avro
    + * @since 3.3.0
    + */
    +
    +@InterfaceStability.Evolving
    +public class AvroToPojo implements Operator
    +{
    +
    +  private List<Field> columnNames;
    +
    +  private Class<?> cls;
    +
    +  private static final String FIELD_SEPARATOR = ":";
    +  private static final String RECORD_SEPARATOR = ",";
    +
    +  private String genericRecordToPOJOFieldsMapping = null;
    +
    +  public String getGenericRecordToPOJOFieldsMapping()
    +  {
    +    return genericRecordToPOJOFieldsMapping;
    +  }
    +
    +  public void setGenericRecordToPOJOFieldsMapping(String genericRecordToPOJOFieldsMapping)
    +  {
    +    this.genericRecordToPOJOFieldsMapping = genericRecordToPOJOFieldsMapping;
    +  }
    +
    +  private String schemaFile;
    +
    +  private Schema schema;
    +
    +  private List<FieldInfo> fieldInfos;
    +
    +  private transient List<ActiveFieldInfo> columnFieldSetters = null;
    +
    +  @AutoMetric
    +  int recordCnt = 0;
    +
    +  @AutoMetric
    +  int errorCnt = 0;
    +
    +  @AutoMetric
    +  int fieldErrorCnt = 0;
    +
    +  public void parseSchema() throws IOException
    +  {
    +    setSchema(new Schema.Parser().parse(getSchemaString()));
    +  }
    +
    +  public String getSchemaString()
    +  {
    +    return schemaFile;
    +  }
    +
    +  public void setSchemaString(String schemaFile)
    +  {
    +    this.schemaFile = schemaFile;
    +  }
    +
    +  public Schema getSchema()
    +  {
    +    return schema;
    +  }
    +
    +  public void setSchema(Schema schema)
    +  {
    +    this.schema = schema;
    +  }
    +
    +  public byte[] serialize(Object obj) throws IOException
    --- End diff --
    
    Does this need to be public? Is this used from outside of this class?


> POJO to Avro record converter
> -----------------------------
>
>                 Key: APEXMALHAR-2011
>                 URL: https://issues.apache.org/jira/browse/APEXMALHAR-2011
>             Project: Apache Apex Malhar
>          Issue Type: New Feature
>            Reporter: devendra tagare
>
> We are looking to develop a record converter which would take a POJO as an input and emit a Generic record as the output based on the given Avro schema.
> The expected inputs for this operator would be:
> 1. Class name of the incoming POJO
> 2. Avro schema for the Generic Record to emit.
> This operator would receive an Object on its input port and emit a Generic record on the output port.
> To start with, we would handle primitive types and then go on to handle complex types.
> Thanks,
> Dev



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

Mime
View raw message