Examples of com.datasalt.pangool.io.Tuple$IDontKnowHowToCopyThisStuff

com.datasalt.pangool.io.Tuple
Thrown by {@link #deepCopy(ITuple,java.util.Map)} when a field has a type that Pangool doesn't know how to copy. In this case, the solution is to provide a proper {@link FieldClonator} for that particular field.

  
  private static CachedTuples createCachedTuples(TupleMRConfig config){
    SerializationInfo serInfo = config.getSerializationInfo();
    boolean multipleSources = config.getNumIntermediateSchemas() >= 2;
    CachedTuples r = new CachedTuples();
    r.commonTuple = new Tuple(serInfo.getCommonSchema()); 
    for (Schema sourceSchema : config.getIntermediateSchemas()){
      r.resultTuples.add(new Tuple(sourceSchema));
    }
    
    if (multipleSources){
      for(Schema specificSchema : serInfo.getSpecificSchemas()){
        r.specificTuples.add(new Tuple(specificSchema));
      }
    } 
    return r;
  }

View Full Code Here

   * Moves data between a Record and a Tuple
   */
  public ITuple toTuple(Record record, ITuple reuse) throws IOException {
    ITuple tuple = reuse;
    if (tuple == null){
      tuple = new Tuple(pangoolSchema);
    }
    
    Schema pangoolSchema = tuple.getSchema();
    for(org.apache.avro.Schema.Field avroField : avroSchema.getFields()) {
      int pos = avroField.pos();

View Full Code Here

      int newSize = 0;
      if(line == null) {
        this.line = new Text();
      }
      if(tuple == null) {
        this.tuple = new Tuple(schema);
      }
      while(position < end) {
        newSize = in.readLine(line, maxLineLength,
            Math.max((int) Math.min(Integer.MAX_VALUE, end - position), maxLineLength));

View Full Code Here

  }


  @Override
  public ITuple deserialize(ITuple tuple) throws IOException {
    if(tuple == null) {
      tuple = new Tuple(schemaToDeserialize);
    }
    readFields(tuple, deserializers);
    return tuple;
  }

View Full Code Here

    // Use a HashSet to calculate the total vocabulary size
    Set<String> vocabulary = new HashSet<String>();
    // Read tuples from generate job
    // One reader is opened per file matched by the generatedModel glob.
    for(FileStatus fileStatus : fileSystem.globStatus(generatedModel)) {
      // NOTE(review): the reader is never closed within the lines visible here —
      // confirm it is released elsewhere or close it once the file is consumed.
      TupleFile.Reader reader = new TupleFile.Reader(fileSystem, conf, fileStatus.getPath());
      // A single Tuple instance is passed to every reader.next() call for this file.
      Tuple tuple = new Tuple(reader.getSchema());
      while(reader.next(tuple)) {
        // Read Tuple
        Integer count = (Integer) tuple.get("count");
        Category category = (Category) tuple.get("category");
        String word = tuple.get("word").toString();
        vocabulary.add(word);
        // Add this record's count to the running total for its category (0 when absent).
        tokensPerCategory.put(category, MapUtils.getInteger(tokensPerCategory, category, 0) + count);
        // Presumably wordCountPerCategory already holds an inner map for every
        // category; a missing entry would make get(category) return null — TODO confirm.
        wordCountPerCategory.get(category).put(word, count);
      }
    }

View Full Code Here

  private static class TweetsMapper extends TupleMapper<AvroWrapper<Record>,NullWritable> {


    private Tuple tuple;
    public void setup(TupleMRContext context, Collector collector) 
        throws IOException, InterruptedException {
      tuple = new Tuple(context.getTupleMRConfig().getIntermediateSchema("tweet"));
    };

View Full Code Here

  @SuppressWarnings("serial")
  private static class RetweetsMapper extends TupleMapper<LongWritable,Text> {
    private Tuple tuple;
    public void setup(TupleMRContext context, Collector collector) 
        throws IOException, InterruptedException {
      tuple = new Tuple(context.getTupleMRConfig().getIntermediateSchema("retweet"));
    };

View Full Code Here

    protected ObjectMapper mapper;


    public void setup(TupleMRContext context, Collector collector) 
        throws IOException, InterruptedException {
      this.mapper = new ObjectMapper();
      tuple = new Tuple(context.getTupleMRConfig().getIntermediateSchema(0));
      record = new Record(getAvroSchema());
      tuple.set("my_avro",record);
    };

View Full Code Here


    private Tuple tuple;


    public void setup(TupleMRContext context, Collector collector) throws IOException,
        InterruptedException {
      tuple = new Tuple(context.getTupleMRConfig().getIntermediateSchema("tweet"));
    };

View Full Code Here

  private static class RetweetsMapper extends TupleMapper<LongWritable, Text> {
    private Tuple tuple;


    public void setup(TupleMRContext context, Collector collector) throws IOException,
        InterruptedException {
      tuple = new Tuple(context.getTupleMRConfig().getIntermediateSchema("retweet"));
    };

View Full Code Here

0 1 2 3 4 5 6 7 8 9

TOP

Related Classes of com.datasalt.pangool.io.Tuple$IDontKnowHowToCopyThisStuff

com.datasalt.pangool.examples.avro.AvroCustomSerializationJob$TokenizeMapper

com.datasalt.pangool.examples.avro.AvroTopicalWordCount$TokenizeMapper

com.datasalt.pangool.examples.avro.AvroTweetsJoin$RetweetsMapper

com.datasalt.pangool.examples.avro.AvroTweetsJoin$TweetsMapper

com.datasalt.pangool.examples.avro.TestAvroTopicalWordCount

com.datasalt.pangool.examples.gameoflife.GameOfLifeJob

com.datasalt.pangool.examples.movingaverage.MovingAverage$URLVisitsProcessor

com.datasalt.pangool.examples.naivebayes.NaiveBayesClassifier

com.datasalt.pangool.examples.naivebayes.NaiveBayesGenerate

com.datasalt.pangool.examples.secondarysort.SecondarySort$IProcessor

All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.