Package org.apache.accumulo.tserver

Source Code of org.apache.accumulo.tserver.InMemoryMap$LocalityGroupMap

/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.accumulo.tserver;

import java.io.IOException;
import java.io.Serializable;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Set;
import java.util.SortedMap;
import java.util.UUID;
import java.util.concurrent.ConcurrentSkipListMap;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicLong;

import org.apache.accumulo.core.conf.AccumuloConfiguration;
import org.apache.accumulo.core.conf.Property;
import org.apache.accumulo.core.data.ByteSequence;
import org.apache.accumulo.core.data.ColumnUpdate;
import org.apache.accumulo.core.data.Key;
import org.apache.accumulo.core.data.Mutation;
import org.apache.accumulo.core.data.Range;
import org.apache.accumulo.core.data.Value;
import org.apache.accumulo.core.file.FileSKVIterator;
import org.apache.accumulo.core.file.FileSKVWriter;
import org.apache.accumulo.core.file.rfile.RFile;
import org.apache.accumulo.core.file.rfile.RFileOperations;
import org.apache.accumulo.core.iterators.IteratorEnvironment;
import org.apache.accumulo.core.iterators.SkippingIterator;
import org.apache.accumulo.core.iterators.SortedKeyValueIterator;
import org.apache.accumulo.core.iterators.SortedMapIterator;
import org.apache.accumulo.core.iterators.WrappingIterator;
import org.apache.accumulo.core.iterators.system.InterruptibleIterator;
import org.apache.accumulo.core.iterators.system.LocalityGroupIterator;
import org.apache.accumulo.core.iterators.system.LocalityGroupIterator.LocalityGroup;
import org.apache.accumulo.core.iterators.system.SourceSwitchingIterator;
import org.apache.accumulo.core.iterators.system.SourceSwitchingIterator.DataSource;
import org.apache.accumulo.core.util.CachedConfiguration;
import org.apache.accumulo.core.util.LocalityGroupUtil;
import org.apache.accumulo.core.util.LocalityGroupUtil.LocalityGroupConfigurationError;
import org.apache.accumulo.core.util.LocalityGroupUtil.Partitioner;
import org.apache.accumulo.core.util.UtilWaitThread;
import org.apache.accumulo.server.conf.ServerConfiguration;
import org.apache.accumulo.server.trace.TraceFileSystem;
import org.apache.commons.lang.mutable.MutableLong;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.log4j.Logger;

class MemKeyComparator implements Comparator<Key>, Serializable {
 
  private static final long serialVersionUID = 1L;

  @Override
  public int compare(Key k1, Key k2) {
    int cmp = k1.compareTo(k2);
   
    if (cmp == 0) {
      if (k1 instanceof MemKey)
        if (k2 instanceof MemKey)
          cmp = ((MemKey) k2).kvCount - ((MemKey) k1).kvCount;
        else
          cmp = 1;
      else if (k2 instanceof MemKey)
        cmp = -1;
    }
   
    return cmp;
  }
}

class PartialMutationSkippingIterator extends SkippingIterator implements InterruptibleIterator {
 
  int kvCount;
 
  public PartialMutationSkippingIterator(SortedKeyValueIterator<Key,Value> source, int maxKVCount) {
    setSource(source);
    this.kvCount = maxKVCount;
  }
 
  @Override
  protected void consume() throws IOException {
    while (getSource().hasTop() && ((MemKey) getSource().getTopKey()).kvCount > kvCount)
      getSource().next();
  }
 
  @Override
  public SortedKeyValueIterator<Key,Value> deepCopy(IteratorEnvironment env) {
    return new PartialMutationSkippingIterator(getSource().deepCopy(env), kvCount);
  }
 
  @Override
  public void setInterruptFlag(AtomicBoolean flag) {
    ((InterruptibleIterator) getSource()).setInterruptFlag(flag);
  }
 
}

class MemKeyConversionIterator extends WrappingIterator implements InterruptibleIterator {
  MemKey currKey = null;
  Value currVal = null;

  public MemKeyConversionIterator(SortedKeyValueIterator<Key,Value> source) {
    super();
    setSource(source);
  }

  @Override
  public SortedKeyValueIterator<Key,Value> deepCopy(IteratorEnvironment env) {
    return new MemKeyConversionIterator(getSource().deepCopy(env));
  }
 
  @Override
  public Key getTopKey() {
    return currKey;
  }
 
  @Override
  public Value getTopValue() {
    return currVal;
  }
 
  private void getTopKeyVal() {
    Key k = super.getTopKey();
    Value v = super.getTopValue();
    if (k instanceof MemKey || k == null) {
      currKey = (MemKey) k;
      currVal = v;
      return;
    }
    currVal = new Value(v);
    int mc = MemValue.splitKVCount(currVal);
    currKey = new MemKey(k, mc);

  }
 
  public void next() throws IOException {
    super.next();
    if (hasTop())
      getTopKeyVal();
  }

  public void seek(Range range, Collection<ByteSequence> columnFamilies, boolean inclusive) throws IOException {
    super.seek(range, columnFamilies, inclusive);
   
    if (hasTop())
      getTopKeyVal();

    Key k = range.getStartKey();
    if (k instanceof MemKey && hasTop()) {
      while (hasTop() && currKey.compareTo(k) < 0)
        next();
    }
  }

  @Override
  public void setInterruptFlag(AtomicBoolean flag) {
    ((InterruptibleIterator) getSource()).setInterruptFlag(flag);
  }

}

public class InMemoryMap {
  private SimpleMap map = null;
 
  private static final Logger log = Logger.getLogger(InMemoryMap.class);
 
  private volatile String memDumpFile = null;
  private final String memDumpDir;

  private Map<String,Set<ByteSequence>> lggroups;
 
  public InMemoryMap(boolean useNativeMap, String memDumpDir) {
    this(new HashMap<String,Set<ByteSequence>>(), useNativeMap, memDumpDir);
  }

  public InMemoryMap(Map<String,Set<ByteSequence>> lggroups, boolean useNativeMap, String memDumpDir) {
    this.memDumpDir = memDumpDir;
    this.lggroups = lggroups;
   
    if (lggroups.size() == 0)
      map = newMap(useNativeMap);
    else
      map = new LocalityGroupMap(lggroups, useNativeMap);
  }
 
  public InMemoryMap(AccumuloConfiguration config) throws LocalityGroupConfigurationError {
    this(LocalityGroupUtil.getLocalityGroups(config), config.getBoolean(Property.TSERV_NATIVEMAP_ENABLED), config.get(Property.TSERV_MEMDUMP_DIR));
  }
 
  private static SimpleMap newMap(boolean useNativeMap) {
    if (useNativeMap && NativeMap.isLoaded()) {
      try {
        return new NativeMapWrapper();
      } catch (Throwable t) {
        log.error("Failed to create native map", t);
      }
    }
   
    return new DefaultMap();
  }
 
  private interface SimpleMap {
    Value get(Key key);
   
    Iterator<Entry<Key,Value>> iterator(Key startKey);
   
    int size();
   
    InterruptibleIterator skvIterator();
   
    void delete();
   
    long getMemoryUsed();
   
    void mutate(List<Mutation> mutations, int kvCount);
  }
 
  private static class LocalityGroupMap implements SimpleMap {
   
    private Map<ByteSequence,MutableLong> groupFams[];
   
    // the last map in the array is the default locality group
    private SimpleMap maps[];
    private Partitioner partitioner;
    private List<Mutation>[] partitioned;
    private Set<ByteSequence> nonDefaultColumnFamilies;
   
    @SuppressWarnings("unchecked")
    LocalityGroupMap(Map<String,Set<ByteSequence>> groups, boolean useNativeMap) {
      this.groupFams = new Map[groups.size()];
      this.maps = new SimpleMap[groups.size() + 1];
      this.partitioned = new List[groups.size() + 1];
      this.nonDefaultColumnFamilies = new HashSet<ByteSequence>();
     
      for (int i = 0; i < maps.length; i++) {
        maps[i] = newMap(useNativeMap);
      }

      int count = 0;
      for (Set<ByteSequence> cfset : groups.values()) {
        HashMap<ByteSequence,MutableLong> map = new HashMap<ByteSequence,MutableLong>();
        for (ByteSequence bs : cfset)
          map.put(bs, new MutableLong(1));
        this.groupFams[count++] = map;
        nonDefaultColumnFamilies.addAll(cfset);
      }
     
      partitioner = new LocalityGroupUtil.Partitioner(this.groupFams);
     
      for (int i = 0; i < partitioned.length; i++) {
        partitioned[i] = new ArrayList<Mutation>();
      }
    }

    @Override
    public Value get(Key key) {
      throw new UnsupportedOperationException();
    }
   
    @Override
    public Iterator<Entry<Key,Value>> iterator(Key startKey) {
      throw new UnsupportedOperationException();
    }
   
    @Override
    public int size() {
      int sum = 0;
      for (SimpleMap map : maps)
        sum += map.size();
      return sum;
    }
   
    @Override
    public InterruptibleIterator skvIterator() {
      LocalityGroup groups[] = new LocalityGroup[maps.length];
      for (int i = 0; i < groups.length; i++) {
        if (i < groupFams.length)
          groups[i] = new LocalityGroup(maps[i].skvIterator(), groupFams[i], false);
        else
          groups[i] = new LocalityGroup(maps[i].skvIterator(), null, true);
      }


      return new LocalityGroupIterator(groups, nonDefaultColumnFamilies);
    }
   
    @Override
    public void delete() {
      for (SimpleMap map : maps)
        map.delete();
    }
   
    @Override
    public long getMemoryUsed() {
      long sum = 0;
      for (SimpleMap map : maps)
        sum += map.getMemoryUsed();
      return sum;
    }
   
    @Override
    public synchronized void mutate(List<Mutation> mutations, int kvCount) {
      // this method is synchronized because it reuses objects to avoid allocation,
      // currently, the method that calls this is synchronized so there is no
      // loss in parallelism.... synchronization was added here for future proofing
     
      try{
        partitioner.partition(mutations, partitioned);
       
        for (int i = 0; i < partitioned.length; i++) {
          if (partitioned[i].size() > 0) {
            maps[i].mutate(partitioned[i], kvCount);
            for (Mutation m : partitioned[i])
              kvCount += m.getUpdates().size();
          }
        }
      } finally {
        // clear immediately so mutations can be garbage collected
        for (List<Mutation> list : partitioned) {
          list.clear();
        }
      }
    }
   
  }

  private static class DefaultMap implements SimpleMap {
    private ConcurrentSkipListMap<Key,Value> map = new ConcurrentSkipListMap<Key,Value>(new MemKeyComparator());
    private AtomicLong bytesInMemory = new AtomicLong();
    private AtomicInteger size = new AtomicInteger();
   
    public void put(Key key, Value value) {
      // Always a MemKey, so account for the kvCount int
      bytesInMemory.addAndGet(key.getLength() + 4);
      bytesInMemory.addAndGet(value.getSize());
      if (map.put(key, value) == null)
        size.incrementAndGet();
    }
   
    public Value get(Key key) {
      return map.get(key);
    }
   
    public Iterator<Entry<Key,Value>> iterator(Key startKey) {
      Key lk = new Key(startKey);
      SortedMap<Key,Value> tm = map.tailMap(lk);
      return tm.entrySet().iterator();
    }
   
    public int size() {
      return size.get();
    }
   
    public synchronized InterruptibleIterator skvIterator() {
      if (map == null)
        throw new IllegalStateException();
     
      return new SortedMapIterator(map);
    }
   
    public synchronized void delete() {
      map = null;
    }
   
    public long getOverheadPerEntry() {
      // all of the java objects that are used to hold the
      // data and make it searchable have overhead... this
      // overhead is estimated using test.EstimateInMemMapOverhead
      // and is in bytes.. the estimates were obtained by running
      // java 6_16 in 64 bit server mode
     
      return 200;
    }
   
    @Override
    public void mutate(List<Mutation> mutations, int kvCount) {
      for (Mutation m : mutations) {
        for (ColumnUpdate cvp : m.getUpdates()) {
          Key newKey = new MemKey(m.getRow(), cvp.getColumnFamily(), cvp.getColumnQualifier(), cvp.getColumnVisibility(), cvp.getTimestamp(), cvp.isDeleted(),
              false, kvCount++);
          Value value = new Value(cvp.getValue());
          put(newKey, value);
        }
      }
    }
   
    @Override
    public long getMemoryUsed() {
      return bytesInMemory.get() + (size() * getOverheadPerEntry());
    }
  }
 
  private static class NativeMapWrapper implements SimpleMap {
    private NativeMap nativeMap;
   
    NativeMapWrapper() {
      nativeMap = new NativeMap();
    }
   
    public Value get(Key key) {
      return nativeMap.get(key);
    }
   
    public Iterator<Entry<Key,Value>> iterator(Key startKey) {
      return nativeMap.iterator(startKey);
    }
   
    public int size() {
      return nativeMap.size();
    }
   
    public InterruptibleIterator skvIterator() {
      return (InterruptibleIterator) nativeMap.skvIterator();
    }
   
    public void delete() {
      nativeMap.delete();
    }
   
    public long getMemoryUsed() {
      return nativeMap.getMemoryUsed();
    }
   
    @Override
    public void mutate(List<Mutation> mutations, int kvCount) {
      nativeMap.mutate(mutations, kvCount);
    }
  }
 
  private AtomicInteger nextKVCount = new AtomicInteger(1);
  private AtomicInteger kvCount = new AtomicInteger(0);

  private Object writeSerializer = new Object();
 
  /**
   * Applies changes to a row in the InMemoryMap
   *
   */
  public void mutate(List<Mutation> mutations) {
    int numKVs = 0;
    for (int i = 0; i < mutations.size(); i++)
      numKVs += mutations.get(i).size();
   
    // Can not update mutationCount while writes that started before
    // are in progress, this would cause partial mutations to be seen.
    // Also, can not continue until mutation count is updated, because
    // a read may not see a successful write. Therefore writes must
    // wait for writes that started before to finish.
    //
    // using separate lock from this map, to allow read/write in parallel
    synchronized (writeSerializer ) {
      int kv = nextKVCount.getAndAdd(numKVs);
      try {
        map.mutate(mutations, kv);
      } finally {
        kvCount.set(kv + numKVs - 1);
      }
    }
  }
 
  /**
   * Returns a long representing the size of the InMemoryMap
   *
   * @return bytesInMemory
   */
  public synchronized long estimatedSizeInBytes() {
    if (map == null)
      return 0;
   
    return map.getMemoryUsed();
  }
 
  Iterator<Map.Entry<Key,Value>> iterator(Key startKey) {
    return map.iterator(startKey);
  }
 
  public long getNumEntries() {
    return map.size();
  }
 
  private final Set<MemoryIterator> activeIters = Collections.synchronizedSet(new HashSet<MemoryIterator>());
 
  class MemoryDataSource implements DataSource {
   
    boolean switched = false;
    private InterruptibleIterator iter;
    private List<FileSKVIterator> readers;
   
    MemoryDataSource() {
      this(new ArrayList<FileSKVIterator>());
    }
   
    public MemoryDataSource(List<FileSKVIterator> readers) {
      this.readers = readers;
    }
   
    @Override
    public boolean isCurrent() {
      if (switched)
        return true;
      else
        return memDumpFile == null;
    }
   
    @Override
    public DataSource getNewDataSource() {
      if (switched)
        throw new IllegalStateException();
     
      if (!isCurrent()) {
        switched = true;
        iter = null;
      }
     
      return this;
    }
   
    @Override
    public SortedKeyValueIterator<Key,Value> iterator() throws IOException {
      if (iter == null)
        if (!switched)
          iter = map.skvIterator();
        else {
         
          Configuration conf = CachedConfiguration.getInstance();
          FileSystem fs = TraceFileSystem.wrap(FileSystem.getLocal(conf));
         
          FileSKVIterator reader = new RFileOperations().openReader(memDumpFile, true, fs, conf, ServerConfiguration.getSiteConfiguration());

          readers.add(reader);
         
          iter = new MemKeyConversionIterator(reader);
        }
     
      return iter;
    }
   
    @Override
    public DataSource getDeepCopyDataSource(IteratorEnvironment env) {
      return new MemoryDataSource(readers);
    }
   
  }
 
  class MemoryIterator extends WrappingIterator implements InterruptibleIterator {
   
    private AtomicBoolean closed;
    private SourceSwitchingIterator ssi;
    private MemoryDataSource mds;
   
    protected SortedKeyValueIterator<Key,Value> getSource() {
      if (closed.get())
        throw new IllegalStateException("Memory iterator is closed");
      return super.getSource();
    }
   
    private MemoryIterator(InterruptibleIterator source) {
      this(source, new AtomicBoolean(false));
    }
   
    private MemoryIterator(SortedKeyValueIterator<Key,Value> source, AtomicBoolean closed) {
      setSource(source);
      this.closed = closed;
    }
   
    public SortedKeyValueIterator<Key,Value> deepCopy(IteratorEnvironment env) {
      return new MemoryIterator(getSource().deepCopy(env), closed);
    }
   
    public void close() {
     
      synchronized (this) {
        if (closed.compareAndSet(false, true)) {
         
          for (FileSKVIterator reader : mds.readers)
            try {
              reader.close();
            } catch (IOException e) {
              log.warn(e, e);
            }
        }
      }
     
      // remove outside of sync to avoid deadlock
      activeIters.remove(this);
    }
   
    private synchronized boolean switchNow() throws IOException {
      if (closed.get())
        return false;
     
      ssi.switchNow();
      return true;
    }
   
    @Override
    public void setInterruptFlag(AtomicBoolean flag) {
      ((InterruptibleIterator) getSource()).setInterruptFlag(flag);
    }
   
    private void setSSI(SourceSwitchingIterator ssi) {
      this.ssi = ssi;
    }
   
    public void setMDS(MemoryDataSource mds) {
      this.mds = mds;
    }
   
  }
 
  public synchronized MemoryIterator skvIterator() {
    if (map == null)
      throw new NullPointerException();
   
    if (deleted)
      throw new IllegalStateException("Can not obtain iterator after map deleted");
   
    int mc = kvCount.get();
    MemoryDataSource mds = new MemoryDataSource();
    SourceSwitchingIterator ssi = new SourceSwitchingIterator(new MemoryDataSource());
    MemoryIterator mi = new MemoryIterator(new PartialMutationSkippingIterator(ssi, mc));
    mi.setSSI(ssi);
    mi.setMDS(mds);
    activeIters.add(mi);
    return mi;
  }
 
  public SortedKeyValueIterator<Key,Value> compactionIterator() {
   
    if (nextKVCount.get() - 1 != kvCount.get())
      throw new IllegalStateException("Memory map in unexpected state : nextKVCount = " + nextKVCount.get() + " kvCount = "
          + kvCount.get());
   
    return map.skvIterator();
  }
 
  private boolean deleted = false;
 
  public void delete(long waitTime) {
   
    synchronized (this) {
      if (deleted)
        throw new IllegalStateException("Double delete");
     
      deleted = true;
    }
   
    long t1 = System.currentTimeMillis();
   
    while (activeIters.size() > 0 && System.currentTimeMillis() - t1 < waitTime) {
      UtilWaitThread.sleep(50);
    }
   
    if (activeIters.size() > 0) {
      // dump memmap exactly as is to a tmp file on disk, and switch scans to that temp file
      try {
        Configuration conf = CachedConfiguration.getInstance();
        FileSystem fs = TraceFileSystem.wrap(FileSystem.getLocal(conf));
       
        String tmpFile = memDumpDir + "/memDump" + UUID.randomUUID() + "." + RFile.EXTENSION;
       
        Configuration newConf = new Configuration(conf);
        newConf.setInt("io.seqfile.compress.blocksize", 100000);
       
        FileSKVWriter out = new RFileOperations().openWriter(tmpFile, fs, newConf, ServerConfiguration.getSiteConfiguration());
       
        InterruptibleIterator iter = map.skvIterator();
      
        HashSet<ByteSequence> allfams= new HashSet<ByteSequence>();
       
        for(Entry<String, Set<ByteSequence>> entry : lggroups.entrySet()){
          allfams.addAll(entry.getValue());
          out.startNewLocalityGroup(entry.getKey(), entry.getValue());
          iter.seek(new Range(), entry.getValue(), true);
          dumpLocalityGroup(out, iter);
        }
       
        out.startDefaultLocalityGroup();
        iter.seek(new Range(), allfams, false);
      
        dumpLocalityGroup(out, iter);
       
        out.close();
       
        log.debug("Created mem dump file " + tmpFile);
       
        memDumpFile = tmpFile;
       
        synchronized (activeIters) {
          for (MemoryIterator mi : activeIters) {
            mi.switchNow();
          }
        }
       
        // rely on unix behavior that file will be deleted when last
        // reader closes it
        fs.delete(new Path(memDumpFile), true);
       
      } catch (IOException ioe) {
        log.error("Failed to create mem dump file ", ioe);
       
        while (activeIters.size() > 0) {
          UtilWaitThread.sleep(100);
        }
      }
     
    }
   
    SimpleMap tmpMap = map;
   
    synchronized (this) {
      map = null;
    }
   
    tmpMap.delete();
  }

  private void dumpLocalityGroup(FileSKVWriter out, InterruptibleIterator iter) throws IOException {
    while (iter.hasTop() && activeIters.size() > 0) {
      // RFile does not support MemKey, so we move the kv count into the value only for the RFile.
      // There is no need to change the MemKey to a normal key because the kvCount info gets lost when it is written
      Value newValue = new MemValue(iter.getTopValue(), ((MemKey) iter.getTopKey()).kvCount);
      out.append(iter.getTopKey(), newValue);
      iter.next();

    }
  }
}
TOP

Related Classes of org.apache.accumulo.tserver.InMemoryMap$LocalityGroupMap

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.