/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.runtime.jobgraph;
import java.io.IOException;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.net.InetSocketAddress;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.LinkedHashMap;
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Map;
import org.apache.flink.api.common.InvalidProgramException;
import org.apache.flink.configuration.Configuration;
import org.apache.flink.core.fs.FSDataInputStream;
import org.apache.flink.core.fs.FileSystem;
import org.apache.flink.core.fs.Path;
import org.apache.flink.core.io.IOReadableWritable;
import org.apache.flink.core.memory.DataInputView;
import org.apache.flink.core.memory.DataInputViewStream;
import org.apache.flink.core.memory.DataOutputView;
import org.apache.flink.core.memory.DataOutputViewStream;
import org.apache.flink.runtime.blob.BlobClient;
import org.apache.flink.runtime.blob.BlobKey;
import org.apache.flink.types.StringValue;
/**
* A job graph represents an entire Flink runtime job.
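*
* <p>A minimal construction sketch (the vertex names, retry count, and jar path below are
* illustrative only; the vertices would still need their invokable classes and input
* connections configured before submission):
*
* <pre>{@code
* AbstractJobVertex source = new AbstractJobVertex("source");
* AbstractJobVertex sink = new AbstractJobVertex("sink");
*
* JobGraph jobGraph = new JobGraph("my job", source, sink);
* jobGraph.setNumberOfExecutionRetries(3);
* jobGraph.addJar(new Path("file:///path/to/user-code.jar"));
* }</pre>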
*/
public class JobGraph implements IOReadableWritable {
// --------------------------------------------------------------------------------------------
// Members that define the structure / topology of the graph
// --------------------------------------------------------------------------------------------
/** List of task vertices included in this job graph. */
private final Map<JobVertexID, AbstractJobVertex> taskVertices = new LinkedHashMap<JobVertexID, AbstractJobVertex>();
/** The job configuration attached to this job. */
private final Configuration jobConfiguration = new Configuration();
/** Set of JAR files required to run this job. */
private final transient List<Path> userJars = new ArrayList<Path>();
/** Set of blob keys identifying the JAR files required to run this job. */
private final List<BlobKey> userJarBlobKeys = new ArrayList<BlobKey>();
/** ID of this job. */
private final JobID jobID;
/** Name of this job. */
private String jobName;
/** The number of times that failed tasks should be re-executed. */
private int numExecutionRetries;
/** Flag to enable queued scheduling. */
private boolean allowQueuedScheduling;
// --------------------------------------------------------------------------------------------
/**
* Constructs a new job graph with no name and a random job ID.
*/
public JobGraph() {
this((String) null);
}
/**
* Constructs a new job graph with the given name and a random job ID.
*
* @param jobName The name of the job
*/
public JobGraph(String jobName) {
this(null, jobName);
}
/**
* Constructs a new job graph with the given job ID and name.
*
* @param jobId The id of the job. A random ID is generated, if <code>null</code> is passed.
* @param jobName The name of the job. A default name is used, if <code>null</code> is passed.
*/
public JobGraph(JobID jobId, String jobName) {
this.jobID = jobId == null ? new JobID() : jobId;
this.jobName = jobName == null ? "(unnamed job)" : jobName;
}
/**
* Constructs a new job graph with no name and a random job ID.
*
* @param vertices The vertices to add to the graph.
*/
public JobGraph(AbstractJobVertex... vertices) {
this(null, vertices);
}
/**
* Constructs a new job graph with the given name and a random job ID.
*
* @param jobName The name of the job.
* @param vertices The vertices to add to the graph.
*/
public JobGraph(String jobName, AbstractJobVertex... vertices) {
this(null, jobName, vertices);
}
/**
* Constructs a new job graph with the given job ID, job name, and vertices.
*
* @param jobId The id of the job.
* @param jobName The name of the job.
* @param vertices The vertices to add to the graph.
*/
public JobGraph(JobID jobId, String jobName, AbstractJobVertex... vertices) {
this(jobId, jobName);
for (AbstractJobVertex vertex : vertices) {
addVertex(vertex);
}
}
// --------------------------------------------------------------------------------------------
/**
* Returns the ID of the job.
*
* @return the ID of the job
*/
public JobID getJobID() {
return this.jobID;
}
/**
* Returns the name assigned to the job graph.
*
* @return the name assigned to the job graph
*/
public String getName() {
return this.jobName;
}
/**
* Returns the configuration object attached to this job. The returned configuration is never
* <code>null</code>; it is empty until values are explicitly set.
*
* @return the configuration object attached to this job
*/
public Configuration getJobConfiguration() {
return this.jobConfiguration;
}
/**
* Sets the number of times that failed tasks are re-executed. A value of zero
* effectively disables fault tolerance. A value of {@code -1} indicates that the system
* default value (as defined in the configuration) should be used.
*
* @param numberOfExecutionRetries The number of times the system will try to re-execute failed tasks.
*/
public void setNumberOfExecutionRetries(int numberOfExecutionRetries) {
if (numberOfExecutionRetries < -1) {
throw new IllegalArgumentException("The number of execution retries must be non-negative, or -1 (use system default)");
}
this.numExecutionRetries = numberOfExecutionRetries;
}
/**
* Gets the number of times the system will try to re-execute failed tasks. A value
* of {@code -1} indicates that the system default value (as defined in the configuration)
* should be used.
*
* @return The number of times the system will try to re-execute failed tasks.
*/
public int getNumberOfExecutionRetries() {
return numExecutionRetries;
}
/** Sets whether the job may use queued scheduling, where tasks wait for resources to become available instead of failing immediately. */
public void setAllowQueuedScheduling(boolean allowQueuedScheduling) {
this.allowQueuedScheduling = allowQueuedScheduling;
}
/** Checks whether queued scheduling is enabled for this job. */
public boolean getAllowQueuedScheduling() {
return allowQueuedScheduling;
}
/**
* Adds a new task vertex to the job graph. Adding a vertex whose ID is already registered
* results in an {@link IllegalArgumentException}.
*
* @param vertex
* the new task vertex to be added
*/
public void addVertex(AbstractJobVertex vertex) {
final JobVertexID id = vertex.getID();
AbstractJobVertex previous = taskVertices.put(id, vertex);
// if we had a prior association, restore and throw an exception
if (previous != null) {
taskVertices.put(id, previous);
throw new IllegalArgumentException("The JobGraph already contains a vertex with that id.");
}
}
/**
* Returns an Iterable to iterate all vertices registered with the job graph.
*
* @return an Iterable to iterate all vertices registered with the job graph
*/
public Iterable<AbstractJobVertex> getVertices() {
return this.taskVertices.values();
}
/**
* Returns an array of all job vertices that are registered with the job graph. The order in which the vertices
* appear in the array is not defined.
*
* @return an array of all job vertices that are registered with the job graph
*/
public AbstractJobVertex[] getVerticesAsArray() {
return this.taskVertices.values().toArray(new AbstractJobVertex[this.taskVertices.size()]);
}
/**
* Returns the number of all vertices.
*
* @return The number of all vertices.
*/
public int getNumberOfVertices() {
return this.taskVertices.size();
}
/**
* Searches for a vertex with a matching ID and returns it.
*
* @param id
* the ID of the vertex to search for
* @return the vertex with the matching ID or <code>null</code> if no vertex with such ID could be found
*/
public AbstractJobVertex findVertexByID(JobVertexID id) {
return this.taskVertices.get(id);
}
// --------------------------------------------------------------------------------------------
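/**
* Returns all vertices of this job graph in topological order, starting from the vertices
* that have no connected inputs (the sources).
*
* @return A list of all vertices, topologically sorted from sources to sinks.
* @throws InvalidProgramException Thrown, if the job graph contains a cyclic dependency.
*/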
public List<AbstractJobVertex> getVerticesSortedTopologicallyFromSources() throws InvalidProgramException {
// early out on empty lists
if (this.taskVertices.isEmpty()) {
return Collections.emptyList();
}
ArrayList<AbstractJobVertex> sorted = new ArrayList<AbstractJobVertex>(this.taskVertices.size());
LinkedHashSet<AbstractJobVertex> remaining = new LinkedHashSet<AbstractJobVertex>(this.taskVertices.values());
// start by finding the vertices with no input edges
// and the ones with disconnected inputs (that refer to some standalone data set)
{
Iterator<AbstractJobVertex> iter = remaining.iterator();
while (iter.hasNext()) {
AbstractJobVertex vertex = iter.next();
if (vertex.hasNoConnectedInputs()) {
sorted.add(vertex);
iter.remove();
}
}
}
int startNodePos = 0;
// traverse from the nodes that were added until we have found all elements
while (!remaining.isEmpty()) {
// first check if we have more candidates to start traversing from. if not, then the
// graph is cyclic, which is not permitted
if (startNodePos >= sorted.size()) {
throw new InvalidProgramException("The job graph is cyclic.");
}
AbstractJobVertex current = sorted.get(startNodePos++);
addNodesThatHaveNoNewPredecessors(current, sorted, remaining);
}
return sorted;
}
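/**
* Recursively adds every consumer of the start vertex's produced data sets to the sorted list,
* provided all of the consumer's remaining predecessors have already been added.
*/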
private void addNodesThatHaveNoNewPredecessors(AbstractJobVertex start, ArrayList<AbstractJobVertex> target, LinkedHashSet<AbstractJobVertex> remaining) {
// forward traverse over all produced data sets and all their consumers
for (IntermediateDataSet dataSet : start.getProducedDataSets()) {
for (JobEdge edge : dataSet.getConsumers()) {
// a vertex can be added, if it has no predecessors that are still in the 'remaining' set
AbstractJobVertex v = edge.getTarget();
if (!remaining.contains(v)) {
continue;
}
boolean hasNewPredecessors = false;
for (JobEdge e : v.getInputs()) {
// skip the edge through which we came
if (e == edge) {
continue;
}
IntermediateDataSet source = e.getSource();
if (remaining.contains(source.getProducer())) {
hasNewPredecessors = true;
break;
}
}
if (!hasNewPredecessors) {
target.add(v);
remaining.remove(v);
addNodesThatHaveNoNewPredecessors(v, target, remaining);
}
}
}
}
// --------------------------------------------------------------------------------------------
// Serialization / Deserialization
// --------------------------------------------------------------------------------------------
@Override
public void read(DataInputView in) throws IOException {
// read the simple fields
this.jobID.read(in);
this.jobName = StringValue.readString(in);
this.jobConfiguration.read(in);
this.numExecutionRetries = in.readInt();
this.allowQueuedScheduling = in.readBoolean();
final int numVertices = in.readInt();
@SuppressWarnings("resource")
ObjectInputStream ois = new ObjectInputStream(new DataInputViewStream(in));
for (int i = 0; i < numVertices; i++) {
try {
AbstractJobVertex vertex = (AbstractJobVertex) ois.readObject();
taskVertices.put(vertex.getID(), vertex);
}
catch (ClassNotFoundException e) {
throw new IOException(e);
}
}
ois.close();
// Read required jar files
readJarBlobKeys(in);
}
@Override
public void write(DataOutputView out) throws IOException {
// write the simple fields
this.jobID.write(out);
StringValue.writeString(this.jobName, out);
this.jobConfiguration.write(out);
out.writeInt(numExecutionRetries);
out.writeBoolean(allowQueuedScheduling);
// write the task vertices using java serialization (to resolve references in the object graph)
out.writeInt(taskVertices.size());
ObjectOutputStream oos = new ObjectOutputStream(new DataOutputViewStream(out));
for (AbstractJobVertex vertex : this.taskVertices.values()) {
oos.writeObject(vertex);
}
oos.close();
// Write out all required jar files
writeJarBlobKeys(out);
}
/**
* Writes the BLOB keys of the jar files required to run this job to the given {@link org.apache.flink.core.memory.DataOutputView}.
*
* @param out
* the data output to write the BLOB keys to
* @throws IOException
* thrown if an error occurs while writing to the data output
*/
private void writeJarBlobKeys(final DataOutputView out) throws IOException {
out.writeInt(this.userJarBlobKeys.size());
for (final Iterator<BlobKey> it = this.userJarBlobKeys.iterator(); it.hasNext();) {
it.next().write(out);
}
}
/**
* Reads the BLOB keys for the JAR files required to run this job and registers them.
*
* @param in
* the data stream to read the BLOB keys from
* @throws IOException
* thrown if an error occurs while reading the stream
*/
private void readJarBlobKeys(final DataInputView in) throws IOException {
// read the number of BLOB keys, followed by the keys themselves
final int numberOfBlobKeys = in.readInt();
for (int i = 0; i < numberOfBlobKeys; ++i) {
final BlobKey key = new BlobKey();
key.read(in);
this.userJarBlobKeys.add(key);
}
}
// --------------------------------------------------------------------------------------------
// Handling of attached JAR files
// --------------------------------------------------------------------------------------------
/**
* Adds the path of a JAR file required to run the job on a task manager.
*
* @param jar
* path of the JAR file required to run the job on a task manager
*/
public void addJar(Path jar) {
if (jar == null) {
throw new IllegalArgumentException();
}
if (!userJars.contains(jar)) {
userJars.add(jar);
}
}
/**
* Returns the list of BLOB keys referring to the JAR files required to run this job.
*
* @return list of BLOB keys referring to the JAR files required to run this job
*/
public List<BlobKey> getUserJarBlobKeys() {
return this.userJarBlobKeys;
}
/**
* Uploads the previously added user JAR files to the job manager through the job manager's BLOB server.
*
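* <p>A minimal usage sketch (the jar path, host name, and port are illustrative only):
*
* <pre>{@code
* jobGraph.addJar(new Path("file:///path/to/user-code.jar"));
* jobGraph.uploadRequiredJarFiles(new InetSocketAddress("jobmanager-host", 6124));
* }</pre>
*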
* @param serverAddress
* the network address of the BLOB server
* @throws IOException
* thrown if an I/O error occurs during the upload
*/
public void uploadRequiredJarFiles(final InetSocketAddress serverAddress) throws IOException {
if (this.userJars.isEmpty()) {
return;
}
BlobClient bc = null;
try {
bc = new BlobClient(serverAddress);
for (final Iterator<Path> it = this.userJars.iterator(); it.hasNext();) {
final Path jar = it.next();
final FileSystem fs = jar.getFileSystem();
FSDataInputStream is = null;
try {
is = fs.open(jar);
final BlobKey key = bc.put(is);
this.userJarBlobKeys.add(key);
} finally {
if (is != null) {
is.close();
}
}
}
} finally {
if (bc != null) {
bc.close();
}
}
}
}