All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.hadoop.hive.llap.shufflehandler.DirWatcher Maven / Gradle / Ivy

There is a newer version: 4.0.1
Show newest version
/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 */

package org.apache.hadoop.hive.llap.shufflehandler;

import static java.nio.file.StandardWatchEventKinds.ENTRY_CREATE;
import static java.nio.file.StandardWatchEventKinds.OVERFLOW;

import java.io.IOException;
import java.nio.file.DirectoryStream;
import java.nio.file.FileSystems;
import java.nio.file.Files;
import java.nio.file.Path;
import java.nio.file.WatchEvent;
import java.nio.file.WatchKey;
import java.nio.file.WatchService;
import java.util.LinkedList;
import java.util.List;
import java.util.concurrent.Callable;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.DelayQueue;
import java.util.concurrent.Delayed;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicBoolean;

import com.google.common.util.concurrent.ListenableFuture;
import com.google.common.util.concurrent.ListeningExecutorService;
import com.google.common.util.concurrent.MoreExecutors;
import com.google.common.util.concurrent.ThreadFactoryBuilder;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.hadoop.hive.llap.shufflehandler.ShuffleHandler.AttemptPathIdentifier;

class DirWatcher {

  private static final Logger LOG = LoggerFactory.getLogger(DirWatcher.class);

  private static enum Type {
    BASE, // App Base Dir / ${dagDir}
    OUTPUT, // appBase/output/
    FINAL, // appBase/output/attemptDir
  }


  private static final String OUTPUT = "output";

  private final AttemptRegistrationListener listener;

  private final WatchService watchService;
  private final AtomicBoolean shutdown = new AtomicBoolean(false);
  private final WatcherCallable watcherCallable = new WatcherCallable();
  private final ListeningExecutorService watcherExecutorService;
  private volatile ListenableFuture watcherFuture;

  private final DelayQueue watchedPathQueue = new DelayQueue<>();
  private final WatchExpirerCallable expirerCallable = new WatchExpirerCallable();
  private final ListeningExecutorService expirerExecutorService;
  private volatile ListenableFuture expirerFuture;

  private final ConcurrentMap foundAttempts = new ConcurrentHashMap<>();
  private final ConcurrentMap watchedPaths = new ConcurrentHashMap<>();
  private final ConcurrentMap> watchesPerAttempt = new ConcurrentHashMap<>();

  DirWatcher(AttemptRegistrationListener listener) throws IOException {
    this.watchService = FileSystems.getDefault().newWatchService();
    this.listener = listener;
    ExecutorService executor1 = Executors.newFixedThreadPool(1,
        new ThreadFactoryBuilder().setDaemon(true).setNameFormat("DirWatcher").build());
    watcherExecutorService = MoreExecutors.listeningDecorator(executor1);

    ExecutorService executor2 = Executors.newFixedThreadPool(1,
        new ThreadFactoryBuilder().setDaemon(true).setNameFormat("WatchExpirer").build());
    expirerExecutorService = MoreExecutors.listeningDecorator(executor2);
  }

  /**
   * Register a base dir for an application
   * @param pathString the full path including jobId, user - /${local.dir}/appCache/${appId}/userCache/${user}
   * @param appId the appId
   * @param user the user
   * @param expiry when to expire the watch - in ms
   * @throws IOException
   */
  void registerDagDir(String pathString, String appId, int dagIdentifier, String user, long expiry) throws IOException {
    // The path string contains the dag Identifier
    Path path = FileSystems.getDefault().getPath(pathString);
    WatchedPathInfo watchedPathInfo =
        new WatchedPathInfo(System.currentTimeMillis() + expiry, Type.BASE, appId, dagIdentifier,
            user);
    watchedPaths.put(path, watchedPathInfo);
    WatchKey watchKey = path.register(watchService, ENTRY_CREATE);
    watchedPathInfo.setWatchKey(watchKey);
    watchedPathQueue.add(watchedPathInfo);

    // TODO Watches on the output dirs need to be cancelled at some point. For now - via the expiry.
  }

  void unregisterDagDir(String pathString, String appId, int dagIdentifier) {
    // TODO Implement to remove all watches for the specified pathString and it's sub-tree
  }

  /**
   * Invoke when a pathIdentifier has been found, or is no longer of interest
   * @param pathIdentifier
   */
  void attemptInfoFound(AttemptPathIdentifier pathIdentifier) {
    cancelWatchesForAttempt(pathIdentifier);
  }

  void start() {
    watcherFuture = watcherExecutorService.submit(watcherCallable);
    expirerFuture = expirerExecutorService.submit(expirerCallable);
  }

  void stop() throws IOException {
    shutdown.set(true);
    if (watcherFuture != null) {
      watcherFuture.cancel(true);
    }
    if (expirerFuture != null) {
      expirerFuture.cancel(true);
    }
    watchService.close();
    watcherExecutorService.shutdownNow();
    expirerExecutorService.shutdownNow();
  }



  private void registerDir(Path path, WatchedPathInfo watchedPathInfo) {
    watchedPaths.put(path, watchedPathInfo);
    try {
      WatchKey watchKey = path.register(watchService, ENTRY_CREATE);
      watchedPathInfo.setWatchKey(watchKey);
      watchedPathQueue.add(watchedPathInfo);
      if (watchedPathInfo.type == Type.FINAL) {
        trackWatchForAttempt(watchedPathInfo, watchKey);
      }
    } catch (IOException e) {
      LOG.warn("Unable to setup watch for: " + path);
    }
  }

  private void trackWatchForAttempt(WatchedPathInfo watchedPathInfo, WatchKey watchKey) {
    assert watchedPathInfo.pathIdentifier != null;
    // TODO May be possible to do finer-grained locks.
    synchronized (watchesPerAttempt) {
      List list = watchesPerAttempt.get(watchedPathInfo.pathIdentifier);
      if (list == null) {
        list = new LinkedList<>();
        watchesPerAttempt.put(watchedPathInfo.pathIdentifier, list);
      }
      list.add(watchKey);
    }
  }

  private void cancelWatchesForAttempt(AttemptPathIdentifier pathIdentifier) {
    // TODO May be possible to do finer-grained locks.
    synchronized(watchesPerAttempt) {
      List list = watchesPerAttempt.remove(pathIdentifier);
      if (list != null) {
        for (WatchKey watchKey : list) {
          watchKey.cancel();
        }
      }
    }
  }

  public void watch() {
    while (!shutdown.get()) {
      WatchKey watchKey;
      try {
        watchKey = watchService.take();
      } catch (InterruptedException e) {
        if (shutdown.get()) {
          LOG.info("Shutting down watcher");
          break;
        } else {
          LOG.error("Watcher interrupted before being shutdown");
          throw new RuntimeException("Watcher interrupted before being shutdown", e);
        }
      }
      Path watchedPath = (Path) watchKey.watchable();
      WatchedPathInfo parentWatchedPathInfo = watchedPaths.get(watchedPath);
      boolean cancelledWatch = false;
      for (WatchEvent rawEvent : watchKey.pollEvents()) {
        if (rawEvent.kind().equals(OVERFLOW)) {
          // Ignoring and continuing to watch for additional elements in the dir.
          continue;
        }

        WatchEvent event = (WatchEvent) rawEvent;
        WatchedPathInfo watchedPathInfo;
        Path resolvedPath;

        switch (parentWatchedPathInfo.type) {
          case BASE:
            // Add the output dir to the watch set, scan it, and cancel current watch.
            if (event.context().getFileName().toString().equals(OUTPUT)) {
              resolvedPath = watchedPath.resolve(event.context());
              watchedPathInfo = new WatchedPathInfo(parentWatchedPathInfo, Type.OUTPUT, null);
              registerDir(resolvedPath, watchedPathInfo);
              // Scan the "output" directory for existing files, and add watches
              try (DirectoryStream dirStream = Files.newDirectoryStream(resolvedPath)) {
                for (Path path : dirStream) {
                  // This would be an attempt directory. Add a watch, and track it.
                  if (path.toFile().isDirectory()) {
                    watchedPathInfo = new WatchedPathInfo(parentWatchedPathInfo, Type.FINAL, path.getFileName().toString());
                    registerDir(path, watchedPathInfo);
                    scanForFinalFiles(watchedPathInfo, path);
                  } else {
                    LOG.warn("Ignoring unexpected file: " + path);
                  }
                }
              } catch (IOException e) {
                LOG.warn("Unable to list files under: " + resolvedPath);
              }
              // Cancel the watchKey since the output dir has been found.
              cancelledWatch = true;
              watchKey.cancel();
            } else {
              LOG.warn("DEBUG: Found unexpected directory while looking for OUTPUT: " + event.context() + " under " + watchedPath);
            }
            break;
          case OUTPUT:
            // Add the attemptDir to the watch set, scan it and add to the list of found files
            resolvedPath = watchedPath.resolve(event.context());
            // New attempt path crated. Add a watch on it, and scan it for existing files.
            watchedPathInfo = new WatchedPathInfo(parentWatchedPathInfo, Type.FINAL, event.context().getFileName().toString());
            registerDir(resolvedPath, watchedPathInfo);
            scanForFinalFiles(watchedPathInfo, resolvedPath);

            break;
          case FINAL:
            resolvedPath = watchedPath.resolve(event.context());
            if (event.context().getFileName().toString().equals(ShuffleHandler.DATA_FILE_NAME)) {
              registerFoundAttempt(parentWatchedPathInfo.pathIdentifier, null, resolvedPath);
            } else if (event.context().getFileName().toString().equals(ShuffleHandler.INDEX_FILE_NAME)) {
              registerFoundAttempt(parentWatchedPathInfo.pathIdentifier, resolvedPath, null);
            } else {
              LOG.warn("Ignoring unexpected file: " + watchedPath.resolve(event.context()));
            }
            break;
        }

      }
      if (!cancelledWatch) {
        boolean valid = watchKey.reset();
        if (!valid) {
          LOG.warn("DEBUG: WatchKey: " + watchKey.watchable() + " no longer valid");
        }
      }
    }
  }

  private void scanForFinalFiles(WatchedPathInfo watchedPathInfo, Path path) {
    try (DirectoryStream dirStream = Files.newDirectoryStream(path) ) {
      for (Path p : dirStream) {
        if (p.getFileName().toString().equals(ShuffleHandler.DATA_FILE_NAME)) {
          registerFoundAttempt(watchedPathInfo.pathIdentifier, null, path);
        } else if (p.getFileName().toString().equals(ShuffleHandler.INDEX_FILE_NAME)) {
          registerFoundAttempt(watchedPathInfo.pathIdentifier, path, null);
        } else {
          LOG.warn("Ignoring unknown file: " + p.getFileName());
        }
      }
    } catch (IOException e) {
      LOG.warn("Unable to open dir stream for attemptDir: " + path);
    }
  }

  private void registerFoundAttempt(AttemptPathIdentifier pathIdentifier, Path indexFile, Path dataFile) {
    FoundPathInfo pathInfo = foundAttempts.get(pathIdentifier);
    if (pathInfo == null) {
      pathInfo = new FoundPathInfo(indexFile, dataFile);
      foundAttempts.put(pathIdentifier, pathInfo);
    }
    if (pathInfo.isComplete()) {
      // Inform the shuffle handler
      listener.registerAttemptDirs(pathIdentifier,
          new ShuffleHandler.AttemptPathInfo(new org.apache.hadoop.fs.Path(indexFile.toUri()),
              new org.apache.hadoop.fs.Path(dataFile.toUri())));
      // Cancel existing watches
      cancelWatchesForAttempt(pathIdentifier);
      // Cleanup structures
      foundAttempts.remove(pathIdentifier);
    }
  }

  private class WatcherCallable implements Callable {

    @Override
    public Void call() throws Exception {
      watch();
      return null;
    }
  }

  private class WatchExpirerCallable implements Callable {

    @Override
    public Void call() {
      while (!shutdown.get()) {
        // Relying on watchService.close to clean up all pending watches
        WatchedPathInfo pathInfo;
        try {
          pathInfo = watchedPathQueue.take();
        } catch (InterruptedException e) {
          if (shutdown.get()) {
            LOG.info("Shutting down WatchExpirer");
            break;
          } else {
            LOG.error("WatchExpirer interrupted before being shutdown");
            throw new RuntimeException("WatchExpirer interrupted before being shutdown", e);
          }
        }
        WatchKey watchKey = pathInfo.getWatchKey();
        if (watchKey != null && watchKey.isValid()) {
          watchKey.cancel();
        }
      }
      return null;
    }
  }


  private static class FoundPathInfo {
    Path indexPath;
    Path dataPath;

    public FoundPathInfo(Path indexPath, Path dataPath) {
      this.indexPath = indexPath;
      this.dataPath = dataPath;
    }

    boolean isComplete() {
      return indexPath != null && dataPath != null;
    }
  }

  private static class WatchedPathInfo implements Delayed {
    final long expiry;
    final Type type;
    final String appId;
    final int dagId;
    final String user;
    final String attemptId;
    final AttemptPathIdentifier pathIdentifier;
    WatchKey watchKey;

    public WatchedPathInfo(long expiry, Type type, String jobId, int dagId, String user) {
      this.expiry = expiry;
      this.type = type;
      this.appId = jobId;
      this.dagId = dagId;
      this.user = user;
      this.attemptId = null;
      this.pathIdentifier = null;
    }

    public WatchedPathInfo(WatchedPathInfo other, Type type, String attemptId) {
      this.expiry = other.expiry;
      this.appId = other.appId;
      this.user = other.user;
      this.dagId = other.dagId;
      this.type = type;
      this.attemptId = attemptId;
      if (attemptId != null) {
        pathIdentifier = new AttemptPathIdentifier(appId, dagId, user, attemptId);
      } else {
        pathIdentifier = null;
      }
    }

    synchronized void setWatchKey(WatchKey watchKey) {
      this.watchKey = watchKey;
    }

    synchronized WatchKey getWatchKey() {
      return this.watchKey;
    }

    @Override
    public long getDelay(TimeUnit unit) {
      return expiry - System.currentTimeMillis();
    }

    @Override
    public int compareTo(Delayed o) {
      WatchedPathInfo other = (WatchedPathInfo)o;
      if (other.expiry > this.expiry) {
        return -1;
      } else if (other.expiry < this.expiry) {
        return 1;
      } else {
        return 0;
      }
    }
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy