org.apache.hadoop.streaming.JarBuilder Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of hadoop-streaming Show documentation
Show all versions of hadoop-streaming Show documentation
Apache Hadoop MapReduce Streaming
The newest version!
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.streaming;
import java.io.*;
import java.util.*;
import java.util.jar.*;
import java.util.zip.ZipException;
/**
 * Builds the job.jar for Hadoop Streaming jobs.
 *
 * <p>The jar contains the files specified with the -file option. Because
 * hadoop-streaming is a user level application, all the hadoop-streaming
 * classes that are needed in the job are also included in the job.jar.
 *
 * <p>An instance reuses a single copy buffer for every entry it writes, so
 * one instance must not be used by several threads at the same time.
 */
public class JarBuilder {

  /** Creates a builder with verbose output disabled. */
  public JarBuilder() {
  }

  /**
   * Enables or disables progress messages on {@code System.err}.
   *
   * @param v {@code true} to log every entry that is added or skipped
   */
  public void setVerbose(boolean v) {
    this.verbose = v;
  }

  /**
   * Creates {@code dstJar} from plain files/directories and from the contents
   * of existing jars.
   *
   * @param srcNames paths (as {@code String}) of files or directories to add;
   *        may be {@code null}. Files are placed under the base path chosen by
   *        {@link #getBasePathInJarOut(String)}; directories are added
   *        recursively.
   * @param srcUnjar paths (as {@code String}) of jar/zip files whose entries
   *        are copied into the output; may be {@code null}
   * @param dstJar path of the jar file to write
   * @throws FileNotFoundException if an element of {@code srcNames} does not exist
   * @throws IOException if reading a source or writing the jar fails
   */
  public void merge(List srcNames, List srcUnjar, String dstJar) throws IOException {
    JarOutputStream jarOut = new JarOutputStream(new FileOutputStream(dstJar));
    // Stays false whenever the body exits through an exception, whatever its type.
    boolean completed = false;
    try {
      if (srcNames != null) {
        for (Object element : srcNames) {
          String source = (String) element;
          File fsource = new File(source);
          if (!fsource.exists()) {
            throw new FileNotFoundException(fsource.getAbsolutePath());
          }
          String base = getBasePathInJarOut(source);
          if (fsource.isDirectory()) {
            addDirectory(jarOut, base, fsource, 0);
          } else {
            addFileStream(jarOut, base, fsource);
          }
        }
      }
      if (srcUnjar != null) {
        for (Object element : srcUnjar) {
          JarFile jarSource = new JarFile((String) element);
          try {
            addJarEntries(jarOut, jarSource);
          } finally {
            // Release the source jar even when copying one of its entries fails.
            jarSource.close();
          }
        }
      }
      completed = true;
    } finally {
      try {
        jarOut.close();
      } catch (ZipException z) {
        // Only report a close failure when nothing else went wrong; otherwise
        // it would replace the exception that describes the real problem.
        if (completed) {
          IOException wrapped = new IOException(z.toString());
          wrapped.initCause(z);
          throw wrapped;
        }
      } catch (IOException e) {
        if (completed) {
          throw e;
        }
      }
    }
  }

  /**
   * Returns the extension of the last path component of {@code file}.
   *
   * <p>Only {@code '/'} is treated as a path separator.
   *
   * @param file a file path
   * @return the text after the last {@code '.'} of the leaf name, or an empty
   *         string when the path ends with {@code '/'} or the leaf has no dot
   */
  protected String fileExtension(String file) {
    int leafPos = file.lastIndexOf('/');
    if (leafPos == file.length() - 1) {
      return "";
    }
    String leafName = file.substring(leafPos + 1);
    int dotPos = leafName.lastIndexOf('.');
    if (dotPos == -1) {
      return "";
    }
    return leafName.substring(dotPos + 1);
  }

  /**
   * Chooses the directory inside the output jar for a source file, based on
   * its extension.
   *
   * @param sourceFile path of the source file
   * @return empty or a jar base path. Must not start with '/'
   */
  protected String getBasePathInJarOut(String sourceFile) {
    // TaskRunner will unjar and append to classpath: .:classes/:lib/*
    String ext = fileExtension(sourceFile);
    if (ext.equals("class")) {
      return "classes/"; // or ""
    } else if (ext.equals("jar") || ext.equals("zip")) {
      return "lib/";
    } else {
      return "";
    }
  }

  /**
   * Copies every entry of {@code src} into {@code dst} under the same name.
   *
   * @param dst jar being written
   * @param src jar whose entries are copied
   * @throws IOException if an entry cannot be read or written
   */
  private void addJarEntries(JarOutputStream dst, JarFile src) throws IOException {
    Enumeration<JarEntry> entries = src.entries();
    while (entries.hasMoreElements()) {
      JarEntry entry = entries.nextElement();
      InputStream in = src.getInputStream(entry);
      addNamedStream(dst, entry.getName(), in);
    }
  }

  /**
   * Writes the content of {@code in} to {@code dst} as a new entry and closes
   * {@code in}. An entry whose name is already present in the jar is skipped.
   *
   * @param dst jar being written
   * @param name path in jar for this jar element. Must not start with '/'
   * @param in content of the entry; always closed by this method
   * @throws IOException if reading or writing fails for any reason other than
   *         a duplicate entry
   */
  void addNamedStream(JarOutputStream dst, String name, InputStream in) throws IOException {
    if (verbose) {
      System.err.println("JarBuilder.addNamedStream " + name);
    }
    try {
      dst.putNextEntry(new JarEntry(name));
      int bytesRead;
      while ((bytesRead = in.read(buffer, 0, BUFF_SIZE)) != -1) {
        dst.write(buffer, 0, bytesRead);
      }
    } catch (ZipException ze) {
      // The message may be null; in that case it is not a duplicate report.
      String message = ze.getMessage();
      if (message != null && message.indexOf("duplicate entry") >= 0) {
        if (verbose) {
          System.err.println(ze + " Skip duplicate entry " + name);
        }
      } else {
        throw ze;
      }
    } finally {
      try {
        in.close();
      } finally {
        // Finish the entry even if closing the input failed.
        dst.flush();
        dst.closeEntry();
      }
    }
  }

  /**
   * Adds a single file to the jar as {@code jarBaseName + file.getName()}.
   *
   * @param dst jar being written
   * @param jarBaseName directory prefix inside the jar; empty or ending with '/'
   * @param file file to add
   * @throws IOException if the file cannot be read or the entry cannot be written
   */
  void addFileStream(JarOutputStream dst, String jarBaseName, File file) throws IOException {
    FileInputStream in = new FileInputStream(file);
    try {
      String name = jarBaseName + file.getName();
      addNamedStream(dst, name, in);
    } finally {
      in.close();
    }
  }

  /**
   * Recursively adds the files below {@code dir} to the jar.
   *
   * <p>The name of the top-level directory ({@code depth == 0}) is not part of
   * the entry names; names of nested directories are. Entry names never start
   * with '/' and never contain empty path segments.
   *
   * @param dst jar being written
   * @param jarBaseName path inside the jar of the parent of {@code dir};
   *        may be empty and may end with '/'
   * @param dir directory to add
   * @param depth 0 for the directory passed by the caller, incremented for
   *        every nesting level
   * @throws IOException if a file cannot be read or an entry cannot be written
   */
  void addDirectory(JarOutputStream dst, String jarBaseName, File dir, int depth) throws IOException {
    File[] contents = dir.listFiles();
    if (contents == null) {
      return;
    }
    String dirPath = stripTrailingSlashes(jarBaseName);
    if (depth > 0) {
      dirPath = (dirPath.length() == 0) ? dir.getName() : dirPath + "/" + dir.getName();
    }
    // An empty path must stay empty: prefixing "/" would create absolute entry names.
    String filePrefix = (dirPath.length() == 0) ? "" : dirPath + "/";
    for (File f : contents) {
      if (f.isDirectory()) {
        addDirectory(dst, dirPath, f, depth + 1);
      } else {
        addFileStream(dst, filePrefix, f);
      }
    }
  }

  /** Returns {@code path} without any '/' characters at its end. */
  private static String stripTrailingSlashes(String path) {
    int end = path.length();
    while (end > 0 && path.charAt(end - 1) == '/') {
      end--;
    }
    return path.substring(0, end);
  }

  /**
   * Test program. The first argument is the jar to create; each following
   * argument with a "jar" or "zip" extension is merged entry by entry, every
   * other argument is added as a file or directory.
   */
  public static void main(String args[]) {
    // args = new String[] { "C:/Temp/merged.jar", "C:/jdk1.5.0/jre/lib/ext/dnsns.jar", "/Temp/addtojar2.log", "C:/jdk1.5.0/jre/lib/ext/mtest.jar", "C:/Temp/base"};
    if (args.length < 2) {
      System.err.println("Usage: JarFiles merged.jar [src.jar | dir | file ]+");
    } else {
      JarBuilder jarFiles = new JarBuilder();
      List<String> names = new ArrayList<String>();
      List<String> unjar = new ArrayList<String>();
      for (int i = 1; i < args.length; i++) {
        String f = args[i];
        String ext = jarFiles.fileExtension(f);
        boolean expandAsJar = ext.equals("jar") || ext.equals("zip");
        if (expandAsJar) {
          unjar.add(f);
        } else {
          names.add(f);
        }
      }
      try {
        jarFiles.merge(names, unjar, args[0]);
        Date lastMod = new Date(new File(args[0]).lastModified());
        System.out.println("Merge done to " + args[0] + " " + lastMod);
      } catch (Exception ge) {
        ge.printStackTrace(System.err);
      }
    }
  }

  /** Size in bytes of the copy buffer. */
  private static final int BUFF_SIZE = 32 * 1024;
  /** Copy buffer shared by all entries written through this instance. */
  private byte buffer[] = new byte[BUFF_SIZE];
  /** Whether progress messages are written to {@code System.err}. */
  protected boolean verbose = false;
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy