All downloads are free. The search and download functionality uses the official Maven repository.

com.antbrains.urlcrawler.db.ViewFailedTask Maven / Gradle / Ivy

package com.antbrains.urlcrawler.db;

import java.io.BufferedReader;
import java.io.FileInputStream;
import java.io.InputStreamReader; 
import java.util.ArrayList;
import java.util.List;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.client.Connection;
import org.apache.hadoop.hbase.client.ConnectionFactory;
import org.apache.log4j.Logger;

import com.google.gson.Gson;
 

/**
 * Command-line utility that fetches failed crawl tasks through
 * {@code HbaseTool.getFailedTasks} and prints each one to standard output
 * as a JSON document, one task per line.
 *
 * <p>Usage: {@code ViewFailedTask zk dbName [total]}
 */
public class ViewFailedTask {
	protected static Logger logger=Logger.getLogger(ViewFailedTask.class);

	/**
	 * Entry point.
	 *
	 * @param args {@code args[0]} is written to the {@code hbase.zookeeper.quorum}
	 *             setting; {@code args[1]} is the database name handed to
	 *             {@code HbaseTool.getFailedTasks}; the optional {@code args[2]}
	 *             is the {@code total} value handed to the same call
	 *             (defaults to 1000)
	 * @throws Exception if the HBase connection cannot be created or the lookup fails
	 */
	public static void main(String[] args) throws Exception {
		if (args.length < 2) {
			System.err.println("need at least 2 arg:  zk dbName [total]");
			System.exit(-1);
		}
		Configuration myConf = HBaseConfiguration.create();
		myConf.set("hbase.zookeeper.quorum", args[0]);
		String dbName = args[1];

		int total = 1000;
		if (args.length > 2) {
			try {
				total = Integer.parseInt(args[2]);
			} catch (NumberFormatException e) {
				// Report a bad argument the same way as a missing one instead of
				// dying with a raw stack trace.
				System.err.println("total must be an integer, got: " + args[2]);
				System.exit(-1);
			}
		}

		Gson gson = new Gson();
		// try-with-resources guarantees the connection is closed even when the
		// lookup or the JSON serialization throws.
		try (Connection conn = ConnectionFactory.createConnection(myConf)) {
			// NOTE(review): the meaning of the trailing 0 argument is defined by
			// HbaseTool.getFailedTasks, which is not visible here - confirm.
			List<CrawlTask> tasks = HbaseTool.getFailedTasks(dbName, conn, total, 0);
			for (CrawlTask task : tasks) {
				System.out.println(gson.toJson(task));
			}
		}
	}

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy