shell调用mapreduce无法执行后续脚本问题

时间:2022-01-23 11:33:27

把mapreduce打成jar包然后用shell去调用,但是mapreduce执行结束后,总是卡在那里不会继续往下执行,今天写了个循环来检测,可以达到目的。

#!/bin/sh
set -x
deal_date=${1:-`date --date '1 days ago' +%Y%m%d`}
deal_date=20140616
hadoop fs -rmr /user/hdfs/result/TermActiveJob/${deal_date}/
java -classpath /home/mapreduceProgram/dotStat/dotstat_v2-0.0.1-SNAPSHOT.jar com.winksi.dotstat.TermActiveJob ${deal_date} &
# &符号是让上面的语句在后台执行,然后无间歇的执行下面的语句
while true
do
  sleep 1s #1秒钟循环一次
  hadoop fs -test -e /user/hdfs/result/TermActiveJob/${deal_date}/part*   #该文件时mapreduce执行结束后生成的文件
   if [ $? -ne 0 ]; then
     echo "Directory not exists!"
   else
     echo "it is exist!"
     ps -ef  |grep TermActiveJob  |awk '{print $2}'  |while read pid   #如果生成的文件存在,那么就杀死mapreduce的进程
        do
                kill -9 $pid
        done
     #进行后续的收尾操作
     mkdir /root/hanfeng/shell/TermActiveJob
     cd /root/hanfeng/shell/TermActiveJob
     rm -rf *
     hadoop fs -get /user/hdfs/result/TermActiveJob/${deal_date}/part*
     cat part* > result.txt
     echo "DELETE FROM term_active wHERE cur_time=${deal_date} ;" | mysql -h172.16.1.81 -P3308 -uadmin -ptonggangdasha reportdb
     echo "LOAD DATA local INFILE 'result.txt' INTO TABLE term_active FIELDS TERMINATED BY ',' LINES TERMINATED BY '\n' (adccompany,cityId,av,model,num,cur_time) ;" | mysql -h172.16.1.81 -P3308 -uadmin -ptonggangdasha reportdb;
     break
    fi
done

echo "Finish"

------------------------------------------------------------------------------------------------------------------------

重大发现:在老大的指点下,发现执行mapreduce无返回,是我代码的问题,后来经改正,代码如下:

public class ZdwsCombineJob extends Configured implements Tool{  //我之前就是没有实现Configured 和Tool,而是直接用main函数执行JOB,才不能结束的
	public static String date;
	public static String month;
	private int reducernum;
	public ZdwsCombineJob(int i){
		reducernum = i;
	}
	public static void main(String argv[]) throws Exception{
	
		if(argv.length != 0){
			date = argv[0];
			month = date.toString().substring(0, 6);
		}else{
			Date yesterdayDate = new Date(new Date().getTime() - 1*24*60*60*1000);
			date = DateUtils.getDotActionDate(yesterdayDate); //20140501
			month = DateUtils.getCurrentMonth(yesterdayDate);
		}
                //这里需要用线程来启动任务,执行结束后才能退出
                int	exit  = ToolRunner.run(new ZdwsCombineJob(48), argv);
		System.exit(exit);
	}

	@Override
	public int run(String[] args) throws Exception {
		Configuration conf = getConf();
		conf.set("fs.default.name", "hdfs://172.16.1.50:8020");  
		String input="/user/hdfs/source/db/cust_phone/cust_phone.txt";
		StringBuffer sb = new StringBuffer();
		sb.append("/user/hdfs/source/log/qymp/").append(month).append("/qymp_").append(date).append(".dat");
		String output="/user/hdfs/combine/ZdwsCombine/"+date+"/";
		Job job = new Job(conf, "ZdwsCombine");
		job.setJarByClass(ZdwsCombineJob.class);
		job.setMapperClass(ZdwsCombineMapper.class);
		job.setReducerClass(ZdwsCombineReducer.class);
		job.setOutputKeyClass(Text.class);
		job.setOutputValueClass(Text.class);
		FileInputFormat.addInputPath(job, new Path(input));
		FileInputFormat.addInputPath(job, new Path(sb.toString()));
		FileOutputFormat.setOutputPath(job, new Path(output));
		job.setNumReduceTasks(reducernum);
		job.waitForCompletion(true) ;

		return 0;
	}
}


这样的话,直接shell调用就可以了:

#!/bin/sh
set -x
deal_date=${1:-`date --date '1 days ago' +%Y%m%d`}
deal_date=20140617
hadoop fs -rmr /user/hdfs/combine/ZdwsCombine/${deal_date}/
java -classpath /home/mapreduceProgram/dotStat/dotstat_v2-0.0.1-SNAPSHOT.jar com.winksi.dotstat.ZdwsCombineJob ${deal_date}
mkdir /root/hanfeng/shell/ZdwsCombineJob
cd /root/hanfeng/shell/ZdwsCombineJob
rm -rf *
hive -S -e "alter table call_show_zdws add partition (dt='${deal_date}') location '/user/hdfs/combine/ZdwsCombine/${deal_date}'"
hive -S -e 'select phone,adccompany,cur_time,ip,model,av,enterpriseId,count(*),count(distinct(imsi)) from call_show_zdws where dt='${deal_date}' group by phone,adccompany,cur_time,ip,model,av,enterpriseId' > result.txt
echo "DELETE FROM call_show_zdws wHERE cur_time=${deal_date} ;" | mysql -h172.16.1.81 -P3308 -uadmin -ptonggangdasha reportdb
echo "LOAD DATA local INFILE 'result.txt' INTO TABLE call_show_zdws FIELDS TERMINATED BY '\t' LINES TERMINATED BY '\n' (phone,adccompany,cur_time,cityId,model,av,enterpriseId,pv,uv) ;" | mysql -h172.16.1.81 -P3308 -uadmin -ptonggangdasha reportdb;