import java.io.IOException;
import java.net.URI; import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.JobID;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.TaskAttemptID;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.FileSplit;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
import org.apache.hadoop.util.GenericOptionsParser; public class GetIDMapReduce {
/**
 * Configures and submits the map-only job that dumps context information
 * through {@link MyMapper1}.
 *
 * <p>The process exits with status 2 when the argument count is wrong,
 * 0 when the job succeeds and 1 when it fails.
 *
 * @param args exactly two entries: the input path and the output path
 * @throws IOException            propagated from job creation or submission
 * @throws ClassNotFoundException propagated from {@code waitForCompletion}
 * @throws InterruptedException   propagated from {@code waitForCompletion}
 */
public static void main(String[] args) throws IOException, ClassNotFoundException, InterruptedException {
    if (args.length != 2) {
        System.err.println("Usage: GetIDMapReduce <inputpath> <outputpath>");
        // Stop here: continuing would only fail later on args[0] / args[1].
        System.exit(2);
    }

    Configuration conf = new Configuration();
    Job job = Job.getInstance(conf, GetIDMapReduce.class.getSimpleName() + "1");
    job.setJarByClass(GetIDMapReduce.class);

    // Map-only job: the mapper's output is the job's output.
    job.setMapperClass(MyMapper1.class);
    job.setNumReduceTasks(0);

    // MyMapper1 emits <Text, NullWritable>; declare the same types everywhere.
    job.setMapOutputKeyClass(Text.class);
    job.setMapOutputValueClass(NullWritable.class);
    job.setOutputKeyClass(Text.class);
    job.setOutputValueClass(NullWritable.class);

    job.setInputFormatClass(TextInputFormat.class);
    job.setOutputFormatClass(TextOutputFormat.class);
    FileInputFormat.addInputPath(job, new Path(args[0]));
    FileOutputFormat.setOutputPath(job, new Path(args[1]));

    // Report job success or failure to the caller through the exit status.
    System.exit(job.waitForCompletion(true) ? 0 : 1);
}
/**
 * Demonstration mapper: for every input record it writes one line per piece
 * of information obtainable from the task {@code Context} (file name, job id,
 * current key/value, job name, task attempt id, progress, ...).
 *
 * <p>Each output key has the form {@code label--value}; the output value is
 * always {@link NullWritable}.
 */
public static class MyMapper1 extends Mapper<LongWritable, Text, Text, NullWritable> {

    /**
     * Writes the context information for the current record.
     *
     * @param key     offset key of the current record (read back via the context)
     * @param value   content of the current record (read back via the context)
     * @param context task context that is queried and written to
     * @throws IOException          propagated from the context accessors or {@code write}
     * @throws InterruptedException propagated from the context accessors or {@code write}
     */
    @Override
    protected void map(LongWritable key, Text value, Context context)
            throws IOException, InterruptedException {
        FileSplit fileSplit = (FileSplit) context.getInputSplit();
        String pathname = fileSplit.getPath().getName();        // name of the file this split belongs to
        JobID jobid = context.getJobID();                       // job id
        LongWritable keyout = context.getCurrentKey();          // current key (offset)
        Text valueout = context.getCurrentValue();              // current value (one line)
        String jobname = context.getJobName();                  // job name
        TaskAttemptID taskid = context.getTaskAttemptID();      // task attempt id
        float progress = context.getProgress();                 // task progress
        String jar = context.getJar();                          // job jar; may be null
        String user = context.getUser();                        // current user
        int numReduceTasks = context.getNumReduceTasks();       // number of reduce tasks
        Configuration configuration = context.getConfiguration(); // job configuration
        boolean jobSetupCleanupNeeded = context.getJobSetupCleanupNeeded(); // whether job-setup and job-cleanup are needed
        int maxMapAttempts = context.getMaxMapAttempts();       // max number of attempts per map task
        int maxReduceAttempts = context.getMaxReduceAttempts(); // max number of attempts per reduce task
        Path workingDirectory = context.getWorkingDirectory();  // working directory
        URI[] cacheArchives = context.getCacheArchives();       // cache archives set in the Configuration
        Path[] archiveClassPaths = context.getArchiveClassPaths(); // archive entries in the classpath
        boolean profileEnabled = context.getProfileEnabled();   // whether task profiling is enabled
        // Originally intended to check if symlinks should be used, but
        // currently symlinks cannot be disabled.
        @SuppressWarnings("deprecation")
        boolean symlink = context.getSymlink();

        // context.nextKeyValue() is deliberately NOT called here: it advances
        // the input, so the record the framework was about to pass to the
        // next map() call would be consumed and lost (and the key/value
        // fetched above would presumably no longer describe this record).
        //
        // Other accessors the original author left disabled: getStatus,
        // getFileTimestamps, getFileClassPaths, getGroupingComparator,
        // getLocalCacheFiles, getOutputCommitter, getCacheFiles,
        // getProfileParams, getSortComparator, hashCode.

        context.write(new Text("===================================================================================="), NullWritable.get());
        emit(context, "pathname", pathname);
        emit(context, "jobid", jobid);
        emit(context, "keyout", keyout);
        emit(context, "valueout", valueout);
        emit(context, "jobname", jobname);
        emit(context, "taskid", taskid);
        emit(context, "progress", progress);
        emit(context, "jar", jar);
        emit(context, "user", user);
        emit(context, "numReduceTasks", numReduceTasks);
        emit(context, "configuration", configuration);
        emit(context, "jobSetupCleanupNeeded", jobSetupCleanupNeeded);
        emit(context, "maxMapAttempts", maxMapAttempts);
        emit(context, "maxReduceAttempts", maxReduceAttempts);
        emit(context, "workingDirectory", workingDirectory);
        // Arrays.toString prints the elements (and "null" for a null array)
        // instead of the array's identity hash.
        emit(context, "cacheArchives", java.util.Arrays.toString(cacheArchives));
        emit(context, "archiveClassPaths", java.util.Arrays.toString(archiveClassPaths));
        emit(context, "profileEnabled", profileEnabled);
        emit(context, "symlink", symlink);
    }

    /** Writes one {@code label--value} line; a null value is rendered as "null". */
    private void emit(Context context, String label, Object value)
            throws IOException, InterruptedException {
        context.write(new Text(label + "--" + value), NullWritable.get());
    }
}
}

注:并非原著,备注下来方便后面自己查看

hadoop上下文信息获取方法的更多相关文章

  1. spring上下文快速获取方法

    import org.springframework.beans.BeansException;import org.springframework.context.ApplicationContex ...

  2. JavaScript获取客户端计算机硬件及系统等信息的方法

    JavaScript获取客户端计算机硬件及系统等信息的方法 JavaScript 获取客户端计算机硬件及系统信息 通过WMI来实现获取客户端计算机硬件及系统信息: function getSysInf ...

  3. AspectJ获取方法注解的信息

    在使用Aspectj获取方法注解信息的时候,可以使用下面的代码片段: /** * Get value of annotated method parameter */ private <T ex ...

  4. PHP获取http头信息和CI中获取HTTP头信息的方法

    CI中获取HTTP头信息的方法: $this->input->request_headers() 在不支持apache_request_headers()的非Apache环境非常有用.返回 ...

  5. Request获取url各种信息的方法

    1.Request获取url各种信息的方法 测试的url地址:http://www.test.com/testweb/default.aspx, 结果如下: Request.ApplicationPa ...

  6. Oracle 和 SQLSERVER 重新获取统计信息的方法

    1. Oracle 重新获取统计信息的命令 exec dbms_stats.gather_schema_stats(ownname =>) # 需要修改 ownername options 指定 ...

  7. httpclient接口测试完整用例以及获取信息的方法

    原文地址https://blog.csdn.net/fhaohaizi/article/details/78088075 原文地址https://blog.csdn.net/fhaohaizi/art ...

  8. java反射子之获取方法信息(二)

    一.获取方法 1.方法作用. 2. 二.获取方法信息.(修饰符,返回值,方法名称,参数列表,抛出的异常). ############################################## ...

  9. laravel中单独获取一个错误信息的方法

    获取单独的错误信息的方法

随机推荐

  1. WPF 之 DataTemplate 实例(摘抄)

     

  2. SAX解析xml (遍历DOM树各节点)

    本文参考 http://yangjunfeng.iteye.com/blog/401377 1. books.xml <?xml version="1.0" encoding ...

  3. Bi-LSTM-CRF for Sequence Labeling

    做了一段时间的Sequence Labeling的工作,发现在NER任务上面,很多论文都采用LSTM-CRFs的结构.CRF在最后一层应用进来可以考虑到概率最大的最优label路径,可以提高指标. 一 ...

  4. [转]什么是CNN、RNN、LSTM

    . 全连层 每个神经元输入: 每个神经元输出: (通过一个激活函数) 2. RNN(Recurrent Neural Network) 与传统的神经网络不同,RNN与时间有关. 3. LSTM(Lon ...

  5. Python--day40--全局解释器锁

    1,起一百个线程和起一百个进程所花的时间对比(开启效率的较量): import time from threading import Thread from multiprocessing impor ...

  6. UVA 11400"Lighting System Design"

    传送门 错误思路 正解 AC代码 参考资料: [1]:https://www.cnblogs.com/Kiraa/p/5510757.html 题意: 现给你一套照明系统,这套照明系统共包含 n 种类 ...

  7. 备战省赛组队训练赛第十七场(UPC)

    upc:传送门 A: 题解[1] G: 题解[1] D,G,H,J,L 题解 by 鲁东大学

  8. jQuery---鼠标滚轮控制div横向滚动条左右移动

    HTML <div class="table-responsive"> <div class="fhtable" style="wi ...

  9. 2018宁夏邀请赛 L Continuous Intervals(单调栈+线段树)

    2018宁夏邀请赛 L Continuous Intervals(单调栈+线段树) 传送门:https://nanti.jisuanke.com/t/41296 题意: 给一个数列A 问在数列A中有多 ...

  10. 树莓派4安装ftp服务端

    vsftpd是开源的轻量级的常用ftp服务器.   1,安装vsftpd服务器 (约400KB) sudo apt-get install vsftpd     2,启动ftp服务 sudo serv ...