<!--
  Batch job "newsSimJob": four steps chained through their "next" attributes,
  executed in this order:
    news_sim_script_step, news_sim_hdp_step, news_sim_cp2local_step, new_sim_redis_step
  Each step delegates its work to the tasklet bean named by "ref"; those beans
  are defined outside this fragment.
-->
<batch:job id="newsSimJob">

    <!-- Step 1: entry step of the job. -->
    <batch:step id="news_sim_script_step" next="news_sim_hdp_step">
        <batch:tasklet ref="news_sim_script_tasklet"/>
    </batch:step>

    <!-- Step 2: runs after the script step. -->
    <batch:step id="news_sim_hdp_step" next="news_sim_cp2local_step">
        <batch:tasklet ref="news_sim_tasklet"/>
    </batch:step>

    <!-- Step 3: runs after the hdp step. -->
    <batch:step id="news_sim_cp2local_step" next="new_sim_redis_step">
        <batch:tasklet ref="news_sim_cp2local_tasklet"/>
    </batch:step>

    <!-- Step 4: final step (no "next" attribute, so the flow ends here). -->
    <batch:step id="new_sim_redis_step">
        <batch:tasklet ref="simOutputTask"/>
    </batch:step>

</batch:job>
<!--
  Hadoop MapReduce job bean "news_convert_sim_job".

  Reads from ${sim.input.path}/news/length/ and writes to
  ${sim.output.path}/news/convert/, using the mapper/reducer classes packaged
  in ${jar.file.path} and the Hadoop configuration bean "hadoopConfiguration".

  Every class-name attribute must be a fully-qualified Java class name with no
  embedded or trailing whitespace; otherwise the class cannot be resolved.

  scope="prototype": Spring creates a new bean instance on every lookup of
  this bean id instead of sharing a single instance.

  NOTE(review): "MapClass" and "Reduce" look like nested classes of
  SimConvertJob. If dot notation does not resolve them, use the binary names
  (SimConvertJob$MapClass / SimConvertJob$Reduce). Confirm against the jar.
-->
<hdp:job id="news_convert_sim_job"
         input-path="${sim.input.path}/news/length/"
         output-path="${sim.output.path}/news/convert/"
         mapper="com.xxx.wap.algorithm.mapred.sim.SimConvertJob.MapClass"
         reducer="com.xxx.wap.algorithm.mapred.sim.SimConvertJob.Reduce"
         jar="${jar.file.path}"
         input-format="org.apache.hadoop.mapreduce.lib.input.TextInputFormat"
         output-format="org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat"
         map-key="org.apache.hadoop.io.Text"
         map-value="com.xxx.wap.algorithm.model.sim.SimKeyValue"
         key="org.apache.hadoop.io.Text"
         value="com.xxx.wap.algorithm.model.sim.SimKeyValueSet"
         configuration-ref="hadoopConfiguration"
         scope="prototype"/>
If I execute the job again, must I write this configuration again? How can I create a different Hadoop job with `<hdp:job>`?


Reply With Quote