Hive 避免小文件

-- Session settings intended to reduce small files in Hive jobs: pack small
-- inputs into larger splits, then merge small output files when a job ends.
-- All sizes below are byte counts.

-- Input side: combine small input files into shared splits.
SET hive.input.format=org.apache.hadoop.hive.ql.io.CombineHiveInputFormat;
-- Upper bound on the size of one combined split.
SET mapred.max.split.size=256000000;
-- Minimum split size to form when combining within a node, then within a rack.
SET mapred.min.split.size.per.node=100000000;
SET mapred.min.split.size.per.rack=100000000;
-- NOTE(review): the mapred.* split keys are legacy names; newer Hadoop releases
-- list them as mapreduce.input.fileinputformat.split.* -- confirm which form
-- the target cluster expects before renaming.

-- Output side: merge small result files at the end of a job.
-- Enable merging for map-only jobs and for map-reduce jobs.
SET hive.merge.mapfiles=true;
SET hive.merge.mapredfiles=true;
-- Target size of each merged file.
SET hive.merge.size.per.task=256000000;
-- Average output-file size below which the extra merge step is triggered.
SET hive.merge.smallfiles.avgsize=16000000;
posted @ 2022-04-29 14:25  小白啊小白,Fighting  阅读(57)  评论(0)  编辑  收藏  举报