Hive 中 SQL 的运行日志如下：
2022-10-17 10:33:04 INFO Diagnostic Messages for this Task:
2022-10-17 10:33:04 INFO Error: java.io.IOException: java.lang.reflect.InvocationTargetException
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.io.HiveIOExceptionHandlerChain.handleRecordReaderCreationException(HiveIOExceptionHandlerChain.java:97)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.io.HiveIOExceptionHandlerUtil.handleRecordReaderCreationException(HiveIOExceptionHandlerUtil.java:57)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.initNextRecordReader(HadoopShimsSecure.java:266)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.<init>(HadoopShimsSecure.java:213)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileInputFormatShim.getRecordReader(HadoopShimsSecure.java:333)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.ql.io.CombineHiveInputFormat.getRecordReader(CombineHiveInputFormat.java:729)
2022-10-17 10:33:04 INFO at org.apache.hadoop.mapred.MapTask$TrackedRecordReader.<init>(MapTask.java:169)
2022-10-17 10:33:04 INFO at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:432)
2022-10-17 10:33:04 INFO at org.apache.hadoop.mapred.MapTask.run(MapTask.java:343)
2022-10-17 10:33:04 INFO at org.apache.hadoop.mapred.YarnChild$2.run(YarnChild.java:169)
2022-10-17 10:33:04 INFO at java.security.AccessController.doPrivileged(Native Method)
2022-10-17 10:33:04 INFO at javax.security.auth.Subject.doAs(Subject.java:422)
2022-10-17 10:33:04 INFO at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1995)
2022-10-17 10:33:04 INFO at org.apache.hadoop.mapred.YarnChild.main(YarnChild.java:162)
2022-10-17 10:33:04 INFO Caused by: java.lang.reflect.InvocationTargetException
2022-10-17 10:33:04 INFO at sun.reflect.NativeConstructorAccessorImpl.newInstance0(Native Method)
2022-10-17 10:33:04 INFO at sun.reflect.NativeConstructorAccessorImpl.newInstance(NativeConstructorAccessorImpl.java:62)
2022-10-17 10:33:04 INFO at sun.reflect.DelegatingConstructorAccessorImpl.newInstance(DelegatingConstructorAccessorImpl.java:45)
2022-10-17 10:33:04 INFO at java.lang.reflect.Constructor.newInstance(Constructor.java:423)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.shims.HadoopShimsSecure$CombineFileRecordReader.initNextRecordReader(HadoopShimsSecure.java:252)
2022-10-17 10:33:04 INFO ... 11 more
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.INodeFile.valueOf(INodeFile.java:86)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.INodeFile.valueOf(INodeFile.java:76)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.FSDirStatAndListingOp.getBlockLocations(FSDirStatAndListingOp.java:155)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.FSNamesystem.getBlockLocations(FSNamesystem.java:2150)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.NameNodeRpcServer.getBlockLocations(NameNodeRpcServer.java:795)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.protocolPB.ClientNamenodeProtocolServerSideTranslatorPB.getBlockLocations(ClientNamenodeProtocolServerSideTranslatorPB.java:493)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.ProtobufRpcEngine$Server$ProtoBufRpcInvoker.call(ProtobufRpcEngine.java:554)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.RPC$Server.call(RPC.java:1105)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Server$RpcCall.run(Server.java:1069)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Server$RpcCall.run(Server.java:996)
2022-10-17 10:33:04 INFO at java.base/javax.security.auth.Subject.doAs(Subject.java:423)
2022-10-17 10:33:04 INFO at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:2010)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Server$Handler.run(Server.java:3061)
2022-10-17 10:33:04 INFO
2022-10-17 10:33:04 INFO at sun.reflect.NativeConstructorAccessorImpl.newInstance0(Native Method)
2022-10-17 10:33:04 INFO at sun.reflect.NativeConstructorAccessorImpl.newInstance(NativeConstructorAccessorImpl.java:62)
2022-10-17 10:33:04 INFO at sun.reflect.DelegatingConstructorAccessorImpl.newInstance(DelegatingConstructorAccessorImpl.java:45)
2022-10-17 10:33:04 INFO at java.lang.reflect.Constructor.newInstance(Constructor.java:423)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.RemoteException.instantiateException(RemoteException.java:106)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.RemoteException.unwrapRemoteException(RemoteException.java:73)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DFSClient.callGetBlockLocations(DFSClient.java:951)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DFSClient.getLocatedBlocks(DFSClient.java:938)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DFSClient.getLocatedBlocks(DFSClient.java:927)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DFSClient.open(DFSClient.java:1105)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DistributedFileSystem$4.doCall(DistributedFileSystem.java:381)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DistributedFileSystem$4.doCall(DistributedFileSystem.java:376)
2022-10-17 10:33:04 INFO at org.apache.hadoop.fs.FileSystemLinkResolver.resolve(FileSystemLinkResolver.java:81)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DistributedFileSystem.open(DistributedFileSystem.java:399)
2022-10-17 10:33:04 INFO at org.apache.hadoop.fs.FileSystem.open(FileSystem.java:900)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.ql.io.orc.ReaderImpl.extractMetaInfoFromFooter(ReaderImpl.java:356)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.ql.io.orc.ReaderImpl.<init>(ReaderImpl.java:317)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.ql.io.orc.OrcFile.createReader(OrcFile.java:190)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.ql.io.orc.OrcInputFormat.getRecordReader(OrcInputFormat.java:1121)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hive.ql.io.CombineHiveRecordReader.<init>(CombineHiveRecordReader.java:67)
2022-10-17 10:33:04 INFO ... 16 more
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.INodeFile.valueOf(INodeFile.java:86)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.INodeFile.valueOf(INodeFile.java:76)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.FSDirStatAndListingOp.getBlockLocations(FSDirStatAndListingOp.java:155)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.FSNamesystem.getBlockLocations(FSNamesystem.java:2150)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.server.namenode.NameNodeRpcServer.getBlockLocations(NameNodeRpcServer.java:795)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.protocolPB.ClientNamenodeProtocolServerSideTranslatorPB.getBlockLocations(ClientNamenodeProtocolServerSideTranslatorPB.java:493)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.ProtobufRpcEngine$Server$ProtoBufRpcInvoker.call(ProtobufRpcEngine.java:554)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.RPC$Server.call(RPC.java:1105)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Server$RpcCall.run(Server.java:1069)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Server$RpcCall.run(Server.java:996)
2022-10-17 10:33:04 INFO at java.base/javax.security.auth.Subject.doAs(Subject.java:423)
2022-10-17 10:33:04 INFO at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:2010)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Server$Handler.run(Server.java:3061)
2022-10-17 10:33:04 INFO
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Client.getRpcResponse(Client.java:1665)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Client.call(Client.java:1611)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.Client.call(Client.java:1509)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.ProtobufRpcEngine$Invoker.invoke(ProtobufRpcEngine.java:257)
2022-10-17 10:33:04 INFO at org.apache.hadoop.ipc.ProtobufRpcEngine$Invoker.invoke(ProtobufRpcEngine.java:131)
2022-10-17 10:33:04 INFO at com.sun.proxy.$Proxy14.getBlockLocations(Unknown Source)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.protocolPB.ClientNamenodeProtocolTranslatorPB.getBlockLocations(ClientNamenodeProtocolTranslatorPB.java:364)
2022-10-17 10:33:04 INFO at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
2022-10-17 10:33:04 INFO at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
2022-10-17 10:33:04 INFO at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
2022-10-17 10:33:04 INFO at java.lang.reflect.Method.invoke(Method.java:498)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.ObserverReadProxyProvider$ObserverReadInvocationHandler.invoke(ObserverReadProxyProvider.java:524)
2022-10-17 10:33:04 INFO at com.sun.proxy.$Proxy11.getBlockLocations(Unknown Source)
2022-10-17 10:33:04 INFO at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
2022-10-17 10:33:04 INFO at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
2022-10-17 10:33:04 INFO at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
2022-10-17 10:33:04 INFO at java.lang.reflect.Method.invoke(Method.java:498)
2022-10-17 10:33:04 INFO at org.apache.hadoop.io.retry.RetryInvocationHandler.invokeMethod(RetryInvocationHandler.java:434)
2022-10-17 10:33:04 INFO at org.apache.hadoop.io.retry.RetryInvocationHandler$Call.invokeMethod(RetryInvocationHandler.java:166)
2022-10-17 10:33:04 INFO at org.apache.hadoop.io.retry.RetryInvocationHandler$Call.invoke(RetryInvocationHandler.java:158)
2022-10-17 10:33:04 INFO at org.apache.hadoop.io.retry.RetryInvocationHandler$Call.invokeOnce(RetryInvocationHandler.java:96)
2022-10-17 10:33:04 INFO at org.apache.hadoop.io.retry.RetryInvocationHandler.invoke(RetryInvocationHandler.java:360)
2022-10-17 10:33:04 INFO at com.sun.proxy.$Proxy11.getBlockLocations(Unknown Source)
2022-10-17 10:33:04 INFO at org.apache.hadoop.hdfs.DFSClient.callGetBlockLocations(DFSClient.java:949)
2022-10-17 10:33:04 INFO ... 29 more
2022-10-17 10:33:04 INFO
2022-10-17 10:33:04 INFO
2022-10-17 10:33:04 INFO FAILED: Execution Error, return code 2 from org.apache.hadoop.hive.ql.exec.mr.MapRedTask
根据上述日志分析，报错是由于 SQL 中缺少必要的参数设置所致。开启 MapReduce 中间结果压缩，并将压缩方式设置为 Snappy 即可，参数如下：
SET hive.exec.compress.intermediate=TRUE;
SET mapred.map.output.compression.codec=org.apache.hadoop.io.compress.SnappyCodec;
SET mapred.output.compression.codec=org.apache.hadoop.io.compress.SnappyCodec;