I have a table stored as ORC files on HDFS, and I want to read it with Spark, but I got an error. There are 14 files in the HDFS directory, and I cannot read the last file.
I ran hive --orcfiledump {file path}, but I got the same error:
Exception in thread "main" com.google.protobuf.InvalidProtocolBufferException: While parsing a protocol message, the input ended unexpectedly in the middle of a field. This could mean either than the input has been truncated or that an embedded message misreported its own length.
at com.google.protobuf.InvalidProtocolBufferException.truncatedMessage(InvalidProtocolBufferException.java:70)
at com.google.protobuf.CodedInputStream.readRawBytes(CodedInputStream.java:789)
at com.google.protobuf.CodedInputStream.readBytes(CodedInputStream.java:329)
at com.google.protobuf.UnknownFieldSet$Builder.mergeFieldFrom(UnknownFieldSet.java:484)
at com.google.protobuf.GeneratedMessage.parseUnknownField(GeneratedMessage.java:193)
at org.apache.orc.OrcProto$PostScript.<init>(OrcProto.java:18532)
at org.apache.orc.OrcProto$PostScript.<init>(OrcProto.java:18490)
at org.apache.orc.OrcProto$PostScript$1.parsePartialFrom(OrcProto.java:18628)
at org.apache.orc.OrcProto$PostScript$1.parsePartialFrom(OrcProto.java:18623)
at com.google.protobuf.AbstractParser.parseFrom(AbstractParser.java:89)
at com.google.protobuf.AbstractParser.parseFrom(AbstractParser.java:95)
at com.google.protobuf.AbstractParser.parseFrom(AbstractParser.java:49)
at org.apache.orc.OrcProto$PostScript.parseFrom(OrcProto.java:19022)
at org.apache.orc.impl.ReaderImpl.extractPostScript(ReaderImpl.java:437)
at org.apache.orc.impl.ReaderImpl.extractFileTail(ReaderImpl.java:566)
at org.apache.orc.impl.ReaderImpl.<init>(ReaderImpl.java:371)
at org.apache.orc.OrcFile.createReader(OrcFile.java:342)
at org.apache.orc.tools.FileDump.getReader(FileDump.java:241)
at org.apache.orc.tools.FileDump.printMetaDataImpl(FileDump.java:300)
at org.apache.orc.tools.FileDump.printMetaData(FileDump.java:274)
at org.apache.orc.tools.FileDump.main(FileDump.java:135)
at org.apache.orc.tools.FileDump.main(FileDump.java:142)
at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
at java.lang.reflect.Method.invoke(Method.java:498)
at org.apache.hadoop.util.RunJar.run(RunJar.java:318)
at org.apache.hadoop.util.RunJar.main(RunJar.java:232)