Description
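I'm not sure which class in the stack trace below is responsible for attempting to seek past the end of the file. The failing call chain begins with a skip() call made from RandomSampleLoader.getNext and ends in DFSClient$DFSInputStream.seek, which throws "Cannot seek after EOF".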
2007-07-16 20:31:40,598 INFO org.apache.hadoop.mapred.TaskInProgress: Error from task_200707162028_0014_m_000000_0: java.io.IOException: Cannot seek after EOF
at org.apache.hadoop.dfs.DFSClient$DFSInputStream.seek(DFSClient.java:1040)
at org.apache.hadoop.fs.FSDataInputStream.seek(FSDataInputStream.java:37)
at org.apache.hadoop.fs.ChecksumFileSystem$ChecksumFSInputChecker.readChunk(ChecksumFileSystem.java:188)
at org.apache.hadoop.fs.FSInputChecker.readChecksumChunk(FSInputChecker.java:234)
at org.apache.hadoop.fs.FSInputChecker.fill(FSInputChecker.java:176)
at org.apache.hadoop.fs.FSInputChecker.read1(FSInputChecker.java:193)
at org.apache.hadoop.fs.FSInputChecker.read(FSInputChecker.java:157)
at org.apache.hadoop.fs.FSInputChecker.readFully(FSInputChecker.java:353)
at org.apache.hadoop.fs.FSInputChecker.seek(FSInputChecker.java:331)
at org.apache.hadoop.fs.FSInputChecker.skip(FSInputChecker.java:306)
at java.io.FilterInputStream.skip(FilterInputStream.java:125)
at java.io.FilterInputStream.skip(FilterInputStream.java:125)
at com.yahoo.pig.impl.io.InputStreamPosition.skip(InputStreamPosition.java:55)
at java.io.BufferedInputStream.skip(BufferedInputStream.java:349)
at java.io.FilterInputStream.skip(FilterInputStream.java:125)
at com.yahoo.pig.impl.builtin.RandomSampleLoader.getNext(RandomSampleLoader.java:34)
at com.yahoo.pig.impl.mapreduceExec.PigInputFormat$PigRecordReader.next(PigInputFormat.java:169)
at org.apache.hadoop.mapred.MapTask$1.next(MapTask.java:171)
at com.yahoo.pig.impl.mapreduceExec.PigMapReduce.run(PigMapReduce.java:98)
at org.apache.hadoop.mapred.MapTask.run(MapTask.java:189)
at org.apache.hadoop.mapred.TaskTracker$Child.main(TaskTracker.java:1771)