Created
September 10, 2021 14:44
-
-
Save nsivabalan/a9d992793be449012109e73fc70b0d74 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
21/09/10 14:34:34 WARN DagScheduler: Executing node "first_delete" :: {"name":"ec2e6f6d-8685-4828-831e-fba844da1ef2","num_partitions_delete":50,"num_records_delete":8000,"config":"first_delete"} | |
21/09/10 14:38:35 ERROR Executor: Exception in task 0.0 in stage 106.0 (TID 2445) | |
java.io.InterruptedIOException: getFileStatus on s3a://siva-test-bucket-june-16/hudi_testing/hudi_metadata1/output/1970/01/15/76112e22-c3b9-4497-9e9b-2c5a449d7477-0_20-21-148_20210910143308.parquet: com.amazonaws.SdkClientException: Unable to execute HTTP request: Timeout waiting for connection from pool | |
at org.apache.hadoop.fs.s3a.S3AUtils.translateInterruptedException(S3AUtils.java:352) | |
at org.apache.hadoop.fs.s3a.S3AUtils.translateException(S3AUtils.java:177) | |
at org.apache.hadoop.fs.s3a.S3AUtils.translateException(S3AUtils.java:151) | |
at org.apache.hadoop.fs.s3a.S3AFileSystem.s3GetFileStatus(S3AFileSystem.java:2201) | |
at org.apache.hadoop.fs.s3a.S3AFileSystem.innerGetFileStatus(S3AFileSystem.java:2163) | |
at org.apache.hadoop.fs.s3a.S3AFileSystem.getFileStatus(S3AFileSystem.java:2102) | |
at org.apache.parquet.hadoop.ParquetReader$Builder.build(ParquetReader.java:300) | |
at org.apache.hudi.io.storage.HoodieParquetReader.getRecordIterator(HoodieParquetReader.java:65) | |
at org.apache.hudi.integ.testsuite.reader.DFSHoodieDatasetInputReader.readColumnarOrLogFiles(DFSHoodieDatasetInputReader.java:269) | |
at org.apache.hudi.integ.testsuite.reader.DFSHoodieDatasetInputReader.lambda$generateUpdates$c53fa10$1(DFSHoodieDatasetInputReader.java:215) | |
at org.apache.spark.api.java.JavaPairRDD$.$anonfun$toScalaFunction$1(JavaPairRDD.scala:1041) | |
at scala.collection.Iterator$$anon$10.next(Iterator.scala:459) | |
at scala.collection.Iterator$$anon$11.nextCur(Iterator.scala:484) | |
at scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:490) | |
at scala.collection.Iterator$$anon$10.hasNext(Iterator.scala:458) | |
at scala.collection.Iterator$$anon$10.hasNext(Iterator.scala:458) | |
at scala.collection.Iterator$$anon$10.hasNext(Iterator.scala:458) | |
at org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:155) | |
at org.apache.spark.shuffle.ShuffleWriteProcessor.write(ShuffleWriteProcessor.scala:59) | |
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:99) | |
at org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:52) | |
at org.apache.spark.scheduler.Task.run(Task.scala:127) | |
at org.apache.spark.executor.Executor$TaskRunner.$anonfun$run$3(Executor.scala:446) | |
at org.apache.spark.util.Utils$.tryWithSafeFinally(Utils.scala:1377) | |
at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:449) | |
at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) | |
at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) | |
at java.lang.Thread.run(Thread.java:748) | |
Caused by: com.amazonaws.SdkClientException: Unable to execute HTTP request: Timeout waiting for connection from pool | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.handleRetryableException(AmazonHttpClient.java:1116) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.executeHelper(AmazonHttpClient.java:1066) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.doExecute(AmazonHttpClient.java:743) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.executeWithTimer(AmazonHttpClient.java:717) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.execute(AmazonHttpClient.java:699) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.access$500(AmazonHttpClient.java:667) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutionBuilderImpl.execute(AmazonHttpClient.java:649) | |
at com.amazonaws.http.AmazonHttpClient.execute(AmazonHttpClient.java:513) | |
at com.amazonaws.services.s3.AmazonS3Client.invoke(AmazonS3Client.java:4368) | |
at com.amazonaws.services.s3.AmazonS3Client.invoke(AmazonS3Client.java:4315) | |
at com.amazonaws.services.s3.AmazonS3Client.getObjectMetadata(AmazonS3Client.java:1271) | |
at org.apache.hadoop.fs.s3a.S3AFileSystem.lambda$getObjectMetadata$4(S3AFileSystem.java:1249) | |
at org.apache.hadoop.fs.s3a.Invoker.retryUntranslated(Invoker.java:322) | |
at org.apache.hadoop.fs.s3a.Invoker.retryUntranslated(Invoker.java:285) | |
at org.apache.hadoop.fs.s3a.S3AFileSystem.getObjectMetadata(S3AFileSystem.java:1246) | |
at org.apache.hadoop.fs.s3a.S3AFileSystem.s3GetFileStatus(S3AFileSystem.java:2183) | |
... 24 more | |
Caused by: com.amazonaws.thirdparty.apache.http.conn.ConnectionPoolTimeoutException: Timeout waiting for connection from pool | |
at com.amazonaws.thirdparty.apache.http.impl.conn.PoolingHttpClientConnectionManager.leaseConnection(PoolingHttpClientConnectionManager.java:313) | |
at com.amazonaws.thirdparty.apache.http.impl.conn.PoolingHttpClientConnectionManager$1.get(PoolingHttpClientConnectionManager.java:279) | |
at sun.reflect.GeneratedMethodAccessor13.invoke(Unknown Source) | |
at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) | |
at java.lang.reflect.Method.invoke(Method.java:498) | |
at com.amazonaws.http.conn.ClientConnectionRequestFactory$Handler.invoke(ClientConnectionRequestFactory.java:70) | |
at com.amazonaws.http.conn.$Proxy17.get(Unknown Source) | |
at com.amazonaws.thirdparty.apache.http.impl.execchain.MainClientExec.execute(MainClientExec.java:191) | |
at com.amazonaws.thirdparty.apache.http.impl.execchain.ProtocolExec.execute(ProtocolExec.java:185) | |
at com.amazonaws.thirdparty.apache.http.impl.client.InternalHttpClient.doExecute(InternalHttpClient.java:185) | |
at com.amazonaws.thirdparty.apache.http.impl.client.CloseableHttpClient.execute(CloseableHttpClient.java:83) | |
at com.amazonaws.thirdparty.apache.http.impl.client.CloseableHttpClient.execute(CloseableHttpClient.java:56) | |
at com.amazonaws.http.apache.client.impl.SdkHttpClient.execute(SdkHttpClient.java:72) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.executeOneRequest(AmazonHttpClient.java:1238) | |
at com.amazonaws.http.AmazonHttpClient$RequestExecutor.executeHelper(AmazonHttpClient.java:1058) | |
... 38 more | |
21/09/10 14:38:35 WARN TaskSetManager: Lost task 0.0 in stage 106.0 (TID 2445, ip-172-31-41-108.us-east-2.compute.internal, executor driver): java.io.InterruptedIOException: getFileStatus on s3a://siva-test-bucket-june-16/hudi_testing/hudi_metadata1/output/1970/01/15/76112e22-c3b9-4497-9e9b-2c5a449d7477-0_20-21-148_20210910143308.parquet: com.amazonaws.SdkClientException: Unable to execute HTTP request: Timeout waiting for connection from pool |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment