Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
36 commits
Select commit Hold shift + click to select a range
b141f2b
FLINK-38350: Upgrading Hadoop to 3.4.2
pra91 Sep 12, 2025
8782768
FLINK-38350: Upgrading Hadoop to 3.4.2
pra91 Sep 12, 2025
471f2af
FLINK-38350: Enhance HadoopS3AccessHelper with proper exception handl…
Sep 16, 2025
6bdefc7
Enhance HadoopS3AccessHelper with comprehensive property copying from…
Sep 17, 2025
e0ea4ed
Fix S3 upload callback issue with Hadoop 3.4.2
Sep 17, 2025
837c00b
Implement S3 callbacks without reflection for Hadoop 3.4.2
Sep 17, 2025
8931338
Fix S3 multipart upload NoSuchUploadException with client consistency
Sep 17, 2025
6b82c21
Fix S5cmd integration test and checkpoint race condition
Sep 17, 2025
ef3c988
feat: Comprehensive S3 client improvements for Hadoop 3.4.2 compatibi…
Sep 18, 2025
0a649c6
fix: Apply Spotless formatting fix for release branch
Sep 18, 2025
4b224b3
feat: Modernize S3 Hadoop filesystem architecture with comprehensive …
Sep 18, 2025
c2a5d9d
refactor: Simplify S3 client architecture to single cached client
Sep 18, 2025
4be0668
fix: Restore accidentally deleted HadoopS3FileSystemTest.java
Sep 18, 2025
0cf2405
fix: Add Java 8 compatibility for release-1.20 branch
Sep 18, 2025
3e99ac9
fix: Improve NoSuchUploadException handling in S3 multipart uploads
Sep 18, 2025
868628e
fix: Correct SSL configuration in S3ConfigurationBuilder
Sep 18, 2025
fec58fd
refactor: Simplify S3 architecture by removing complex components
Sep 18, 2025
f90e504
CRITICAL FIX: Eliminate S3 client resource leaks causing E2E test ins…
Sep 18, 2025
b9fd874
Fix unit test on release branch: Update test expectations after remov…
Sep 18, 2025
067c1ad
Fix S3 client null config issue with lazy initialization
Sep 19, 2025
8bc379c
CRITICAL FIX: Implement shared S3 client with reference counting to p…
Sep 19, 2025
1d9c46c
Fix E2E test SSL/networking issues by removing custom HTTP client con…
Sep 19, 2025
4dd6186
Upgrade Hadoop to 3.4.2 and resolve Netty conflicts
Sep 22, 2025
a30d78c
Fix S3 endpoint backward compatibility for Hadoop 3.4.2 upgrade
Sep 23, 2025
7c6f944
Add Hadoop credential provider compatibility for S3 client
Sep 23, 2025
cae7bac
Add Hadoop internal S3 client reflection approach for credential comp…
Oct 3, 2025
3e9c88e
Eliminate custom S3 client - use only Hadoop's S3A client for all ope…
Oct 8, 2025
8a1e657
Downgrade Hadoop from 3.4.2 to 3.3.6 due to requester-pays regression
Oct 15, 2025
943fae6
Add explicit requester-pays configuration mapping
Oct 15, 2025
d4eb43a
Add debug logging for requester-pays configuration
Oct 15, 2025
17fee69
Fix LOG import and checkstyle violations
Oct 15, 2025
a4072e5
Enhanced requester-pays debugging and configuration
Oct 15, 2025
160b95d
Add ERROR-level logging for debugging requester-pays issue
Oct 15, 2025
856f0eb
Remove debug logging - clean production version
Oct 15, 2025
7aafbda
Add requester-pays
Oct 15, 2025
ec1c3c2
Add conditional write logging to HadoopS3AccessHelper
Oct 21, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
56 changes: 56 additions & 0 deletions deploy-test-jar.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
#!/bin/bash
#
# Deploy Hadoop 3.4.2 Test JAR to Local Repository
#
# Installs the locally built flink-s3-fs-hadoop JAR into the local Maven
# repository under a custom artifact ID and version, to avoid conflicts with
# official releases.
#
# Usage: ./deploy-test-jar.sh
#   Takes no arguments. JAR_FILE is a relative path, so the script must be
#   run from the directory that contains flink-filesystems/.
#
# Exit status: 0 on success, 1 if the JAR or the mvn executable is missing,
# otherwise the failing command's status (set -e).

set -euo pipefail

echo "🚀 Deploying Flink S3 Hadoop 3.4.2 Test JAR..."

# Configuration
readonly JAR_FILE="flink-filesystems/flink-s3-fs-hadoop/target/flink-s3-fs-hadoop-1.20-SNAPSHOT.jar"
readonly GROUP_ID="org.apache.flink"
readonly ARTIFACT_ID="flink-s3-fs-hadoop-3.4.2-test"
readonly VERSION="1.20-SNAPSHOT-hadoop-3.4.2-test"

# Directory the artifact lands in, assuming the default ~/.m2 local repository.
# Derived from the coordinates above (dots in the group ID become path
# separators) so the hint printed at the end cannot drift from what was
# actually installed. Falls back to a literal "~" if HOME is unset.
readonly LOCAL_REPO_DIR="${HOME:-~}/.m2/repository/${GROUP_ID//.//}/${ARTIFACT_ID}/${VERSION}/"

# Check if JAR exists; diagnostics go to stderr so they are not lost when
# stdout is redirected.
if [[ ! -f "$JAR_FILE" ]]; then
  echo "❌ Error: JAR file not found at $JAR_FILE" >&2
  echo "Please run the build first: ./mvnw clean package -pl flink-filesystems/flink-s3-fs-hadoop -DskipTests" >&2
  exit 1
fi

# Fail with a clear message instead of a bare "command not found".
if ! command -v mvn >/dev/null 2>&1; then
  echo "❌ Error: mvn executable not found on PATH" >&2
  exit 1
fi

echo "📦 JAR file: $JAR_FILE"
echo "🏷️ Group ID: $GROUP_ID"
echo "🏷️ Artifact ID: $ARTIFACT_ID"
echo "🏷️ Version: $VERSION"

# Deploy to local repository
echo "📤 Deploying to local Maven repository..."
mvn install:install-file \
  -Dfile="$JAR_FILE" \
  -DgroupId="$GROUP_ID" \
  -DartifactId="$ARTIFACT_ID" \
  -Dversion="$VERSION" \
  -Dpackaging=jar \
  -DgeneratePom=true

# Only reached when mvn succeeded (set -e aborts otherwise).
cat <<EOF
✅ Successfully deployed!

📋 To use this JAR in your project, add this dependency:

<dependency>
 <groupId>$GROUP_ID</groupId>
 <artifactId>$ARTIFACT_ID</artifactId>
 <version>$VERSION</version>
</dependency>

🔍 JAR location in local repository:
$LOCAL_REPO_DIR

🎯 This JAR includes:
 ✅ Hadoop 3.4.2 upgrade (from 3.3.6)
 ✅ Netty conflict resolution
 ✅ S3 endpoint backward compatibility
 ✅ IAM credential provider compatibility
 ✅ Hadoop internal S3 client reflection approach
EOF
10 changes: 10 additions & 0 deletions flink-filesystems/flink-s3-fs-base/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -183,6 +183,11 @@ under the License.
<groupId>org.slf4j</groupId>
<artifactId>slf4j-reload4j</artifactId>
</exclusion>
<!-- Exclude unshaded Netty to prevent conflicts with flink-shaded-netty -->
<exclusion>
<groupId>io.netty</groupId>
<artifactId>*</artifactId>
</exclusion>
</exclusions>
</dependency>

Expand Down Expand Up @@ -238,6 +243,11 @@ under the License.
<groupId>org.slf4j</groupId>
<artifactId>slf4j-reload4j</artifactId>
</exclusion>
<!-- Exclude unshaded Netty to prevent conflicts with flink-shaded-netty -->
<exclusion>
<groupId>io.netty</groupId>
<artifactId>*</artifactId>
</exclusion>
</exclusions>
</dependency>

Expand Down
10 changes: 10 additions & 0 deletions flink-filesystems/flink-s3-fs-hadoop/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,11 @@ under the License.

<packaging>jar</packaging>

<properties>
<!-- S5CmdOnHadoopS3FileSystemITCase uses ArraysAsListSerializer indirectly.
The value below opens the java.base/java.util package to all unnamed modules.
NOTE(review): presumably surefire.module.config is passed to the surefire test JVM
by the parent POM; that wiring is not visible in this hunk, so confirm. -->
<surefire.module.config>--add-opens=java.base/java.util=ALL-UNNAMED</surefire.module.config>
</properties>

<dependencyManagement>
<dependencies>
<!-- Override the flink-parent dependencyManagement definition for hadoop-common to ensure
Expand All @@ -48,6 +53,11 @@ under the License.
<groupId>org.slf4j</groupId>
<artifactId>slf4j-reload4j</artifactId>
</exclusion>
<!-- Exclude unshaded Netty to prevent conflicts with flink-shaded-netty -->
<exclusion>
<groupId>io.netty</groupId>
<artifactId>*</artifactId>
</exclusion>
</exclusions>
</dependency>

Expand Down
Loading