From 8cc4a6734339f4fecdaab5165167c933122d2e79 Mon Sep 17 00:00:00 2001 From: roryqi Date: Thu, 13 Apr 2023 10:19:36 +0800 Subject: [PATCH] Revert "[#772] fix(kerberos): cache proxy user ugi to avoid memory leak (#773)" This reverts commit 89c2b922379d06029378650a33346b4e97cfbb02. --- .../security/HadoopSecurityContext.java | 24 +------------------ .../security/HadoopSecurityContextTest.java | 18 -------------- 2 files changed, 1 insertion(+), 41 deletions(-) diff --git a/common/src/main/java/org/apache/uniffle/common/security/HadoopSecurityContext.java b/common/src/main/java/org/apache/uniffle/common/security/HadoopSecurityContext.java index 1d8349f9cb..49083d365c 100644 --- a/common/src/main/java/org/apache/uniffle/common/security/HadoopSecurityContext.java +++ b/common/src/main/java/org/apache/uniffle/common/security/HadoopSecurityContext.java @@ -19,20 +19,17 @@ import java.io.IOException; import java.security.PrivilegedExceptionAction; -import java.util.Map; import java.util.concurrent.Callable; import java.util.concurrent.Executors; import java.util.concurrent.ScheduledExecutorService; import java.util.concurrent.TimeUnit; -import com.google.common.annotations.VisibleForTesting; import org.apache.commons.lang3.StringUtils; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.security.UserGroupInformation; import org.slf4j.Logger; import org.slf4j.LoggerFactory; -import org.apache.uniffle.common.util.JavaUtils; import org.apache.uniffle.common.util.ThreadUtils; public class HadoopSecurityContext implements SecurityContext { @@ -42,12 +39,6 @@ public class HadoopSecurityContext implements SecurityContext { private UserGroupInformation loginUgi; private ScheduledExecutorService refreshScheduledExecutor; - // The purpose of the proxy user ugi cache is to prevent the creation of - // multiple cache keys for the same user, scheme, and authority in the Hadoop filesystem. - // Without this cache, large amounts of unnecessary filesystem instances could be stored in memory, - // leading to potential memory leaks. For more information on this issue, refer to #706. - private Map proxyUserUgiPool; - public HadoopSecurityContext( String krb5ConfPath, String keytabFile, @@ -85,7 +76,6 @@ public HadoopSecurityContext( refreshIntervalSec, refreshIntervalSec, TimeUnit.SECONDS); - proxyUserUgiPool = JavaUtils.newConcurrentMap(); } private void authRefresh() { @@ -105,10 +95,8 @@ public T runSecured(String user, Callable securedCallable) throws Excepti // Run with the proxy user. if (!user.equals(loginUgi.getShortUserName())) { - UserGroupInformation proxyUserUgi = - proxyUserUgiPool.computeIfAbsent(user, x -> UserGroupInformation.createProxyUser(x, loginUgi)); return executeWithUgiWrapper( - proxyUserUgi, + UserGroupInformation.createProxyUser(user, loginUgi), securedCallable ); } @@ -126,20 +114,10 @@ private T executeWithUgiWrapper(UserGroupInformation ugi, Callable callab return ugi.doAs((PrivilegedExceptionAction) callable::call); } - // Only for tests - @VisibleForTesting - Map getProxyUserUgiPool() { - return proxyUserUgiPool; - } - @Override public void close() throws IOException { if (refreshScheduledExecutor != null) { refreshScheduledExecutor.shutdown(); } - if (proxyUserUgiPool != null) { - proxyUserUgiPool.clear(); - proxyUserUgiPool = null; - } } } diff --git a/common/src/test/java/org/apache/uniffle/common/security/HadoopSecurityContextTest.java b/common/src/test/java/org/apache/uniffle/common/security/HadoopSecurityContextTest.java index 38a34db1f6..53ad36b231 100644 --- a/common/src/test/java/org/apache/uniffle/common/security/HadoopSecurityContextTest.java +++ b/common/src/test/java/org/apache/uniffle/common/security/HadoopSecurityContextTest.java @@ -18,13 +18,10 @@ package org.apache.uniffle.common.security; import java.util.concurrent.Callable; -import java.util.concurrent.atomic.AtomicReference; import org.apache.commons.lang3.StringUtils; import org.apache.hadoop.fs.FileStatus; -import org.apache.hadoop.fs.FileSystem; import org.apache.hadoop.fs.Path; -import org.apache.hadoop.security.UserGroupInformation; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; @@ -69,28 +66,13 @@ public void testSecuredCallable() throws Exception { // case3: run by the proxy user Path pathWithAlexUser = new Path("/alex/HadoopSecurityContextTest"); - AtomicReference ugi1 = new AtomicReference<>(); context.runSecured("alex", (Callable) () -> { - ugi1.set(UserGroupInformation.getCurrentUser()); kerberizedHdfs.getFileSystem().mkdirs(pathWithAlexUser); return null; }); fileStatus = kerberizedHdfs.getFileSystem().getFileStatus(pathWithAlexUser); assertEquals("alex", fileStatus.getOwner()); - // case4: run by the proxy user again, it will always return the same - // ugi and filesystem instance. - AtomicReference ugi2 = new AtomicReference<>(); - context.runSecured("alex", (Callable) () -> { - ugi2.set(UserGroupInformation.getCurrentUser()); - return null; - }); - assertTrue(ugi1.get() == ugi2.get()); - assertTrue(ugi1.get() == context.getProxyUserUgiPool().get("alex")); - - FileSystem fileSystem1 = context.runSecured("alex", () -> FileSystem.get(kerberizedHdfs.getConf())); - FileSystem fileSystem2 = context.runSecured("alex", () -> FileSystem.get(kerberizedHdfs.getConf())); - assertTrue(fileSystem1 == fileSystem2); } }