CLOUDSTACK-9564: Fix memory leaks in VmwareContextPool

In a recent management server crash, the largest contributor to the memory
leak was found to be VmwareContextPool, which holds a registry (an ArrayList)
that grows indefinitely. The list itself is not used or consumed anywhere.
A hashmap (the pool) that returns a list of contexts for an existing poolkey
(address/username) already exists and is used instead.

This fixes the issue by removing the arraylist registry, and limiting the
length of the context list for a given poolkey.

Signed-off-by: Rohit Yadav <rohit.yadav@shapeblue.com>
This commit is contained in:
Rohit Yadav 2016-10-25 15:20:33 +05:30
parent 5d7288b858
commit 90a3d97c5e
7 changed files with 209 additions and 95 deletions

View File

@ -77,7 +77,6 @@ public class VmwareContextFactory {
context.registerStockObject("noderuninfo", String.format("%d-%d", s_clusterMgr.getManagementNodeId(), s_clusterMgr.getCurrentRunId()));
context.setPoolInfo(s_pool, VmwareContextPool.composePoolKey(vCenterAddress, vCenterUserName));
s_pool.registerOutstandingContext(context);
return context;
}

View File

@ -5481,7 +5481,7 @@ public class VmwareResource implements StoragePoolResource, ServerResource, Vmwa
if (s_logger.isTraceEnabled()) {
s_logger.trace("Recycling threadlocal context to pool");
}
context.getPool().returnContext(context);
context.getPool().registerContext(context);
}
}

View File

@ -49,7 +49,6 @@ public class VmwareSecondaryStorageContextFactory {
assert (context != null);
context.setPoolInfo(s_pool, VmwareContextPool.composePoolKey(vCenterAddress, vCenterUserName));
s_pool.registerOutstandingContext(context);
return context;
}

View File

@ -236,7 +236,7 @@ public class VmwareSecondaryStorageResourceHandler implements SecondaryStorageRe
VmwareContext context = currentContext.get();
currentContext.set(null);
assert (context.getPool() != null);
context.getPool().returnContext(context);
context.getPool().registerContext(context);
}
}

View File

@ -666,7 +666,7 @@ public class VmwareContext {
s_logger.warn("Unexpected exception: ", e);
} finally {
if (_pool != null) {
_pool.unregisterOutstandingContext(this);
_pool.unregisterContext(this);
}
unregisterOutstandingContext();
}

View File

@ -16,28 +16,30 @@
// under the License.
package com.cloud.hypervisor.vmware.util;
import com.google.common.base.Strings;
import org.apache.cloudstack.managed.context.ManagedContextTimerTask;
import org.apache.log4j.Logger;
import org.joda.time.Duration;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Queue;
import java.util.Timer;
import java.util.TimerTask;
import org.apache.log4j.Logger;
import org.apache.cloudstack.managed.context.ManagedContextTimerTask;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentLinkedQueue;
import java.util.concurrent.ConcurrentMap;
public class VmwareContextPool {
private static final Logger s_logger = Logger.getLogger(VmwareContextPool.class);
private static final long DEFAULT_CHECK_INTERVAL = 10000;
private static final Duration DEFAULT_CHECK_INTERVAL = Duration.millis(10000L);
private static final int DEFAULT_IDLE_QUEUE_LENGTH = 128;
private List<VmwareContext> _outstandingRegistry = new ArrayList<VmwareContext>();
private Map<String, List<VmwareContext>> _pool;
private final ConcurrentMap<String, Queue<VmwareContext>> _pool;
private int _maxIdleQueueLength = DEFAULT_IDLE_QUEUE_LENGTH;
private long _idleCheckIntervalMs = DEFAULT_CHECK_INTERVAL;
private Duration _idleCheckInterval = DEFAULT_CHECK_INTERVAL;
private Timer _timer = new Timer();
@ -45,76 +47,77 @@ public class VmwareContextPool {
this(DEFAULT_IDLE_QUEUE_LENGTH, DEFAULT_CHECK_INTERVAL);
}
public VmwareContextPool(int maxIdleQueueLength) {
this(maxIdleQueueLength, DEFAULT_CHECK_INTERVAL);
}
public VmwareContextPool(int maxIdleQueueLength, long idleCheckIntervalMs) {
_pool = new HashMap<String, List<VmwareContext>>();
public VmwareContextPool(int maxIdleQueueLength, Duration idleCheckInterval) {
_pool = new ConcurrentHashMap<String, Queue<VmwareContext>>();
_maxIdleQueueLength = maxIdleQueueLength;
_idleCheckIntervalMs = idleCheckIntervalMs;
_idleCheckInterval = idleCheckInterval;
_timer.scheduleAtFixedRate(getTimerTask(), _idleCheckIntervalMs, _idleCheckIntervalMs);
_timer.scheduleAtFixedRate(getTimerTask(), _idleCheckInterval.getMillis(), _idleCheckInterval.getMillis());
}
public void registerOutstandingContext(VmwareContext context) {
assert (context != null);
synchronized (this) {
_outstandingRegistry.add(context);
public VmwareContext getContext(final String vCenterAddress, final String vCenterUserName) {
final String poolKey = composePoolKey(vCenterAddress, vCenterUserName).intern();
if (Strings.isNullOrEmpty(poolKey)) {
return null;
}
}
public void unregisterOutstandingContext(VmwareContext context) {
assert (context != null);
synchronized (this) {
_outstandingRegistry.remove(context);
}
}
public VmwareContext getContext(String vCenterAddress, String vCenterUserName) {
String poolKey = composePoolKey(vCenterAddress, vCenterUserName);
synchronized (this) {
List<VmwareContext> l = _pool.get(poolKey);
if (l == null)
return null;
if (l.size() > 0) {
VmwareContext context = l.remove(0);
context.setPoolInfo(this, poolKey);
if (s_logger.isTraceEnabled())
s_logger.trace("Return a VmwareContext from the idle pool: " + poolKey + ". current pool size: " + l.size() + ", outstanding count: " +
VmwareContext.getOutstandingContextCount());
synchronized (poolKey) {
final Queue<VmwareContext> ctxList = _pool.get(poolKey);
if (ctxList != null && !ctxList.isEmpty()) {
final VmwareContext context = ctxList.remove();
if (context != null) {
context.setPoolInfo(this, poolKey);
}
if (s_logger.isTraceEnabled()) {
s_logger.trace("Return a VmwareContext from the idle pool: " + poolKey + ". current pool size: " + ctxList.size() + ", outstanding count: " +
VmwareContext.getOutstandingContextCount());
}
return context;
}
// TODO, we need to control the maximum number of outstanding VmwareContext object in the future
return null;
}
}
public void returnContext(VmwareContext context) {
public void registerContext(final VmwareContext context) {
assert (context.getPool() == this);
assert (context.getPoolKey() != null);
synchronized (this) {
List<VmwareContext> l = _pool.get(context.getPoolKey());
if (l == null) {
l = new ArrayList<VmwareContext>();
_pool.put(context.getPoolKey(), l);
final String poolKey = context.getPoolKey().intern();
synchronized (poolKey) {
Queue<VmwareContext> ctxQueue = _pool.get(poolKey);
if (ctxQueue == null) {
ctxQueue = new ConcurrentLinkedQueue<>();
_pool.put(poolKey, ctxQueue);
}
if (l.size() < _maxIdleQueueLength) {
context.clearStockObjects();
l.add(context);
if (ctxQueue.size() >= _maxIdleQueueLength) {
final VmwareContext oldestContext = ctxQueue.remove();
if (oldestContext != null) {
try {
oldestContext.close();
} catch (Throwable t) {
s_logger.error("Unexpected exception caught while trying to purge oldest VmwareContext", t);
}
}
}
context.clearStockObjects();
ctxQueue.add(context);
if (s_logger.isTraceEnabled())
s_logger.trace("Recycle VmwareContext into idle pool: " + context.getPoolKey() + ", current idle pool size: " + l.size() + ", outstanding count: " +
VmwareContext.getOutstandingContextCount());
} else {
if (s_logger.isTraceEnabled())
s_logger.trace("VmwareContextPool queue exceeds limits, queue size: " + l.size());
context.close();
if (s_logger.isTraceEnabled()) {
s_logger.trace("Recycle VmwareContext into idle pool: " + context.getPoolKey() + ", current idle pool size: " + ctxQueue.size() + ", outstanding count: "
+ VmwareContext.getOutstandingContextCount());
}
}
}
public void unregisterContext(final VmwareContext context) {
assert (context != null);
final String poolKey = context.getPoolKey().intern();
final Queue<VmwareContext> ctxList = _pool.get(poolKey);
synchronized (poolKey) {
if (!Strings.isNullOrEmpty(poolKey) && ctxList != null && ctxList.contains(context)) {
ctxList.remove(context);
}
}
}
@ -124,8 +127,6 @@ public class VmwareContextPool {
@Override
protected void runInContext() {
try {
// doIdleCheck();
doKeepAlive();
} catch (Throwable e) {
s_logger.error("Unexpected exception", e);
@ -134,35 +135,30 @@ public class VmwareContextPool {
};
}
private void getKeepAliveCheckContexts(List<VmwareContext> l, int batchSize) {
synchronized (this) {
int size = Math.min(_outstandingRegistry.size(), batchSize);
while (size > 0) {
VmwareContext context = _outstandingRegistry.remove(0);
l.add(context);
_outstandingRegistry.add(context);
size--;
}
}
}
private void doKeepAlive() {
List<VmwareContext> l = new ArrayList<VmwareContext>();
int batchSize = (int)(_idleCheckIntervalMs / 1000); // calculate batch size at 1 request/sec rate
getKeepAliveCheckContexts(l, batchSize);
for (VmwareContext context : l) {
try {
context.idleCheck();
} catch (Throwable e) {
s_logger.warn("Exception caught during VmwareContext idle check, close and discard the context", e);
context.close();
final List<VmwareContext> closableCtxList = new ArrayList<>();
for (final Queue<VmwareContext> ctxQueue : _pool.values()) {
for (Iterator<VmwareContext> iterator = ctxQueue.iterator(); iterator.hasNext();) {
final VmwareContext context = iterator.next();
if (context == null) {
iterator.remove();
continue;
}
try {
context.idleCheck();
} catch (Throwable e) {
s_logger.warn("Exception caught during VmwareContext idle check, close and discard the context", e);
closableCtxList.add(context);
iterator.remove();
}
}
}
for (final VmwareContext context : closableCtxList) {
context.close();
}
}
public static String composePoolKey(String vCenterAddress, String vCenterUserName) {
public static String composePoolKey(final String vCenterAddress, final String vCenterUserName) {
assert (vCenterUserName != null);
assert (vCenterAddress != null);
return vCenterUserName + "@" + vCenterAddress;

View File

@ -0,0 +1,120 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package com.cloud.hypervisor.vmware.util;
import com.cloud.utils.concurrency.NamedThreadFactory;
import org.joda.time.Duration;
import org.junit.Assert;
import org.junit.Before;
import org.junit.Test;
import org.mockito.Mockito;
import java.util.ArrayList;
import java.util.List;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
/**
 * Unit tests for {@link VmwareContextPool}: registering and unregistering
 * contexts, pool-key composition, and concurrent registration from many
 * client threads.
 */
public class VmwareContextPoolTest {

    /**
     * Worker that keeps registering freshly created dummy contexts with the
     * pool until {@link #stop()} is called.
     */
    private class PoolClient implements Runnable {
        private final VmwareContextPool pool;
        // Written by the test thread, read by the worker thread.
        private volatile boolean canRun = true;
        // Written only by the worker thread, read by the test thread;
        // volatile gives the reader visibility (there is a single writer).
        private volatile int counter = 0;

        public PoolClient(final VmwareContextPool pool) {
            this.pool = pool;
        }

        /** Returns how many contexts this client has registered so far. */
        public int count() {
            return counter;
        }

        /** Asks the worker loop to exit after its current iteration. */
        public void stop() {
            canRun = false;
        }

        @Override
        public void run() {
            final String poolKey = VmwareContextPool.composePoolKey(vmwareAddress, vmwareUsername);
            while (canRun) {
                pool.registerContext(createDummyContext(pool, poolKey));
                counter++;
            }
        }
    }

    private VmwareContextPool vmwareContextPool;
    private VmwareContext vmwareContext;
    private String vmwareAddress = "address";
    private String vmwareUsername = "username";
    private int contextLength = 10;
    private Duration idleCheckInterval = Duration.millis(1000L);

    /**
     * Builds a context around a client for "someAddress" and attaches it to
     * the given pool under the given pool key.
     *
     * @param pool    pool the context is associated with
     * @param poolKey key under which the context is pooled
     * @return the newly created context
     */
    public VmwareContext createDummyContext(final VmwareContextPool pool, final String poolKey) {
        VmwareClient vimClient = new VmwareClient("someAddress");
        VmwareContext context = new VmwareContext(vimClient, "someAddress");
        context.setPoolInfo(pool, poolKey);
        return context;
    }

    @Before
    public void setUp() throws Exception {
        // composePoolKey is static: call it on the class rather than through
        // the (not yet assigned) pool field.
        final String poolKey = VmwareContextPool.composePoolKey(vmwareAddress, vmwareUsername);
        vmwareContextPool = new VmwareContextPool(contextLength, idleCheckInterval);
        vmwareContext = createDummyContext(vmwareContextPool, poolKey);
    }

    @Test
    public void testRegisterContext() throws Exception {
        vmwareContextPool.registerContext(vmwareContext);
        Assert.assertEquals(vmwareContext, vmwareContextPool.getContext(vmwareAddress, vmwareUsername));
    }

    @Test
    public void testUnregisterContext() throws Exception {
        vmwareContextPool.unregisterContext(vmwareContext);
        Assert.assertNull(vmwareContextPool.getContext(vmwareAddress, vmwareUsername));
    }

    @Test
    public void testComposePoolKey() throws Exception {
        Assert.assertEquals(vmwareUsername + "@" + vmwareAddress,
                VmwareContextPool.composePoolKey(vmwareAddress, vmwareUsername));
    }

    @Test
    public void testMultithreadedPoolClients() throws Exception {
        vmwareContextPool = Mockito.spy(vmwareContextPool);
        final ExecutorService executor = Executors.newFixedThreadPool(10, new NamedThreadFactory("VmwareContextPoolClients"));
        final List<PoolClient> clients = new ArrayList<>();
        for (int i = 0; i < 50; i++) {
            final PoolClient client = new PoolClient(vmwareContextPool);
            clients.add(client);
            executor.submit(client);
        }
        Thread.sleep(1000);

        // Stop every client first, then wait for the workers to finish so the
        // counters are final before they are summed and verified.
        for (final PoolClient client : clients) {
            client.stop();
        }
        executor.shutdown();
        Assert.assertTrue("Pool clients did not terminate in time",
                executor.awaitTermination(10, java.util.concurrent.TimeUnit.SECONDS));

        int totalRegistrations = 0;
        for (final PoolClient client : clients) {
            totalRegistrations += client.count();
        }
        Mockito.verify(vmwareContextPool, Mockito.atLeast(totalRegistrations)).registerContext(Mockito.any(VmwareContext.class));

        final VmwareContext pooledContext = vmwareContextPool.getContext(vmwareAddress, vmwareUsername);
        Assert.assertNotNull(pooledContext);
        Assert.assertEquals(VmwareContextPool.composePoolKey(vmwareAddress, vmwareUsername),
                pooledContext.getPoolKey());
    }
}