dschneider-pivotal commented on code in PR #7751:
URL: https://github.com/apache/geode/pull/7751#discussion_r890412818
##########
geode-core/src/main/java/org/apache/geode/internal/monitoring/ThreadsMonitoringProcess.java:
##########
@@ -119,29 +119,69 @@ private int
checkForStuckThreads(Collection<AbstractExecutor> executors, long cu
return result;
}
+ /**
+ * If set to true, then the JVM will be asked for what locks a thread holds.
+ * This is extra expensive to ask for on some JVMs, so be careful setting this to true.
+ */
+ private static final boolean SHOW_LOCKS =
Boolean.getBoolean("gemfire.threadmonitor.showLocks");
+ /**
+ * If set to true, then the JVM will be asked for all potential stuck threads with one call.
+ * Since getThreadInfo on many JVMs stops ALL threads from running, and since getting info
+ * on multiple threads with one call is additional work, setting this can cause an extra long
+ * stop-the-world pause that can then cause other problems (like a forced disconnect).
+ * So be careful setting this to true.
+ */
+ private static final boolean BATCH_CALLS =
Boolean.getBoolean("gemfire.threadmonitor.batchCalls");
+
+ private static Map<Long, ThreadInfo> createThreadInfoMap(Set<Long>
stuckThreadIds) {
+ return createThreadInfoMap(stuckThreadIds, SHOW_LOCKS, BATCH_CALLS);
+ }
+
@VisibleForTesting
- public static Map<Long, ThreadInfo> createThreadInfoMap(Set<Long>
stuckThreadIds) {
- /*
- * NOTE: at least some implementations of getThreadInfo(long[], boolean,
boolean)
- * will core dump if the long array contains a duplicate value.
- * That is why stuckThreadIds is a Set instead of a List.
- */
+ public static Map<Long, ThreadInfo> createThreadInfoMap(Set<Long>
stuckThreadIds,
+ final boolean showLocks, final boolean batchCalls) {
if (stuckThreadIds.isEmpty()) {
return Collections.emptyMap();
}
- long[] ids = new long[stuckThreadIds.size()];
- int idx = 0;
- for (long id : stuckThreadIds) {
- ids[idx] = id;
- idx++;
- }
- ThreadInfo[] threadInfos =
ManagementFactory.getThreadMXBean().getThreadInfo(ids, true, true);
+ logger.info("Obtaining ThreadInfo for " + stuckThreadIds.size()
+ + " threads. Configuration: showLocks=" + showLocks + " batchCalls=" +
batchCalls
+ + " This is an expensive operation for the JVM and on most JVMs causes
all threads to be paused.");
Map<Long, ThreadInfo> result = new HashMap<>();
- for (ThreadInfo threadInfo : threadInfos) {
- if (threadInfo != null) {
- result.put(threadInfo.getThreadId(), threadInfo);
+ if (batchCalls) {
Review Comment:
yes
##########
geode-core/src/test/java/org/apache/geode/internal/monitoring/executor/AbstractExecutorGroupJUnitTest.java:
##########
@@ -104,7 +104,7 @@ public void handleExpiry(long stuckTime, Map<Long,
ThreadInfo> map) {
threadIds.add(blockedThread.getId());
threadIds.add(blockingThread.getId());
String threadReport = executor.createThreadReport(60000,
- ThreadsMonitoringProcess.createThreadInfoMap(threadIds));
+ ThreadsMonitoringProcess.createThreadInfoMap(threadIds, true,
true));
Review Comment:
done
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]