From 4023c4e8c571060d1c72268fdade4b0d7cddbef8 Mon Sep 17 00:00:00 2001 From: Diego Tavares Date: Wed, 27 Nov 2024 15:59:48 -0800 Subject: [PATCH 1/4] (ci/cd) Drop support for cy2022 (#1603) The ci-2022 image has been failing the pipelines for using an unsupported version of GLIBC (see https://github.com/AcademySoftwareFoundation/OpenCue/actions/runs/12016939050/job/33498210814) According to the [Reference Platform](https://vfxplatform.com/) ci2022 uses **GLIBC_2.17**, but I'm not sure what on the pipeline requires a higher version. Since this error happens on the `actions/checkout@v3`, it looks like some version bump on GitHub's actions might be the root cause. --- .github/workflows/testing-pipeline.yml | 16 +- ci/pylintrc_test | 1 - ci/run_python_lint.sh | 8 +- .../spcue/dispatcher/HostReportHandler.java | 892 ++++++++++++------ cuegui/cuegui/AbstractDockWidget.py | 3 + cuegui/cuegui/AbstractTreeWidget.py | 1 + cuegui/cuegui/CreatorDialog.py | 2 + cuegui/cuegui/CueJobMonitorTree.py | 8 +- cuegui/cuegui/CueStateBarWidget.py | 6 +- cuegui/cuegui/DependWizard.py | 14 + cuegui/cuegui/FilterDialog.py | 3 + cuegui/cuegui/FrameRangeSelection.py | 9 + cuegui/cuegui/GroupDialog.py | 2 +- cuegui/cuegui/HostMonitor.py | 9 +- cuegui/cuegui/HostMonitorTree.py | 2 + cuegui/cuegui/ItemDelegate.py | 4 +- cuegui/cuegui/JobMonitorTree.py | 4 + cuegui/cuegui/LayerDialog.py | 1 + cuegui/cuegui/Layout.py | 2 +- cuegui/cuegui/LimitsWidget.py | 2 +- cuegui/cuegui/MainWindow.py | 1 + cuegui/cuegui/PreviewWidget.py | 1 + cuegui/cuegui/Redirect.py | 2 +- cuegui/cuegui/ServiceDialog.py | 6 +- cuegui/cuegui/ShowsWidget.py | 2 +- cuegui/cuegui/SubscriptionGraphWidget.py | 4 +- cuegui/cuegui/SubscriptionsWidget.py | 2 +- cuegui/cuegui/ThreadPool.py | 2 + cuegui/cuegui/UnbookDialog.py | 1 + cuegui/cuegui/plugins/AllocationsPlugin.py | 6 +- cuegui/cuegui/plugins/LogViewPlugin.py | 2 + .../cuegui/plugins/MonitorJobDetailsPlugin.py | 3 + cuegui/cuegui/plugins/MonitorJobsPlugin.py | 1 + cuegui/cuegui/plugins/StuckFramePlugin.py | 5 + cuesubmit/cuesubmit/ui/Submit.py | 1 + cuesubmit/cuesubmit/ui/Widgets.py | 2 + 36 files changed, 721 insertions(+), 309 deletions(-) diff --git a/.github/workflows/testing-pipeline.yml b/.github/workflows/testing-pipeline.yml index fe3ade9a6..75d8c8111 100644 --- a/.github/workflows/testing-pipeline.yml +++ b/.github/workflows/testing-pipeline.yml @@ -7,20 +7,6 @@ on: branches: [ master ] jobs: - test_cuebot_2022: - name: Build Cuebot and Run Unit Tests (CY2022) - runs-on: ubuntu-22.04 - container: - image: aswf/ci-opencue:2022 - env: - ACTIONS_ALLOW_USE_UNSECURE_NODE_VERSION: true - steps: - - uses: actions/checkout@v3 - - name: Build with Gradle - run: | - chown -R aswfuser:aswfgroup . - su -c "cd cuebot && ./gradlew build --stacktrace --info" aswfuser - test_python_2023: name: Run Python Unit Tests (CY2023) runs-on: ubuntu-22.04 @@ -66,7 +52,7 @@ jobs: lint_python: name: Lint Python Code runs-on: ubuntu-22.04 - container: aswf/ci-opencue:2022 + container: aswf/ci-opencue:2024.1 env: ACTIONS_ALLOW_USE_UNSECURE_NODE_VERSION: true steps: diff --git a/ci/pylintrc_test b/ci/pylintrc_test index 434a1d754..d84fc406d 100644 --- a/ci/pylintrc_test +++ b/ci/pylintrc_test @@ -67,7 +67,6 @@ disable=arguments-differ, locally-disabled, missing-class-docstring, missing-function-docstring, - no-self-use, protected-access, raise-missing-from, too-many-arguments, diff --git a/ci/run_python_lint.sh b/ci/run_python_lint.sh index ba98d2b6c..488b9c946 100755 --- a/ci/run_python_lint.sh +++ b/ci/run_python_lint.sh @@ -37,14 +37,14 @@ cd .. echo "Running lint for cuegui/..." cd cuegui -PYTHONPATH=../pycue python -m pylint --rcfile=../ci/pylintrc_main cuegui --ignore=cuegui/images,cuegui/images/crystal -PYTHONPATH=../pycue python -m pylint --rcfile=../ci/pylintrc_test tests +PYTHONPATH=../pycue python -m pylint --rcfile=../ci/pylintrc_main cuegui --ignore=cuegui/images,cuegui/images/crystal --disable=no-member +PYTHONPATH=../pycue python -m pylint --rcfile=../ci/pylintrc_test tests --disable=no-member cd .. echo "Running lint for cuesubmit/..." cd cuesubmit -PYTHONPATH=../pycue:../pyoutline python -m pylint --rcfile=../ci/pylintrc_main cuesubmit -PYTHONPATH=../pycue:../pyoutline python -m pylint --rcfile=../ci/pylintrc_test tests +PYTHONPATH=../pycue:../pyoutline python -m pylint --rcfile=../ci/pylintrc_main cuesubmit --disable=no-member +PYTHONPATH=../pycue:../pyoutline python -m pylint --rcfile=../ci/pylintrc_test tests --disable=no-member cd .. echo "Running lint for rqd/..." diff --git a/cuebot/src/main/java/com/imageworks/spcue/dispatcher/HostReportHandler.java b/cuebot/src/main/java/com/imageworks/spcue/dispatcher/HostReportHandler.java index 39423e80b..98a9df495 100644 --- a/cuebot/src/main/java/com/imageworks/spcue/dispatcher/HostReportHandler.java +++ b/cuebot/src/main/java/com/imageworks/spcue/dispatcher/HostReportHandler.java @@ -1,4 +1,3 @@ - /* * Copyright Contributors to the OpenCue Project * @@ -15,38 +14,20 @@ * limitations under the License. */ - - package com.imageworks.spcue.dispatcher; -import java.sql.Timestamp; -import java.util.ArrayList; -import java.util.Comparator; -import java.util.HashMap; -import java.util.List; -import java.util.Map; -import java.util.concurrent.ExecutionException; -import java.util.concurrent.ThreadPoolExecutor; -import java.util.concurrent.TimeUnit; +import static com.imageworks.spcue.dispatcher.Dispatcher.*; import com.google.common.cache.Cache; import com.google.common.cache.CacheBuilder; -import com.imageworks.spcue.JobInterface; -import org.apache.logging.log4j.Logger; -import org.apache.logging.log4j.LogManager; -import org.springframework.beans.factory.annotation.Autowired; -import org.springframework.core.env.Environment; -import org.springframework.core.task.TaskRejectedException; -import org.springframework.dao.DataAccessException; -import org.springframework.dao.EmptyResultDataAccessException; - import com.imageworks.spcue.CommentDetail; import com.imageworks.spcue.DispatchHost; -import com.imageworks.spcue.FrameInterface; import com.imageworks.spcue.FrameDetail; +import com.imageworks.spcue.FrameInterface; import com.imageworks.spcue.JobEntity; -import com.imageworks.spcue.LayerEntity; +import com.imageworks.spcue.JobInterface; import com.imageworks.spcue.LayerDetail; +import com.imageworks.spcue.LayerEntity; import com.imageworks.spcue.LocalHostAssignment; import com.imageworks.spcue.PrometheusMetricsCollector; import com.imageworks.spcue.Source; @@ -72,12 +53,28 @@ import com.imageworks.spcue.service.HostManager; import com.imageworks.spcue.service.JobManager; import com.imageworks.spcue.util.CueUtil; - -import static com.imageworks.spcue.dispatcher.Dispatcher.*; +import java.sql.Timestamp; +import java.util.ArrayList; +import java.util.Comparator; +import java.util.HashMap; +import java.util.List; +import java.util.Map; +import java.util.concurrent.ExecutionException; +import java.util.concurrent.ThreadPoolExecutor; +import java.util.concurrent.TimeUnit; +import org.apache.logging.log4j.LogManager; +import org.apache.logging.log4j.Logger; +import org.springframework.beans.factory.annotation.Autowired; +import org.springframework.core.env.Environment; +import org.springframework.core.task.TaskRejectedException; +import org.springframework.dao.DataAccessException; +import org.springframework.dao.EmptyResultDataAccessException; public class HostReportHandler { - private static final Logger logger = LogManager.getLogger(HostReportHandler.class); + private static final Logger logger = LogManager.getLogger( + HostReportHandler.class + ); private BookingManager bookingManager; private HostManager hostManager; @@ -91,16 +88,20 @@ public class HostReportHandler { private JobManager jobManager; private JobDao jobDao; private LayerDao layerDao; + @Autowired private Environment env; + @Autowired private CommentManager commentManager; + @Autowired private PrometheusMetricsCollector prometheusMetrics; // Comment constants - private static final String SUBJECT_COMMENT_FULL_TEMP_DIR = "Host set to REPAIR for not having enough storage " + - "space on the temporary directory (mcp)"; + private static final String SUBJECT_COMMENT_FULL_TEMP_DIR = + "Host set to REPAIR for not having enough storage " + + "space on the temporary directory (mcp)"; private static final String CUEBOT_COMMENT_USER = "cuebot"; private static final String WINDOWS_OS = "Windows"; @@ -108,8 +109,11 @@ public class HostReportHandler { // The cache expires after write to avoid growing unbounded. If a request for a host-frame doesn't appear // for a period of time, the entry will be removed. Cache killRequestCounterCache = CacheBuilder.newBuilder() - .expireAfterWrite(FRAME_KILL_CACHE_EXPIRE_AFTER_WRITE_MINUTES, TimeUnit.MINUTES) - .build(); + .expireAfterWrite( + FRAME_KILL_CACHE_EXPIRE_AFTER_WRITE_MINUTES, + TimeUnit.MINUTES + ) + .build(); /** * Boolean to toggle if this class is accepting data or not. @@ -141,8 +145,9 @@ public synchronized void shutdown() { public void queueBootReport(BootReport report) { if (isShutdown()) { throw new RqdRetryReportException( - "Error processing host report. Cuebot not " + - "accepting packets."); + "Error processing host report. Cuebot not " + + "accepting packets." + ); } reportQueue.execute(new DispatchHandleHostReport(report, this)); } @@ -155,8 +160,9 @@ public void queueBootReport(BootReport report) { public void queueHostReport(HostReport report) { if (isShutdown()) { throw new RqdRetryReportException( - "Error processing host report. Cuebot not " + - "accepting packets."); + "Error processing host report. Cuebot not " + + "accepting packets." + ); } reportQueue.execute(new DispatchHandleHostReport(report, this)); } @@ -164,31 +170,45 @@ public void queueHostReport(HostReport report) { public void handleHostReport(HostReport report, boolean isBoot) { long startTime = System.currentTimeMillis(); try { - long swapOut = 0; if (report.getHost().getAttributesMap().containsKey("swapout")) { - swapOut = Integer.parseInt(report.getHost().getAttributesMap().get("swapout")); - if (swapOut > 0) - logger.info(report.getHost().getName() + " swapout: " + - report.getHost().getAttributesMap().get("swapout")); + swapOut = Integer.parseInt( + report.getHost().getAttributesMap().get("swapout") + ); + if (swapOut > 0) logger.info( + report.getHost().getName() + + " swapout: " + + report.getHost().getAttributesMap().get("swapout") + ); } DispatchHost host; RenderHost rhost = report.getHost(); try { host = hostManager.findDispatchHost(rhost.getName()); - hostManager.setHostStatistics(host, - rhost.getTotalMem(), rhost.getFreeMem(), - rhost.getTotalSwap(), rhost.getFreeSwap(), - rhost.getTotalMcp(), rhost.getFreeMcp(), - rhost.getTotalGpuMem(), rhost.getFreeGpuMem(), - rhost.getLoad(), new Timestamp(rhost.getBootTime() * 1000l), - rhost.getAttributesMap().get("SP_OS")); + hostManager.setHostStatistics( + host, + rhost.getTotalMem(), + rhost.getFreeMem(), + rhost.getTotalSwap(), + rhost.getFreeSwap(), + rhost.getTotalMcp(), + rhost.getFreeMcp(), + rhost.getTotalGpuMem(), + rhost.getFreeGpuMem(), + rhost.getLoad(), + new Timestamp(rhost.getBootTime() * 1000l), + rhost.getAttributesMap().get("SP_OS") + ); // Both logics are conflicting, only change hardware state if // there was no need for a tempDirStorage state change if (!changeStateForTempDirStorage(host, report.getHost())) { - changeHardwareState(host, report.getHost().getState(), isBoot); + changeHardwareState( + host, + report.getHost().getState(), + isBoot + ); } changeNimbyState(host, report.getHost()); @@ -200,16 +220,22 @@ public void handleHostReport(HostReport report, boolean isBoot) { hostManager.setHostResources(host, report); } - dispatchSupport.determineIdleCores(host, report.getHost().getLoad()); - + dispatchSupport.determineIdleCores( + host, + report.getHost().getLoad() + ); } catch (DataAccessException dae) { - logger.info("Unable to find host " + rhost.getName() + "," - + dae + " , creating host."); + logger.info( + "Unable to find host " + + rhost.getName() + + "," + + dae + + " , creating host." + ); // TODO: Skip adding it if the host name is over 30 characters host = hostManager.createHost(report); - } - catch (Exception e) { + } catch (Exception e) { logger.warn("Error processing HostReport, " + e); return; } @@ -218,7 +244,9 @@ public void handleHostReport(HostReport report, boolean isBoot) { * Verify all the frames in the report are valid. * Frames that are not valid are removed. */ - List runningFrames = verifyRunningFrameInfo(report); + List runningFrames = verifyRunningFrameInfo( + report + ); /* * Updates memory usage for the proc, frames, @@ -245,7 +273,9 @@ public void handleHostReport(HostReport report, boolean isBoot) { */ String msg = null; boolean hasLocalJob = bookingManager.hasLocalHostAssignment(host); - int coresToReserve = host.handleNegativeCoresRequirement(Dispatcher.CORE_POINTS_RESERVED_MIN); + int coresToReserve = host.handleNegativeCoresRequirement( + Dispatcher.CORE_POINTS_RESERVED_MIN + ); if (hasLocalJob) { List lcas = @@ -255,38 +285,55 @@ public void handleHostReport(HostReport report, boolean isBoot) { } } long memReservedMin = env.getRequiredProperty( - "dispatcher.memory.mem_reserved_min", - Long.class); - - if (!isTempDirStorageEnough(report.getHost().getTotalMcp(), report.getHost().getFreeMcp(), host.getOs())) { + "dispatcher.memory.mem_reserved_min", + Long.class + ); + + if ( + !isTempDirStorageEnough( + report.getHost().getTotalMcp(), + report.getHost().getFreeMcp(), + host.getOs() + ) + ) { msg = String.format( "%s doesn't have enough free space in the temporary directory (mcp), %dMB", - host.name, (report.getHost().getFreeMcp()/1024)); - } - else if (coresToReserve <= 0 || host.idleCores < Dispatcher.CORE_POINTS_RESERVED_MIN) { - msg = String.format("%s doesn't have enough idle cores, %d needs %d", - host.name, host.idleCores, Dispatcher.CORE_POINTS_RESERVED_MIN); - } - else if (host.idleMemory < memReservedMin) { - msg = String.format("%s doesn't have enough idle memory, %d needs %d", - host.name, host.idleMemory, memReservedMin); - } - else if (report.getHost().getFreeMem() < CueUtil.MB512) { - msg = String.format("%s doesn't have enough free system mem, %d needs %d", - host.name, report.getHost().getFreeMem(), memReservedMin); - } - else if(!host.hardwareState.equals(HardwareState.UP)) { + host.name, + (report.getHost().getFreeMcp() / 1024) + ); + } else if ( + coresToReserve <= 0 || + host.idleCores < Dispatcher.CORE_POINTS_RESERVED_MIN + ) { + msg = String.format( + "%s doesn't have enough idle cores, %d needs %d", + host.name, + host.idleCores, + Dispatcher.CORE_POINTS_RESERVED_MIN + ); + } else if (host.idleMemory < memReservedMin) { + msg = String.format( + "%s doesn't have enough idle memory, %d needs %d", + host.name, + host.idleMemory, + memReservedMin + ); + } else if (report.getHost().getFreeMem() < CueUtil.MB512) { + msg = String.format( + "%s doesn't have enough free system mem, %d needs %d", + host.name, + report.getHost().getFreeMem(), + memReservedMin + ); + } else if (!host.hardwareState.equals(HardwareState.UP)) { msg = host + " is not in the Up state."; - } - else if (host.lockState.equals(LockState.LOCKED)) { + } else if (host.lockState.equals(LockState.LOCKED)) { msg = host + " is locked."; - } - else if (report.getHost().getNimbyLocked()) { + } else if (report.getHost().getNimbyLocked()) { if (!hasLocalJob) { msg = host + " is NIMBY locked."; } - } - else if (!dispatchSupport.isCueBookable(host)) { + } else if (!dispatchSupport.isCueBookable(host)) { msg = "The cue has no pending jobs"; } @@ -296,9 +343,7 @@ else if (!dispatchSupport.isCueBookable(host)) { */ if (msg != null) { logger.trace(msg); - } - else { - + } else { // check again. The dangling local host assignment could be removed. hasLocalJob = bookingManager.hasLocalHostAssignment(host); @@ -308,8 +353,8 @@ else if (!dispatchSupport.isCueBookable(host)) { if (hasLocalJob) { if (!bookingManager.hasResourceDeficit(host)) { bookingQueue.execute( - new DispatchBookHostLocal( - host, localDispatcher)); + new DispatchBookHostLocal(host, localDispatcher) + ); } return; } @@ -319,25 +364,38 @@ else if (!dispatchSupport.isCueBookable(host)) { * to that show first. */ if (hostManager.isPreferShow(host)) { - bookingQueue.execute(new DispatchBookHost( - host, hostManager.getPreferredShow(host), dispatcher, env)); + bookingQueue.execute( + new DispatchBookHost( + host, + hostManager.getPreferredShow(host), + dispatcher, + env + ) + ); return; } - bookingQueue.execute(new DispatchBookHost(host, dispatcher, env)); + bookingQueue.execute( + new DispatchBookHost(host, dispatcher, env) + ); } - } finally { - if (reportQueue.getQueue().size() > 0 || - System.currentTimeMillis() - startTime > 100) { + if ( + reportQueue.getQueue().size() > 0 || + System.currentTimeMillis() - startTime > 100 + ) { /* * Write a log if the host report takes a long time to process. */ - CueUtil.logDuration(startTime, "host report " + - report.getHost().getName() + " with " + - report.getFramesCount() + - " running frames, waiting: " + - reportQueue.getQueue().size()); + CueUtil.logDuration( + startTime, + "host report " + + report.getHost().getName() + + " with " + + report.getFramesCount() + + " running frames, waiting: " + + reportQueue.getQueue().size() + ); } } } @@ -354,16 +412,25 @@ else if (!dispatchSupport.isCueBookable(host)) { * @param hostOs Reported operational systems * @return */ - private boolean isTempDirStorageEnough(Long tempTotalStorage, Long tempFreeStorage, String[] hostOs) { + private boolean isTempDirStorageEnough( + Long tempTotalStorage, + Long tempFreeStorage, + String[] hostOs + ) { // The minimum amount of free space in the temporary directory to book a host int minAvailableTempPercentage = env.getRequiredProperty( - "dispatcher.min_available_temp_storage_percentage", Integer.class); + "dispatcher.min_available_temp_storage_percentage", + Integer.class + ); - return minAvailableTempPercentage == -1 + return ( + minAvailableTempPercentage == -1 || // It is safe to assume multiple OSs imply windows is not the base OS, // threfore Windows will always report a single hostOs - || (hostOs.length == 1 && hostOs[0].equalsIgnoreCase(WINDOWS_OS)) - || (((tempFreeStorage * 100.0) / tempTotalStorage) >= minAvailableTempPercentage); + (hostOs.length == 1 && hostOs[0].equalsIgnoreCase(WINDOWS_OS)) || + (((tempFreeStorage * 100.0) / tempTotalStorage) >= + minAvailableTempPercentage) + ); } /** @@ -379,7 +446,11 @@ private boolean isTempDirStorageEnough(Long tempTotalStorage, Long tempFreeStora * @param reportState * @param isBoot */ - private void changeHardwareState(DispatchHost host, HardwareState reportState, boolean isBoot) { + private void changeHardwareState( + DispatchHost host, + HardwareState reportState, + boolean isBoot + ) { // If the states are the same there is no reason to do this update. if (host.hardwareState.equals(reportState)) { return; @@ -405,7 +476,6 @@ private void changeHardwareState(DispatchHost host, HardwareState reportState, b hostManager.setHostState(host, reportState); host.hardwareState = reportState; break; - } } @@ -424,26 +494,41 @@ private void changeHardwareState(DispatchHost host, HardwareState reportState, b * @param reportHost * @return */ - private boolean changeStateForTempDirStorage(DispatchHost host, RenderHost reportHost) { + private boolean changeStateForTempDirStorage( + DispatchHost host, + RenderHost reportHost + ) { // The minimum amount of free space in the temporary directory to book a host int minAvailableTempPercentage = env.getRequiredProperty( - "dispatcher.min_available_temp_storage_percentage", Integer.class); + "dispatcher.min_available_temp_storage_percentage", + Integer.class + ); // Prevent cue frames from booking on hosts with full temporary directories boolean hasEnoughTempStorage = isTempDirStorageEnough( reportHost.getTotalMcp(), reportHost.getFreeMcp(), - host.getOs()); + host.getOs() + ); if (!hasEnoughTempStorage && host.hardwareState == HardwareState.UP) { // Insert a comment indicating that the Host status = Repair with reason = Full temporary directory CommentDetail c = new CommentDetail(); c.subject = SUBJECT_COMMENT_FULL_TEMP_DIR; c.user = CUEBOT_COMMENT_USER; c.timestamp = null; - long requiredTempMb = (long)((minAvailableTempPercentage / 100.0) * reportHost.getTotalMcp()/ 1024); - c.message = "Host " + host.getName() + " marked as REPAIR. The current amount of free space in the " + - "temporary directory (mcp) is " + (reportHost.getFreeMcp()/1024) + "MB. It must have at least " - + ((requiredTempMb)) + "MB of free space in temporary directory"; + long requiredTempMb = (long) (((minAvailableTempPercentage / + 100.0) * + reportHost.getTotalMcp()) / + 1024); + c.message = + "Host " + + host.getName() + + " marked as REPAIR. The current amount of free space in the " + + "temporary directory (mcp) is " + + (reportHost.getFreeMcp() / 1024) + + "MB. It must have at least " + + ((requiredTempMb)) + + "MB of free space in temporary directory"; commentManager.addComment(host, c); // Set the host state to REPAIR @@ -451,11 +536,17 @@ private boolean changeStateForTempDirStorage(DispatchHost host, RenderHost repor host.hardwareState = HardwareState.REPAIR; return true; - } else if (hasEnoughTempStorage && host.hardwareState == HardwareState.REPAIR) { + } else if ( + hasEnoughTempStorage && host.hardwareState == HardwareState.REPAIR + ) { // Check if the host with REPAIR status has comments with subject=SUBJECT_COMMENT_FULL_TEMP_DIR and // user=CUEBOT_COMMENT_USER and delete the comments, if they exist - boolean commentsDeleted = commentManager.deleteCommentByHostUserAndSubject(host, - CUEBOT_COMMENT_USER, SUBJECT_COMMENT_FULL_TEMP_DIR); + boolean commentsDeleted = + commentManager.deleteCommentByHostUserAndSubject( + host, + CUEBOT_COMMENT_USER, + SUBJECT_COMMENT_FULL_TEMP_DIR + ); if (commentsDeleted) { // Set the host state to UP @@ -479,13 +570,20 @@ private void changeNimbyState(DispatchHost host, RenderHost rh) { if (rh.getNimbyLocked()) { if (host.lockState.equals(LockState.OPEN)) { host.lockState = LockState.NIMBY_LOCKED; - hostManager.setHostLock(host,LockState.NIMBY_LOCKED, new Source("NIMBY")); + hostManager.setHostLock( + host, + LockState.NIMBY_LOCKED, + new Source("NIMBY") + ); } - } - else { + } else { if (host.lockState.equals(LockState.NIMBY_LOCKED)) { host.lockState = LockState.OPEN; - hostManager.setHostLock(host,LockState.OPEN, new Source("NIMBY")); + hostManager.setHostLock( + host, + LockState.OPEN, + new Source("NIMBY") + ); } } } @@ -501,11 +599,19 @@ private void changeLockState(DispatchHost host, CoreDetail coreInfo) { if (host.lockState == LockState.LOCKED) { if (coreInfo.getLockedCores() < coreInfo.getTotalCores()) { host.lockState = LockState.OPEN; - hostManager.setHostLock(host, LockState.OPEN, new Source("cores")); + hostManager.setHostLock( + host, + LockState.OPEN, + new Source("cores") + ); } } else if (coreInfo.getLockedCores() >= coreInfo.getTotalCores()) { host.lockState = LockState.LOCKED; - hostManager.setHostLock(host, LockState.LOCKED, new Source("cores")); + hostManager.setHostLock( + host, + LockState.LOCKED, + new Source("cores") + ); } } @@ -525,53 +631,84 @@ private void changeLockState(DispatchHost host, CoreDetail coreInfo) { * @param dispatchHost * @param report */ - private void handleMemoryUsage(final DispatchHost dispatchHost, RenderHost renderHost, - List runningFrames) { + private void handleMemoryUsage( + final DispatchHost dispatchHost, + RenderHost renderHost, + List runningFrames + ) { // Don't keep memory balances on nimby hosts and hosts with invalid memory // information if (dispatchHost.isNimby || renderHost.getTotalMem() <= 0) { return; } - final double OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD = env - .getRequiredProperty("dispatcher.oom_max_safe_used_physical_memory_threshold", Double.class); - final double OOM_MAX_SAFE_USED_SWAP_THRESHOLD = env - .getRequiredProperty("dispatcher.oom_max_safe_used_swap_memory_threshold", Double.class); - final double OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD = env - .getRequiredProperty("dispatcher.oom_frame_overboard_allowed_threshold", Double.class); + final double OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD = + env.getRequiredProperty( + "dispatcher.oom_max_safe_used_physical_memory_threshold", + Double.class + ); + final double OOM_MAX_SAFE_USED_SWAP_THRESHOLD = env.getRequiredProperty( + "dispatcher.oom_max_safe_used_swap_memory_threshold", + Double.class + ); + final double OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD = + env.getRequiredProperty( + "dispatcher.oom_frame_overboard_allowed_threshold", + Double.class + ); - Double physMemoryUsageRatio = renderHost.getTotalMem() > 0 ? - 1.0 - renderHost.getFreeMem() / (double) renderHost.getTotalMem() : - 0.0; + Double physMemoryUsageRatio = renderHost.getTotalMem() > 0 + ? 1.0 - renderHost.getFreeMem() / (double) renderHost.getTotalMem() + : 0.0; - Double swapMemoryUsageRatio = renderHost.getTotalSwap() > 0 ? - 1.0 - renderHost.getFreeSwap() / (double) renderHost.getTotalSwap() : - 0.0; + Double swapMemoryUsageRatio = renderHost.getTotalSwap() > 0 + ? 1.0 - + renderHost.getFreeSwap() / (double) renderHost.getTotalSwap() + : 0.0; // If checking for the swap threshold has been disabled, only memory usage is // taken into consideration. // If checking for memory has been disabled, checking for swap isolated is not // safe, therefore disabled boolean memoryWarning = false; - if (OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD > 0.0 && OOM_MAX_SAFE_USED_SWAP_THRESHOLD > 0.0 && - !physMemoryUsageRatio.isNaN() && !swapMemoryUsageRatio.isNaN()) { - memoryWarning = physMemoryUsageRatio > OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD && + if ( + OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD > 0.0 && + OOM_MAX_SAFE_USED_SWAP_THRESHOLD > 0.0 && + !physMemoryUsageRatio.isNaN() && + !swapMemoryUsageRatio.isNaN() + ) { + memoryWarning = + physMemoryUsageRatio > OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD && swapMemoryUsageRatio > OOM_MAX_SAFE_USED_SWAP_THRESHOLD; - } else if (OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD > 0.0 && !physMemoryUsageRatio.isNaN()) { - memoryWarning = physMemoryUsageRatio > OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD; + } else if ( + OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD > 0.0 && + !physMemoryUsageRatio.isNaN() + ) { + memoryWarning = + physMemoryUsageRatio > OOM_MAX_SAFE_USED_PHYSICAL_THRESHOLD; } if (memoryWarning) { - logger.warn("Memory warning(" + renderHost.getName() + "): physMemoryRatio: " + - physMemoryUsageRatio + ", swapRatio: " + swapMemoryUsageRatio); + logger.warn( + "Memory warning(" + + renderHost.getName() + + "): physMemoryRatio: " + + physMemoryUsageRatio + + ", swapRatio: " + + swapMemoryUsageRatio + ); // Try to kill frames using swap memory as they are probably performing poorly - long swapUsed = renderHost.getTotalSwap() - renderHost.getFreeSwap(); - long maxSwapUsageAllowed = (long) (renderHost.getTotalSwap() - * OOM_MAX_SAFE_USED_SWAP_THRESHOLD); + long swapUsed = + renderHost.getTotalSwap() - renderHost.getFreeSwap(); + long maxSwapUsageAllowed = (long) (renderHost.getTotalSwap() * + OOM_MAX_SAFE_USED_SWAP_THRESHOLD); // Sort runningFrames bassed on how much swap they are using - runningFrames.sort(Comparator.comparingLong((RunningFrameInfo frame) -> - frame.getUsedSwapMemory()).reversed()); + runningFrames.sort( + Comparator.comparingLong((RunningFrameInfo frame) -> + frame.getUsedSwapMemory() + ).reversed() + ); int killAttemptsRemaining = 5; for (RunningFrameInfo frame : runningFrames) { @@ -579,16 +716,31 @@ private void handleMemoryUsage(final DispatchHost dispatchHost, RenderHost rende if (frame.getUsedSwapMemory() <= 0) { break; } - if (killProcForMemory(frame.getFrameId(), renderHost.getName(), - KillCause.HostUnderOom)) { + if ( + killProcForMemory( + frame.getFrameId(), + renderHost.getName(), + KillCause.HostUnderOom + ) + ) { swapUsed -= frame.getUsedSwapMemory(); - logger.info("Memory warning(" + renderHost.getName() + "): " + - "Killing frame on " + frame.getJobName() + "." + - frame.getFrameName() + ", using too much swap."); + logger.info( + "Memory warning(" + + renderHost.getName() + + "): " + + "Killing frame on " + + frame.getJobName() + + "." + + frame.getFrameName() + + ", using too much swap." + ); } killAttemptsRemaining -= 1; - if (killAttemptsRemaining <= 0 || swapUsed <= maxSwapUsageAllowed) { + if ( + killAttemptsRemaining <= 0 || + swapUsed <= maxSwapUsageAllowed + ) { break; } } @@ -597,10 +749,20 @@ private void handleMemoryUsage(final DispatchHost dispatchHost, RenderHost rende // if frames didn't go overboard, manage its reservations trying to increase // them accordingly for (final RunningFrameInfo frame : runningFrames) { - if (OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD > 0 && isFrameOverboard(frame)) { - if (!killFrameOverusingMemory(frame, dispatchHost.getName())) { - logger.warn("Frame " + frame.getJobName() + "." + frame.getFrameName() + - " is overboard but could not be killed"); + if ( + OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD > 0 && + isFrameOverboard(frame) + ) { + if ( + !killFrameOverusingMemory(frame, dispatchHost.getName()) + ) { + logger.warn( + "Frame " + + frame.getJobName() + + "." + + frame.getFrameName() + + " is overboard but could not be killed" + ); } } else { handleMemoryReservations(frame); @@ -615,29 +777,45 @@ public enum KillCause { FrameTimedOut("Frame timed out"), FrameLluTimedOut("Frame LLU timed out"), FrameVerificationFailure("Frame failed to be verified on the database"); + private final String message; private KillCause(String message) { this.message = message; } + @Override public String toString() { return message; } } - private boolean killFrameOverusingMemory(RunningFrameInfo frame, String hostname) { + private boolean killFrameOverusingMemory( + RunningFrameInfo frame, + String hostname + ) { try { - VirtualProc proc = hostManager.getVirtualProc(frame.getResourceId()); + VirtualProc proc = hostManager.getVirtualProc( + frame.getResourceId() + ); // Don't mess with localDispatch procs if (proc.isLocalDispatch) { return false; } - boolean killed = killProcForMemory(proc.frameId, hostname, KillCause.FrameOverboard); + boolean killed = killProcForMemory( + proc.frameId, + hostname, + KillCause.FrameOverboard + ); if (killed) { - logger.info("Killing frame on " + frame.getJobName() + "." + frame.getFrameName() + - ", using too much memory."); + logger.info( + "Killing frame on " + + frame.getJobName() + + "." + + frame.getFrameName() + + ", using too much memory." + ); } return killed; } catch (EmptyResultDataAccessException e) { @@ -647,8 +825,10 @@ private boolean killFrameOverusingMemory(RunningFrameInfo frame, String hostname private boolean getKillClearance(String hostname, String frameId) { String cacheKey = hostname + "-" + frameId; - final int FRAME_KILL_RETRY_LIMIT = - env.getRequiredProperty("dispatcher.frame_kill_retry_limit", Integer.class); + final int FRAME_KILL_RETRY_LIMIT = env.getRequiredProperty( + "dispatcher.frame_kill_retry_limit", + Integer.class + ); // Cache frame+host receiving a killRequest and count how many times the request is being retried // meaning rqd is probably failing at attempting to kill the related proc @@ -667,13 +847,18 @@ private boolean getKillClearance(String hostname, String frameId) { FrameInterface frame = jobManager.getFrame(frameId); JobInterface job = jobManager.getJob(frame.getJobId()); prometheusMetrics.incrementFrameKillFailureCounter( - hostname, - job.getName(), - frame.getName(), - frameId); + hostname, + job.getName(), + frame.getName(), + frameId + ); } catch (EmptyResultDataAccessException e) { logger.info( - "Trying to kill a frame that no longer exists: host=" + hostname + " frameId=" + frameId); + "Trying to kill a frame that no longer exists: host=" + + hostname + + " frameId=" + + frameId + ); } } return false; @@ -681,7 +866,11 @@ private boolean getKillClearance(String hostname, String frameId) { return true; } - private boolean killProcForMemory(String frameId, String hostname, KillCause killCause) { + private boolean killProcForMemory( + String frameId, + String hostname, + KillCause killCause + ) { if (!getKillClearance(hostname, frameId)) { return false; } @@ -689,15 +878,35 @@ private boolean killProcForMemory(String frameId, String hostname, KillCause kil FrameInterface frame = jobManager.getFrame(frameId); if (dispatcher.isTestMode()) { // Different threads don't share the same database state on the test environment - (new DispatchRqdKillFrameMemory(hostname, frame, killCause.toString(), rqdClient, - dispatchSupport, dispatcher.isTestMode())).run(); + (new DispatchRqdKillFrameMemory( + hostname, + frame, + killCause.toString(), + rqdClient, + dispatchSupport, + dispatcher.isTestMode() + )).run(); } else { try { - killQueue.execute(new DispatchRqdKillFrameMemory(hostname, frame, killCause.toString(), rqdClient, - dispatchSupport, dispatcher.isTestMode())); - prometheusMetrics.incrementFrameKilledCounter(hostname, killCause); + killQueue.execute( + new DispatchRqdKillFrameMemory( + hostname, + frame, + killCause.toString(), + rqdClient, + dispatchSupport, + dispatcher.isTestMode() + ) + ); + prometheusMetrics.incrementFrameKilledCounter( + hostname, + killCause + ); } catch (TaskRejectedException e) { - logger.warn("Unable to add a DispatchRqdKillFrame request, task rejected, " + e); + logger.warn( + "Unable to add a DispatchRqdKillFrame request, task rejected, " + + e + ); return false; } } @@ -705,23 +914,42 @@ private boolean killProcForMemory(String frameId, String hostname, KillCause kil return true; } - private boolean killFrame(String frameId, String hostname, KillCause killCause) { + private boolean killFrame( + String frameId, + String hostname, + KillCause killCause + ) { if (!getKillClearance(hostname, frameId)) { return false; } if (dispatcher.isTestMode()) { // Different threads don't share the same database state on the test environment - (new DispatchRqdKillFrame(hostname, frameId, killCause.toString(), rqdClient)).run(); + (new DispatchRqdKillFrame( + hostname, + frameId, + killCause.toString(), + rqdClient + )).run(); } else { try { - killQueue.execute(new DispatchRqdKillFrame(hostname, + killQueue.execute( + new DispatchRqdKillFrame( + hostname, frameId, killCause.toString(), - rqdClient)); - prometheusMetrics.incrementFrameKilledCounter(hostname, killCause); + rqdClient + ) + ); + prometheusMetrics.incrementFrameKilledCounter( + hostname, + killCause + ); } catch (TaskRejectedException e) { - logger.warn("Unable to add a DispatchRqdKillFrame request, task rejected, " + e); + logger.warn( + "Unable to add a DispatchRqdKillFrame request, task rejected, " + + e + ); } } DispatchSupport.killedOffenderProcs.incrementAndGet(); @@ -735,35 +963,62 @@ private boolean killFrame(String frameId, String hostname, KillCause killCause) */ private boolean isFrameOverboard(final RunningFrameInfo frame) { final double OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD = - env.getRequiredProperty("dispatcher.oom_frame_overboard_allowed_threshold", Double.class); + env.getRequiredProperty( + "dispatcher.oom_frame_overboard_allowed_threshold", + Double.class + ); if (OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD < 0) { return false; } - double rss = (double)frame.getRss(); - double maxRss = (double)frame.getMaxRss(); - final double MAX_RSS_OVERBOARD_THRESHOLD = OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD * 2; + double rss = (double) frame.getRss(); + double maxRss = (double) frame.getMaxRss(); + final double MAX_RSS_OVERBOARD_THRESHOLD = + OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD * 2; final double RSS_AVAILABLE_FOR_MAX_RSS_TRIGGER = 0.1; try { - VirtualProc proc = hostManager.getVirtualProc(frame.getResourceId()); - double reserved = (double)proc.memoryReserved; + VirtualProc proc = hostManager.getVirtualProc( + frame.getResourceId() + ); + double reserved = (double) proc.memoryReserved; // Last memory report is higher than the threshold - if (isOverboard(rss, reserved, OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD)) { + if ( + isOverboard( + rss, + reserved, + OOM_FRAME_OVERBOARD_ALLOWED_THRESHOLD + ) + ) { return true; } // If rss is not overboard, handle the situation where the frame might be going overboard from // time to time but the last report wasn't during a spike. For this case, consider a combination // of rss and maxRss. maxRss > 2 * threshold and rss > 0.9 else { - return isOverboard(maxRss, reserved, MAX_RSS_OVERBOARD_THRESHOLD) && - isOverboard(rss, reserved, -RSS_AVAILABLE_FOR_MAX_RSS_TRIGGER); + return ( + isOverboard( + maxRss, + reserved, + MAX_RSS_OVERBOARD_THRESHOLD + ) && + isOverboard( + rss, + reserved, + -RSS_AVAILABLE_FOR_MAX_RSS_TRIGGER + ) + ); } } catch (EmptyResultDataAccessException e) { - logger.info("HostReportHandler(isFrameOverboard): Virtual proc for frame " + - frame.getFrameName() + " on job " + frame.getJobName() + " doesn't exist on the database"); + logger.info( + "HostReportHandler(isFrameOverboard): Virtual proc for frame " + + frame.getFrameName() + + " on job " + + frame.getJobName() + + " doesn't exist on the database" + ); // Not able to mark the frame overboard is it couldn't be found on the db. // Proc accounting (verifyRunningProc) should take care of it return false; @@ -771,7 +1026,7 @@ private boolean isFrameOverboard(final RunningFrameInfo frame) { } private boolean isOverboard(double value, double total, double threshold) { - return value/total >= (1 + threshold); + return value / total >= (1 + threshold); } /** @@ -790,33 +1045,65 @@ private void handleMemoryReservations(final RunningFrameInfo frame) { if (dispatchSupport.increaseReservedMemory(proc, frame.getRss())) { proc.memoryReserved = frame.getRss(); - logger.info("frame " + frame.getFrameName() + " on job " + frame.getJobName() - + " increased its reserved memory to " + - CueUtil.KbToMb(frame.getRss())); + logger.info( + "frame " + + frame.getFrameName() + + " on job " + + frame.getJobName() + + " increased its reserved memory to " + + CueUtil.KbToMb(frame.getRss()) + ); } } catch (ResourceReservationFailureException e) { if (proc != null) { long memNeeded = frame.getRss() - proc.memoryReserved; - logger.info("frame " + frame.getFrameName() + " on job " + frame.getJobName() - + "was unable to reserve an additional " + CueUtil.KbToMb(memNeeded) - + "on proc " + proc.getName() + ", " + e); + logger.info( + "frame " + + frame.getFrameName() + + " on job " + + frame.getJobName() + + "was unable to reserve an additional " + + CueUtil.KbToMb(memNeeded) + + "on proc " + + proc.getName() + + ", " + + e + ); try { - if (dispatchSupport.balanceReservedMemory(proc, memNeeded)) { + if ( + dispatchSupport.balanceReservedMemory(proc, memNeeded) + ) { proc.memoryReserved = frame.getRss(); - logger.info("was able to balance host: " + proc.getName()); + logger.info( + "was able to balance host: " + proc.getName() + ); } else { - logger.info("failed to balance host: " + proc.getName()); + logger.info( + "failed to balance host: " + proc.getName() + ); } } catch (Exception ex) { - logger.warn("failed to balance host: " + proc.getName() + ", " + e); + logger.warn( + "failed to balance host: " + proc.getName() + ", " + e + ); } } else { - logger.info("frame " + frame.getFrameName() + " on job " + frame.getJobName() - + "was unable to reserve an additional memory. Proc could not be found"); + logger.info( + "frame " + + frame.getFrameName() + + " on job " + + frame.getJobName() + + "was unable to reserve an additional memory. Proc could not be found" + ); } } catch (EmptyResultDataAccessException e) { - logger.info("HostReportHandler: Memory reservations for frame " + frame.getFrameName() + - " on job " + frame.getJobName() + " proc could not be found"); + logger.info( + "HostReportHandler: Memory reservations for frame " + + frame.getFrameName() + + " on job " + + frame.getJobName() + + " proc could not be found" + ); } } @@ -825,22 +1112,39 @@ private void handleMemoryReservations(final RunningFrameInfo frame) { * * @param rFrames */ - private void killTimedOutFrames(List runningFrames, String hostname) { + private void killTimedOutFrames( + List runningFrames, + String hostname + ) { for (RunningFrameInfo frame : runningFrames) { String layerId = frame.getLayerId(); try { LayerDetail layer = layerDao.getLayerDetail(layerId); - long runtimeMinutes = ((System.currentTimeMillis() - frame.getStartTime()) / 1000l) / 60; + long runtimeMinutes = + ((System.currentTimeMillis() - frame.getStartTime()) / + 1000l) / + 60; if (layer.timeout != 0 && runtimeMinutes > layer.timeout) { - killFrame(frame.getFrameId(), hostname, KillCause.FrameTimedOut); + killFrame( + frame.getFrameId(), + hostname, + KillCause.FrameTimedOut + ); } else if (layer.timeout_llu != 0 && frame.getLluTime() != 0) { long r = System.currentTimeMillis() / 1000; long lastUpdate = (r - frame.getLluTime()) / 60; - if (layer.timeout_llu != 0 && lastUpdate > (layer.timeout_llu - 1)) { - killFrame(frame.getFrameId(), hostname, KillCause.FrameLluTimedOut); + if ( + layer.timeout_llu != 0 && + lastUpdate > (layer.timeout_llu - 1) + ) { + killFrame( + frame.getFrameId(), + hostname, + KillCause.FrameLluTimedOut + ); } } } catch (EmptyResultDataAccessException e) { @@ -855,18 +1159,27 @@ private void killTimedOutFrames(List runningFrames, String hos * @param rFrames */ private void updateMemoryUsageAndLluTime(List rFrames) { - - for (RunningFrameInfo rf: rFrames) { + for (RunningFrameInfo rf : rFrames) { FrameInterface frame = jobManager.getFrame(rf.getFrameId()); - dispatchSupport.updateFrameMemoryUsageAndLluTime(frame, - rf.getRss(), rf.getMaxRss(), rf.getLluTime()); - - dispatchSupport.updateProcMemoryUsage(frame, rf.getRss(), rf.getMaxRss(), - rf.getVsize(), rf.getMaxVsize(), rf.getUsedGpuMemory(), - rf.getMaxUsedGpuMemory(), rf.getUsedSwapMemory(), - rf.getChildren().toByteArray()); - + dispatchSupport.updateFrameMemoryUsageAndLluTime( + frame, + rf.getRss(), + rf.getMaxRss(), + rf.getLluTime() + ); + + dispatchSupport.updateProcMemoryUsage( + frame, + rf.getRss(), + rf.getMaxRss(), + rf.getVsize(), + rf.getMaxVsize(), + rf.getUsedGpuMemory(), + rf.getMaxUsedGpuMemory(), + rf.getUsedSwapMemory(), + rf.getChildren().toByteArray() + ); } updateJobMemoryUsage(rFrames); @@ -879,23 +1192,22 @@ private void updateMemoryUsageAndLluTime(List rFrames) { * @param frames */ private void updateJobMemoryUsage(List frames) { + final Map jobs = new HashMap( + frames.size() + ); - final Map jobs = - new HashMap(frames.size()); - - for (RunningFrameInfo frame: frames) { + for (RunningFrameInfo frame : frames) { JobEntity job = new JobEntity(frame.getJobId()); if (jobs.containsKey(job)) { if (jobs.get(job) < frame.getMaxRss()) { jobs.put(job, frame.getMaxRss()); } - } - else { + } else { jobs.put(job, frame.getMaxRss()); } } - for (Map.Entry set: jobs.entrySet()) { + for (Map.Entry set : jobs.entrySet()) { jobDao.updateMaxRSS(set.getKey(), set.getValue()); } } @@ -906,24 +1218,23 @@ private void updateJobMemoryUsage(List frames) { * @param frames */ private void updateLayerMemoryUsage(List frames) { + final Map layers = new HashMap( + frames.size() + ); - final Map layers = - new HashMap(frames.size()); - - for (RunningFrameInfo frame: frames) { + for (RunningFrameInfo frame : frames) { LayerEntity layer = new LayerEntity(frame.getLayerId()); if (layers.containsKey(layer)) { if (layers.get(layer) < frame.getMaxRss()) { layers.put(layer, frame.getMaxRss()); } - } - else { + } else { layers.put(layer, frame.getMaxRss()); } } /* Attempt to update the max RSS value for the job **/ - for (Map.Entry set: layers.entrySet()) { + for (Map.Entry set : layers.entrySet()) { layerDao.increaseLayerMinMemory(set.getKey(), set.getValue()); layerDao.updateLayerMaxRSS(set.getKey(), set.getValue(), false); } @@ -951,24 +1262,38 @@ private void updateLayerMemoryUsage(List frames) { * @param report */ public List verifyRunningFrameInfo(HostReport report) { - List runningFrames = new ArrayList(report.getFramesCount()); - - for (RunningFrameInfo runningFrame: report.getFramesList()) { + List runningFrames = new ArrayList( + report.getFramesCount() + ); - long runtimeSeconds = (System.currentTimeMillis() - - runningFrame.getStartTime()) / 1000l; + for (RunningFrameInfo runningFrame : report.getFramesList()) { + long runtimeSeconds = + (System.currentTimeMillis() - runningFrame.getStartTime()) / + 1000l; // Don't test frames that haven't been running long enough. if (runtimeSeconds < FRAME_VERIFICATION_GRACE_PERIOD_SECONDS) { - logger.info("verified " + runningFrame.getJobName() + - "/" + runningFrame.getFrameName() + " on " + - report.getHost().getName() + " by grace period " + - runtimeSeconds + " seconds."); + logger.info( + "verified " + + runningFrame.getJobName() + + "/" + + runningFrame.getFrameName() + + " on " + + report.getHost().getName() + + " by grace period " + + runtimeSeconds + + " seconds." + ); runningFrames.add(runningFrame); continue; } - if (hostManager.verifyRunningProc(runningFrame.getResourceId(), runningFrame.getFrameId())) { + if ( + hostManager.verifyRunningProc( + runningFrame.getResourceId(), + runningFrame.getFrameId() + ) + ) { runningFrames.add(runningFrame); continue; } @@ -984,11 +1309,14 @@ public List verifyRunningFrameInfo(HostReport report) { try { proc = hostManager.getVirtualProc(runningFrame.getResourceId()); - msg = "Virtual proc " + proc.getProcId() + - "is assigned to " + proc.getFrameId() + - " not " + runningFrame.getFrameId(); - } - catch (Exception e) { + msg = + "Virtual proc " + + proc.getProcId() + + "is assigned to " + + proc.getFrameId() + + " not " + + runningFrame.getFrameId(); + } catch (Exception e) { /* * This will happen if the host goes offline and then * comes back. In this case, we don't touch the frame @@ -1007,27 +1335,53 @@ public List verifyRunningFrameInfo(HostReport report) { if (proc == null) { // A frameCompleteReport might have been delivered before this report was // processed - FrameDetail frameLatestVersion = jobManager.getFrameDetail(runningFrame.getFrameId()); + FrameDetail frameLatestVersion = jobManager.getFrameDetail( + runningFrame.getFrameId() + ); if (frameLatestVersion.state != FrameState.RUNNING) { - logger.info("DelayedVerification, the proc " + - runningFrame.getResourceId() + " on host " + - report.getHost().getName() + " has already Completed " + - runningFrame.getJobName() + "/" + runningFrame.getFrameName()); - } else if (killFrame(runningFrame.getFrameId(), + logger.info( + "DelayedVerification, the proc " + + runningFrame.getResourceId() + + " on host " + + report.getHost().getName() + + " has already Completed " + + runningFrame.getJobName() + + "/" + + runningFrame.getFrameName() + ); + } else if ( + killFrame( + runningFrame.getFrameId(), report.getHost().getName(), - KillCause.FrameVerificationFailure)) { - logger.info("FrameVerificationError, the proc " + - runningFrame.getResourceId() + " on host " + - report.getHost().getName() + " was running for " + - (runtimeSeconds / 60.0f) + " minutes " + - runningFrame.getJobName() + "/" + runningFrame.getFrameName() + - " but the DB did not " + - "reflect this. " + - msg); + KillCause.FrameVerificationFailure + ) + ) { + logger.info( + "FrameVerificationError, the proc " + + runningFrame.getResourceId() + + " on host " + + report.getHost().getName() + + " was running for " + + (runtimeSeconds / 60.0f) + + " minutes " + + runningFrame.getJobName() + + "/" + + runningFrame.getFrameName() + + " but the DB did not " + + "reflect this. " + + msg + ); } else { - logger.warn("FrameStuckWarning: frameId=" + runningFrame.getFrameId() + - " render_node=" + report.getHost().getName() + " - " + - runningFrame.getJobName() + "/" + runningFrame.getFrameName()); + logger.warn( + "FrameStuckWarning: frameId=" + + runningFrame.getFrameId() + + " render_node=" + + report.getHost().getName() + + " - " + + runningFrame.getJobName() + + "/" + + runningFrame.getFrameName() + ); } } } @@ -1121,6 +1475,7 @@ public Dispatcher getLocalDispatcher() { public void setLocalDispatcher(Dispatcher localDispatcher) { this.localDispatcher = localDispatcher; } + public ThreadPoolExecutor getKillQueue() { return killQueue; } @@ -1129,4 +1484,3 @@ public void setKillQueue(ThreadPoolExecutor killQueue) { this.killQueue = killQueue; } } - diff --git a/cuegui/cuegui/AbstractDockWidget.py b/cuegui/cuegui/AbstractDockWidget.py index 0697662e3..c5059b2c3 100644 --- a/cuegui/cuegui/AbstractDockWidget.py +++ b/cuegui/cuegui/AbstractDockWidget.py @@ -57,12 +57,15 @@ def __init__(self, parent, name, area = QtCore.Qt.LeftDockWidgetArea): self.widget().setLayout(self.__layout) def closeEvent(self, event): + """Delete event and emit close signal""" del event self.closed.emit(self) def showEvent(self, event): + """Delete event and emit enabled signal""" del event self.enabled.emit() def layout(self): + """Returns the layout""" return self.__layout diff --git a/cuegui/cuegui/AbstractTreeWidget.py b/cuegui/cuegui/AbstractTreeWidget.py index eb748fa8a..6260ec669 100644 --- a/cuegui/cuegui/AbstractTreeWidget.py +++ b/cuegui/cuegui/AbstractTreeWidget.py @@ -117,6 +117,7 @@ def __init__(self, parent): self.setUpdateInterval(10) def closeEvent(self, event): + """Close Event""" if hasattr(self, '_timer'): self._timer.stop() del self._timer diff --git a/cuegui/cuegui/CreatorDialog.py b/cuegui/cuegui/CreatorDialog.py index 5d2e5e450..2e86c6b4a 100644 --- a/cuegui/cuegui/CreatorDialog.py +++ b/cuegui/cuegui/CreatorDialog.py @@ -63,6 +63,7 @@ def __init__(self, show=None, parent=None): layout.addRow('Burst:', self.burstBox) def create(self): + """Create Subscription""" try: showMap = dict(list(zip([s.data.name for s in self.__shows], self.__shows))) allocMap = dict(list(zip([a.data.name for a in self.__allocs], self.__allocs))) @@ -103,5 +104,6 @@ def __init__(self, show=None, parent=None): # pylint: enable=no-member def create(self): + """Create subscription""" self.__creator.create() self.close() diff --git a/cuegui/cuegui/CueJobMonitorTree.py b/cuegui/cuegui/CueJobMonitorTree.py index 7b47b1902..f7e41dfd6 100644 --- a/cuegui/cuegui/CueJobMonitorTree.py +++ b/cuegui/cuegui/CueJobMonitorTree.py @@ -264,9 +264,11 @@ def startDrag(self, dropActions): cuegui.Utils.startDrag(self, dropActions, self.selectedObjects()) def dragEnterEvent(self, event): + """Called after a drag event begins""" cuegui.Utils.dragEnterEvent(event) def dragMoveEvent(self, event): + """Called on a drag move event""" cuegui.Utils.dragMoveEvent(event) # Causes the list to scroll when dragging is over the top or bottom 20% @@ -288,6 +290,7 @@ def dragMoveEvent(self, event): self.verticalScrollBar().setValue(self.verticalScrollBar().value() + move) def dropEvent(self, event): + """Drop event action""" item = self.itemAt(event.pos()) if item and item.type() in (cuegui.Constants.TYPE_ROOTGROUP, cuegui.Constants.TYPE_GROUP): @@ -307,7 +310,7 @@ def dropEvent(self, event): % item.rpcObject.data.name, event_item=item, items=body_content, - dist_groups={}, + dst_groups={}, parent=self) dialog.exec_() @@ -482,6 +485,7 @@ def __processUpdateHandleNested(self, parent, groups): "Failed to create tree item. RootView might be closed", exc_info=True) def mouseDoubleClickEvent(self, event): + """Event triggered by a mouse click""" del event objects = self.selectedObjects() if objects: @@ -861,12 +865,14 @@ def __init__(self, title, text, event_item, items, dst_groups, _hlayout.addWidget(_btn_cancel) _vlayout.addLayout(_hlayout) + # pylint: disable=no-member self.connect(_btn_accept, QtCore.SIGNAL("clicked()"), self.move_items) self.connect(_btn_cancel, QtCore.SIGNAL("clicked()"), self.reject) + # pylint: enable=no-member def move_items(self): """Reparent jobs to new group""" diff --git a/cuegui/cuegui/CueStateBarWidget.py b/cuegui/cuegui/CueStateBarWidget.py index 90fd7d652..8a61bb3bf 100644 --- a/cuegui/cuegui/CueStateBarWidget.py +++ b/cuegui/cuegui/CueStateBarWidget.py @@ -57,8 +57,8 @@ def __init__(self, sourceTree, parent=None): self.__sourceTree = weakref.proxy(sourceTree) self.__colors = [] self.__baseColor = self.app.palette().color(QtGui.QPalette.Base) - self.__colorsLock = QtCore.QReadWriteLock() - self.__timer = QtCore.QTimer(self) + self.__colorsLock = QtCore.QReadWriteLock() # pylint: disable=no-member + self.__timer = QtCore.QTimer(self) # pylint: disable=no-member self.__lastUpdate = 0 self.__timer.timeout.connect(self.updateColors) # pylint: disable=no-member @@ -173,7 +173,7 @@ def updateColors(self): def __updateColors(self): """Calls __processUpdateColors in 1 second""" self.__lastUpdate = time.time() - QtCore.QTimer.singleShot(1000, self.__processUpdateColors) + QtCore.QTimer.singleShot(1000, self.__processUpdateColors) # pylint: disable=no-member def __processUpdateColors(self): """Updates the list of colors to display diff --git a/cuegui/cuegui/DependWizard.py b/cuegui/cuegui/DependWizard.py index 25de89944..76b38c2d8 100644 --- a/cuegui/cuegui/DependWizard.py +++ b/cuegui/cuegui/DependWizard.py @@ -383,12 +383,14 @@ def __msg(self): if item[1]: return "this %s" % item[0] + # pylint: disable=missing-function-docstring def initializePage(self): self.setSubTitle("What type of dependency would you like %s to have?" % self.__msg()) # it is not respecting or providing my size hints otherwise self.wizard().setMinimumSize(500, 500) + # pylint: disable=missing-function-docstring def validatePage(self): # pylint: disable=consider-using-dict-items for option in self.__options: @@ -436,6 +438,7 @@ def __init__(self, parent): self.__layerList = self._addListWidget(2, 0, QtWidgets.QAbstractItemView.MultiSelection) + # pylint: disable=missing-function-docstring def initializePage(self): self.wizard().layerOptions = self.wizard().jobs[0].getLayers() @@ -448,6 +451,7 @@ def initializePage(self): self.__layerList.item(num).setSelected( str(self.__layerList.item(num).text()) in self._getNames(self.wizard().onLayer)) + # pylint: disable=missing-function-docstring def validatePage(self): self.wizard().layers = [] for num in range(self.__layerList.count()): @@ -486,9 +490,11 @@ def __init__(self, parent): self.__frame = self._addLineEdit(1, 9, "1") self.registerField("frame", self.__frame) + # pylint: disable=missing-function-docstring def initializePage(self): QtWidgets.QWizardPage.initializePage(self) + # pylint: disable=missing-function-docstring def validatePage(self): frames = str(self.field("frame")) if frames: @@ -541,6 +547,7 @@ def filterJobs(self, text): [job for job in self.wizard().onJobOptions if re.search(str(text), job, re.IGNORECASE) and job not in exclude]) + # pylint: disable=missing-function-docstring def initializePage(self): # If the filter edit box is empty, populate it with SHOW-SHOT-USER_ # based on the first job selected to receive the dependency @@ -558,6 +565,7 @@ def initializePage(self): QtWidgets.QWizardPage.initializePage(self) + # pylint: disable=missing-function-docstring def validatePage(self): self.wizard().onJob = [] for num in range(self.__jobList.count()): @@ -596,6 +604,7 @@ def __init__(self, parent): self._addLabel("Depend on Layer:", 0, 0) self.__onLayerList = self._addListWidget(1, 0) + # pylint: disable=missing-function-docstring def initializePage(self): QtWidgets.QWizardPage.initializePage(self) @@ -620,6 +629,7 @@ def initializePage(self): self.__onLayerList.item(num).setSelected( str(self.__onLayerList.item(num).text()) in self._getNames(self.wizard().onLayer)) + # pylint: disable=missing-function-docstring def validatePage(self): self.wizard().onLayer = [] for num in range(self.__onLayerList.count()): @@ -660,9 +670,11 @@ def __init__(self, parent): self.setField("onFrame", "") + # pylint: disable=missing-function-docstring def initializePage(self): QtWidgets.QWizardPage.initializePage(self) + # pylint: disable=missing-function-docstring def validatePage(self): frames = str(self.field("onFrame")) if frames: @@ -700,6 +712,7 @@ def __init__(self, parent, jobs, layers, frames): self.setTitle("Confirmation") self.setSubTitle("Are you sure?") + # pylint: disable=missing-function-docstring def initializePage(self): self._removeAllWidgets() @@ -724,6 +737,7 @@ def initializePage(self): self._displayItems("Frame", self.wizard().onFrame, 9) # pylint: disable=too-many-nested-blocks + # pylint: disable=missing-function-docstring def validatePage(self): # Just names: jobs = self._getNames(self.wizard().jobs) diff --git a/cuegui/cuegui/FilterDialog.py b/cuegui/cuegui/FilterDialog.py index ab4d4d25b..9fb5018f5 100644 --- a/cuegui/cuegui/FilterDialog.py +++ b/cuegui/cuegui/FilterDialog.py @@ -856,6 +856,7 @@ def __init__(self, parent): QtWidgets.QComboBox.__init__(self, parent) def wheelEvent(self, event): + """Handle wheel scroll event""" event.ignore() class NoWheelDoubleSpinBox(QtWidgets.QDoubleSpinBox): @@ -865,6 +866,7 @@ def __init__(self, parent): QtWidgets.QDoubleSpinBox.__init__(self, parent) def wheelEvent(self, event): + """Handle wheel scroll event""" event.ignore() class NoWheelSpinBox(QtWidgets.QSpinBox): @@ -874,4 +876,5 @@ def __init__(self, parent): QtWidgets.QSpinBox.__init__(self, parent) def wheelEvent(self, event): + """Handle wheel scroll event""" event.ignore() diff --git a/cuegui/cuegui/FrameRangeSelection.py b/cuegui/cuegui/FrameRangeSelection.py index 003c4bc22..b074b50d0 100644 --- a/cuegui/cuegui/FrameRangeSelection.py +++ b/cuegui/cuegui/FrameRangeSelection.py @@ -157,6 +157,7 @@ def setSelectedFrameRange(self, selectedRange): # QT event handlers and implementation details below this line. def mousePressEvent(self, mouseEvent): + """Event triggered by a mouse click""" hitTime = self.__getTimeFromLocalPoint(mouseEvent.x()) if mouseEvent.buttons() & QtCore.Qt.LeftButton: @@ -164,6 +165,7 @@ def mousePressEvent(self, mouseEvent): self.__selectionRange = (hitTime, hitTime) def mouseMoveEvent(self, mouseEvent): + """Event triggered by a mouse movement""" self.__floatTime = None hitTime = self.__getTimeFromLocalPoint(mouseEvent.x()) @@ -181,6 +183,7 @@ def mouseMoveEvent(self, mouseEvent): self.update() def mouseReleaseEvent(self, mouseEvent): + """Event triggered when a mouse click is released""" if self.__double: self.__double = False self.setStartTime(self.__frameRange[0], True) @@ -198,10 +201,12 @@ def mouseReleaseEvent(self, mouseEvent): self.update() def mouseDoubleClickEvent(self, mouseEvent): + """Event triggered by a double click""" del mouseEvent self.__double = True def paintEvent(self, paintEvent): + """Paint event""" del paintEvent painter = QtGui.QPainter(self) self.__paintBackground(painter) @@ -217,15 +222,18 @@ def paintEvent(self, paintEvent): self.__paintEndTime(painter) def leaveEvent(self, event): + """Triggered at the end of any event""" del event self.__floatTime = None self.update() def __getTickAreaExtent(self): + """Return a QRect with the selectable area""" return QtCore.QRect( 10, -self.height() // 2, self.width() - self.__right_margin - 20, self.height()) def __getTickArea(self, time): + """Get a QRect with a tick area""" tickArea = self.__getTickAreaExtent() tickSpacing = ( float(self.__getTickAreaExtent().width()) / @@ -234,6 +242,7 @@ def __getTickArea(self, time): tickArea.top(), tickSpacing, tickArea.height()) def __getTimeFromLocalPoint(self, x): + """Get time from a local point""" tickSpacing = ( float(self.__getTickAreaExtent().width()) / max(1, (self.__frameRange[1] - self.__frameRange[0]))) diff --git a/cuegui/cuegui/GroupDialog.py b/cuegui/cuegui/GroupDialog.py index d5f26ac18..4e0491c5c 100644 --- a/cuegui/cuegui/GroupDialog.py +++ b/cuegui/cuegui/GroupDialog.py @@ -1,4 +1,3 @@ - # Copyright Contributors to the OpenCue Project # # Licensed under the Apache License, Version 2.0 (the "License"); @@ -155,6 +154,7 @@ def __createButtons(self, buttons, row, width): # pylint: enable=no-member def accept(self): + """Accept action""" __name = str(self._nameValue.text()) if not __name: return diff --git a/cuegui/cuegui/HostMonitor.py b/cuegui/cuegui/HostMonitor.py index c5b84491a..334e612eb 100644 --- a/cuegui/cuegui/HostMonitor.py +++ b/cuegui/cuegui/HostMonitor.py @@ -113,6 +113,7 @@ def __filterByHostNameSetup(self, layout): btn.setFocusPolicy(QtCore.Qt.NoFocus) btn.setFixedWidth(24) layout.addWidget(btn) + # pylint: disable=no-member QtCore.QObject.connect(btn, QtCore.SIGNAL('clicked()'), self.__filterByHostNameClear) @@ -149,6 +150,7 @@ def __filterAllocationSetup(self, layout): menu = QtWidgets.QMenu(self) btn.setMenu(menu) + # pylint: disable=no-member QtCore.QObject.connect(menu, QtCore.SIGNAL("triggered(QAction*)"), self.__filterAllocationHandle) @@ -210,12 +212,13 @@ def __filterHardwareStateSetup(self, layout): btn.setContentsMargins(0, 0, 0, 0) btn.setFlat(True) + # pylint: disable=no-member menu = QtWidgets.QMenu(self) btn.setMenu(menu) QtCore.QObject.connect(menu, QtCore.SIGNAL("triggered(QAction*)"), self.__filterHardwareStateHandle) - + # pylint: enable=no-member for item in ["Clear", None] + self.__filterHardwareStateList: if item: a = QtWidgets.QAction(menu) @@ -266,6 +269,7 @@ def __filterHardwareStateHandle(self, action): # Checkbox to toggle auto-refresh # ============================================================================== def __refreshToggleCheckBoxSetup(self, layout): + # pylint: disable=no-member checkBox = QtWidgets.QCheckBox("Auto-refresh", self) layout.addWidget(checkBox) if self.hostMonitorTree.enableRefresh: @@ -274,6 +278,7 @@ def __refreshToggleCheckBoxSetup(self, layout): QtCore.SIGNAL('stateChanged(int)'), self.__refreshToggleCheckBoxHandle) __refreshToggleCheckBoxCheckBox = checkBox + # pylint: enable=no-member def __refreshToggleCheckBoxHandle(self, state): self.hostMonitorTree.enableRefresh = bool(state) @@ -300,7 +305,7 @@ def __refreshButtonEnableHandle(self): def __refreshButtonDisableHandle(self): """Called when the refresh button should be disabled""" self.btn_refresh.setEnabled(False) - QtCore.QTimer.singleShot(5000, self.__refreshButtonEnableHandle) + QtCore.QTimer.singleShot(5000, self.__refreshButtonEnableHandle) # pylint: disable=no-member # ============================================================================== # Button to clear all filters diff --git a/cuegui/cuegui/HostMonitorTree.py b/cuegui/cuegui/HostMonitorTree.py index a7c63147f..b504e8778 100644 --- a/cuegui/cuegui/HostMonitorTree.py +++ b/cuegui/cuegui/HostMonitorTree.py @@ -284,9 +284,11 @@ def startDrag(self, dropActions): cuegui.Utils.startDrag(self, dropActions, self.selectedObjects()) def dragEnterEvent(self, event): + """Enter drag event""" cuegui.Utils.dragEnterEvent(event, "application/x-host-ids") def dragMoveEvent(self, event): + """Move drag event""" cuegui.Utils.dragMoveEvent(event, "application/x-host-ids") diff --git a/cuegui/cuegui/ItemDelegate.py b/cuegui/cuegui/ItemDelegate.py index a91f16b4f..48c828e66 100644 --- a/cuegui/cuegui/ItemDelegate.py +++ b/cuegui/cuegui/ItemDelegate.py @@ -68,6 +68,7 @@ def __init__(self, parent, *args): QtWidgets.QItemDelegate.__init__(self, parent, *args) def paint(self, painter, option, index): + """Paint QItem""" if option.state & QtWidgets.QStyle.State_Selected: # If selected cell self._paintSelected(painter, option, index) @@ -476,6 +477,7 @@ def paint(self, painter, option, index): AbstractDelegate.paint(self, painter, option, index) def sizeHint(self, option, index): + """Delete both option and index and return a new qsize""" del option del index - return QtCore.QSize(12, 12) + return QtCore.QSize(12, 12) # pylint: disable=no-member diff --git a/cuegui/cuegui/JobMonitorTree.py b/cuegui/cuegui/JobMonitorTree.py index 7a2946794..d520c6d52 100644 --- a/cuegui/cuegui/JobMonitorTree.py +++ b/cuegui/cuegui/JobMonitorTree.py @@ -249,15 +249,19 @@ def __itemSingleClickedComment(self, item, col): self.__menuActions.jobs().viewComments([job]) def startDrag(self, dropActions): + """Triggers a drag event""" cuegui.Utils.startDrag(self, dropActions, self.selectedObjects()) def dragEnterEvent(self, event): + """Enter Drag event""" cuegui.Utils.dragEnterEvent(event) def dragMoveEvent(self, event): + """Move Drag Event""" cuegui.Utils.dragMoveEvent(event) def dropEvent(self, event): + """Drop Drag Event""" for job_name in cuegui.Utils.dropEvent(event): self.addJob(job_name) diff --git a/cuegui/cuegui/LayerDialog.py b/cuegui/cuegui/LayerDialog.py index aed2f740c..8686ce17e 100644 --- a/cuegui/cuegui/LayerDialog.py +++ b/cuegui/cuegui/LayerDialog.py @@ -534,5 +534,6 @@ def __init__(self, layers, parent=None): # pylint: enable=no-member def accept(self): + """Accept action""" self._tags_widget.apply() self.close() diff --git a/cuegui/cuegui/Layout.py b/cuegui/cuegui/Layout.py index 9b26d23c8..b12de3c5f 100644 --- a/cuegui/cuegui/Layout.py +++ b/cuegui/cuegui/Layout.py @@ -41,7 +41,7 @@ def startup(app_name): """ # E.g. ~/.config/.cuecommander/config.ini config_path = "/.%s/config" % app_name.lower() - settings = QtCore.QSettings(QtCore.QSettings.IniFormat, QtCore.QSettings.UserScope, config_path) + settings = QtCore.QSettings(QtCore.QSettings.IniFormat, QtCore.QSettings.UserScope, config_path) # pylint: disable=no-member logger.info('Reading config file from %s', settings.fileName()) local = settings.fileName() diff --git a/cuegui/cuegui/LimitsWidget.py b/cuegui/cuegui/LimitsWidget.py index 82f236342..833f06a58 100644 --- a/cuegui/cuegui/LimitsWidget.py +++ b/cuegui/cuegui/LimitsWidget.py @@ -148,7 +148,7 @@ def contextMenuEvent(self, e): menu.addSeparator() self.__menuActions.limits().addAction(menu, "delete") self.__menuActions.limits().addAction(menu, "rename") - menu.exec_(QtCore.QPoint(e.globalX(), e.globalY())) + menu.exec_(QtCore.QPoint(e.globalX(), e.globalY())) # pylint: disable=no-member def tick(self): pass diff --git a/cuegui/cuegui/MainWindow.py b/cuegui/cuegui/MainWindow.py index a27990cfd..14450aeeb 100644 --- a/cuegui/cuegui/MainWindow.py +++ b/cuegui/cuegui/MainWindow.py @@ -446,6 +446,7 @@ def __toggleFullscreen(self): ################################################################################ def keyPressEvent(self, event): + """Handle keys being pressed""" if event.key() == QtCore.Qt.Key_Space: self.app.request_update.emit() event.accept() diff --git a/cuegui/cuegui/PreviewWidget.py b/cuegui/cuegui/PreviewWidget.py index 6e109bd01..a49b17de3 100644 --- a/cuegui/cuegui/PreviewWidget.py +++ b/cuegui/cuegui/PreviewWidget.py @@ -167,6 +167,7 @@ def __findHttpPort(self): raise Exception("This frame doesn't support previews. No Preview Server found.") +# pylint: disable=no-member class PreviewProcessorWatchThread(QtCore.QThread): """ Waits for preview files to appear and emits the progress every second. This diff --git a/cuegui/cuegui/Redirect.py b/cuegui/cuegui/Redirect.py index 1476b1ad2..3b8d4b936 100644 --- a/cuegui/cuegui/Redirect.py +++ b/cuegui/cuegui/Redirect.py @@ -892,7 +892,7 @@ class ProxyModel(QtCore.QSortFilterProxyModel): """Provides support for sorting data passed between the model and the tree view""" def lessThan(self, left, right): - + """Handle sorting comparison""" leftData = self.sourceModel().data(left) rightData = self.sourceModel().data(right) diff --git a/cuegui/cuegui/ServiceDialog.py b/cuegui/cuegui/ServiceDialog.py index 5ca292262..20d959f70 100644 --- a/cuegui/cuegui/ServiceDialog.py +++ b/cuegui/cuegui/ServiceDialog.py @@ -232,10 +232,10 @@ def __init__(self, show, parent=None): self.__btn_del.clicked.connect(self.delService) self.__form.saved.connect(self.saved) self.__service_list.currentItemChanged.connect(self.selected) - # pylint: enable=no-member self.refresh() self.__service_list.setCurrentRow(0, QtCore.QItemSelectionModel.Select) + # pylint: enable=no-member def selected(self, item, old_item): """ @@ -287,7 +287,7 @@ def saved(self, service): item = self.__service_list.item(i) if item: if str(item.text()) == service.name(): - self.__service_list.setCurrentRow(i, QtCore.QItemSelectionModel.Select) + self.__service_list.setCurrentRow(i, QtCore.QItemSelectionModel.Select) # pylint: disable=no-member break def refresh(self): @@ -331,7 +331,7 @@ def delService(self): self.__selected.delete() row = self.currentRow() if row >= 1: - self.__service_list.setCurrentRow(row - 1, QtCore.QItemSelectionModel.Select) + self.__service_list.setCurrentRow(row - 1, QtCore.QItemSelectionModel.Select) # pylint: disable=no-member self.refresh() def currentRow(self): diff --git a/cuegui/cuegui/ShowsWidget.py b/cuegui/cuegui/ShowsWidget.py index 8d24b7ae7..db6fcda85 100644 --- a/cuegui/cuegui/ShowsWidget.py +++ b/cuegui/cuegui/ShowsWidget.py @@ -105,7 +105,7 @@ def contextMenuEvent(self, e): menu.addSeparator() self.__menuActions.shows().addAction(menu, "createSubscription") - menu.exec_(QtCore.QPoint(e.globalX(), e.globalY())) + menu.exec_(QtCore.QPoint(e.globalX(), e.globalY())) # pylint: disable=no-member def tick(self): pass diff --git a/cuegui/cuegui/SubscriptionGraphWidget.py b/cuegui/cuegui/SubscriptionGraphWidget.py index b17004d11..498e93a68 100644 --- a/cuegui/cuegui/SubscriptionGraphWidget.py +++ b/cuegui/cuegui/SubscriptionGraphWidget.py @@ -42,7 +42,7 @@ def __init__(self, parent): self.__shows = [] self.__showMenuActions = {} self.__subBars = [] - self.__timer = QtCore.QTimer(self) + self.__timer = QtCore.QTimer(self) # pylint: disable=no-member self.__timer.timeout.connect(self.update_data) # pylint: disable=no-member self.__timer.setInterval(1000 * 5) @@ -230,7 +230,7 @@ def contextMenuEvent(self, e): new_action = QtWidgets.QAction('Add new subscription', self) new_action.triggered.connect(self.createSubscription) # pylint: disable=no-member menu.addAction(new_action) - menu.exec_(QtCore.QPoint(e.globalX(),e.globalY())) + menu.exec_(QtCore.QPoint(e.globalX(),e.globalY())) # pylint: disable=no-member def createSubscription(self): """Shows a dialog for creating a new subscription.""" diff --git a/cuegui/cuegui/SubscriptionsWidget.py b/cuegui/cuegui/SubscriptionsWidget.py index eb474e074..58c2158e0 100644 --- a/cuegui/cuegui/SubscriptionsWidget.py +++ b/cuegui/cuegui/SubscriptionsWidget.py @@ -243,7 +243,7 @@ def contextMenuEvent(self, e): self.__menuActions.subscriptions().addAction(menu, "editBurst") menu.addSeparator() self.__menuActions.subscriptions().addAction(menu, "delete") - menu.exec_(QtCore.QPoint(e.globalX(),e.globalY())) + menu.exec_(QtCore.QPoint(e.globalX(),e.globalY())) # pylint: disable=no-member def tick(self): pass diff --git a/cuegui/cuegui/ThreadPool.py b/cuegui/cuegui/ThreadPool.py index 8a615ee6c..c0352c1f9 100644 --- a/cuegui/cuegui/ThreadPool.py +++ b/cuegui/cuegui/ThreadPool.py @@ -68,6 +68,7 @@ def systemCpuCount(): return 1 +# pylint: disable=no-member class ThreadPool(QtCore.QObject): """A general purpose work queue class.""" @@ -140,6 +141,7 @@ def __init__(self, name, parent): self.__running = False # pylint: disable=protected-access + # pylint: disable=missing-function-docstring def run(self): self.__running = True while self.__running: diff --git a/cuegui/cuegui/UnbookDialog.py b/cuegui/cuegui/UnbookDialog.py index 334c43909..618427200 100644 --- a/cuegui/cuegui/UnbookDialog.py +++ b/cuegui/cuegui/UnbookDialog.py @@ -195,6 +195,7 @@ def _convert(val): return [result] def accept(self): + """Accept Unbook action""" if not self.__jobs: self.close() diff --git a/cuegui/cuegui/plugins/AllocationsPlugin.py b/cuegui/cuegui/plugins/AllocationsPlugin.py index cc8273c25..1bf8ce3ec 100644 --- a/cuegui/cuegui/plugins/AllocationsPlugin.py +++ b/cuegui/cuegui/plugins/AllocationsPlugin.py @@ -161,12 +161,15 @@ def contextMenuEvent(self, e): """When right clicking on an item, this raises a context menu""" def dragEnterEvent(self, event): + """Drag enter event""" cuegui.Utils.dragEnterEvent(event, "application/x-host-ids") def dragMoveEvent(self, event): + """Drag move event""" cuegui.Utils.dragMoveEvent(event, "application/x-host-ids") def dropEvent(self, event): + """Drop event""" item = self.itemAt(event.pos()) if item.type() == cuegui.Constants.TYPE_ALLOC: @@ -181,8 +184,7 @@ def dropEvent(self, event): self.updateSoon() def tick(self): - # tick is unused in this widget - pass + """no-op""" class AllocationWidgetItem(cuegui.AbstractWidgetItem.AbstractWidgetItem): diff --git a/cuegui/cuegui/plugins/LogViewPlugin.py b/cuegui/cuegui/plugins/LogViewPlugin.py index a59f20251..aecaa24fe 100644 --- a/cuegui/cuegui/plugins/LogViewPlugin.py +++ b/cuegui/cuegui/plugins/LogViewPlugin.py @@ -339,6 +339,7 @@ def __init__(self, fn, *args, **kwargs): @QtCore.Slot() def run(self): + """Thread run action""" # pylint: disable=bare-except try: content, log_mtime = self.fn(*self.args, **self.kwargs) @@ -1000,6 +1001,7 @@ def __init__(self, parent=None): self.completeFormat.setForeground(cuegui.Style.ColorTheme.LOG_COMPLETE) def highlightBlock(self, text): + """Handle blocks that should be highlighted""" if not self.on: return diff --git a/cuegui/cuegui/plugins/MonitorJobDetailsPlugin.py b/cuegui/cuegui/plugins/MonitorJobDetailsPlugin.py index bb1b61d02..922a04140 100644 --- a/cuegui/cuegui/plugins/MonitorJobDetailsPlugin.py +++ b/cuegui/cuegui/plugins/MonitorJobDetailsPlugin.py @@ -100,12 +100,15 @@ def __splitterMoved(self, pos, index): self.__monitorLayers.disableUpdate = not bool(pos) def dragEnterEvent(self, event): + """Enter drag event handler""" cuegui.Utils.dragEnterEvent(event) def dragMoveEvent(self, event): + """Move drag event handler""" cuegui.Utils.dragMoveEvent(event) def dropEvent(self, event): + """Drop Event handler""" for jobName in cuegui.Utils.dropEvent(event): self.__setJob(jobName) diff --git a/cuegui/cuegui/plugins/MonitorJobsPlugin.py b/cuegui/cuegui/plugins/MonitorJobsPlugin.py index 744603088..c504ba957 100644 --- a/cuegui/cuegui/plugins/MonitorJobsPlugin.py +++ b/cuegui/cuegui/plugins/MonitorJobsPlugin.py @@ -351,6 +351,7 @@ def __init__(self, parent): self.setToolTip(toolTip) def contextMenuEvent(self, e): + """Handle context menu events""" menu = QtWidgets.QMenu(self) menu.addAction(cuegui.Action.create(self, diff --git a/cuegui/cuegui/plugins/StuckFramePlugin.py b/cuegui/cuegui/plugins/StuckFramePlugin.py index aff41339d..94f886447 100644 --- a/cuegui/cuegui/plugins/StuckFramePlugin.py +++ b/cuegui/cuegui/plugins/StuckFramePlugin.py @@ -767,6 +767,7 @@ def __init__(self, parent): self.jobs_created = {} self.groups_created = {} self.currentHosts = [] + self.show = None # Bring Up a comment if it exists self._itemSingleClickedComment.connect(self.__itemSingleClickedComment) @@ -1447,15 +1448,19 @@ def RemoveJob(self): self._processUpdate(None, self.currentHosts) def startDrag(self, dropActions): + """Drag start action""" cuegui.Utils.startDrag(self, dropActions, self.selectedObjects()) def dragEnterEvent(self, event): + """Drag enter action""" cuegui.Utils.dragEnterEvent(event, "application/x-host-ids") def dragMoveEvent(self, event): + """Drag move event""" cuegui.Utils.dragMoveEvent(event, "application/x-host-ids") def updateFilters(self, filters, show): + """Update filters""" self.showData = show self.show = show.data.name self.filters = filters diff --git a/cuesubmit/cuesubmit/ui/Submit.py b/cuesubmit/cuesubmit/ui/Submit.py index cd2cbc39f..adbac9c4b 100644 --- a/cuesubmit/cuesubmit/ui/Submit.py +++ b/cuesubmit/cuesubmit/ui/Submit.py @@ -211,6 +211,7 @@ def __init__( self.jobDataChanged() def showEvent(self, event): + """Show Event""" del event if self.startupErrors: diff --git a/cuesubmit/cuesubmit/ui/Widgets.py b/cuesubmit/cuesubmit/ui/Widgets.py index fb16400a9..443096344 100644 --- a/cuesubmit/cuesubmit/ui/Widgets.py +++ b/cuesubmit/cuesubmit/ui/Widgets.py @@ -164,10 +164,12 @@ def __init__(self, defaultText=None, completerStrings=None, parent=None): self.setStyleSheet(Style.LINE_EDIT) def focusInEvent(self, e): + """Event when in focus""" super(CueLineEdit, self).focusInEvent(e) self.focusChange.emit(True) def focusOutEvent(self, e): + """Event when out of focus""" super(CueLineEdit, self).focusOutEvent(e) self.focusChange.emit(False) From 471bc0fa3d9ba0843efecf30a15d858e301612d8 Mon Sep 17 00:00:00 2001 From: Jimmy Christensen Date: Thu, 28 Nov 2024 17:40:56 +0100 Subject: [PATCH 2/4] [cuebot] Convert null value from job.str_os to empty string in SQL (#1600) **Link the Issue(s) this Pull Request is related to.** #1591 **Summarize your change.** This is a different take on the MR #1594 which only changes the SQL queries instead of the Java code. --- .../com/imageworks/spcue/dao/postgres/DispatchQuery.java | 2 +- .../com/imageworks/spcue/dao/postgres/FrameDaoJdbc.java | 2 +- .../spcue/dao/postgres/NestedWhiteboardDaoJdbc.java | 2 +- .../java/com/imageworks/spcue/dao/postgres/ProcDaoJdbc.java | 6 +++--- 4 files changed, 6 insertions(+), 6 deletions(-) diff --git a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/DispatchQuery.java b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/DispatchQuery.java index fec2f47ac..010294323 100644 --- a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/DispatchQuery.java +++ b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/DispatchQuery.java @@ -530,7 +530,7 @@ private static final String replaceQueryForFifo(String query) { "str_user, " + "int_uid, " + "str_log_dir, " + - "str_os, " + + "COALESCE(str_os, '') AS str_os, " + "frame_name, " + "frame_state, " + "pk_frame, " + diff --git a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/FrameDaoJdbc.java b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/FrameDaoJdbc.java index 1703664c7..c25e00874 100644 --- a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/FrameDaoJdbc.java +++ b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/FrameDaoJdbc.java @@ -348,7 +348,7 @@ public DispatchFrame mapRow(ResultSet rs, int rowNum) throws SQLException { "job.str_user,"+ "job.int_uid,"+ "job.str_log_dir,"+ - "job.str_os,"+ + "COALESCE(str_os, '') AS str_os, " + "frame.str_name AS frame_name, "+ "frame.str_state AS frame_state, "+ "frame.pk_frame, "+ diff --git a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/NestedWhiteboardDaoJdbc.java b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/NestedWhiteboardDaoJdbc.java index 8c920c5a4..fdd147ca1 100644 --- a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/NestedWhiteboardDaoJdbc.java +++ b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/NestedWhiteboardDaoJdbc.java @@ -94,7 +94,7 @@ public CachedJobWhiteboardMapper(NestedJobWhiteboardMapper result) { "job.b_paused, " + "job.b_autoeat, " + "job.b_comment, " + - "job.str_os, " + + "COALESCE(str_os, '') AS str_os, " + "job.int_frame_count, " + "job.int_layer_count, " + "job_stat.int_waiting_count, " + diff --git a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/ProcDaoJdbc.java b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/ProcDaoJdbc.java index 2a597cfeb..0e24ed1c8 100644 --- a/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/ProcDaoJdbc.java +++ b/cuebot/src/main/java/com/imageworks/spcue/dao/postgres/ProcDaoJdbc.java @@ -356,7 +356,7 @@ public VirtualProc mapRow(ResultSet rs, int rowNum) throws SQLException { "proc.int_virt_max_used,"+ "proc.int_virt_used,"+ "host.str_name AS host_name, " + - "job.str_os " + + "COALESCE(job.str_os, '') AS str_os " + "FROM " + "proc, " + "job, " + @@ -389,7 +389,7 @@ public VirtualProc findVirtualProc(FrameInterface frame) { "proc.*, " + "host.str_name AS host_name, " + "host.pk_alloc, " + - "job.str_os, " + + "COALESCE(job.str_os, '') AS str_os, " + "alloc.pk_facility " + "FROM " + "proc, " + @@ -530,7 +530,7 @@ public String getCurrentFrameId(ProcInterface p) { "SELECT " + "proc.*, " + "host.str_name AS host_name, " + - "job.str_os, " + + "COALESCE(job.str_os, '') AS str_os, " + "host.pk_alloc, " + "alloc.pk_facility " + "FROM " + From eb494e700591247a473f05564b6f81f1047e2f87 Mon Sep 17 00:00:00 2001 From: Anton Brand Date: Wed, 4 Dec 2024 14:06:24 -0500 Subject: [PATCH 3/4] [RQD] Fix core detection on Windows platforms (#1468) **Link the Issue(s) this Pull Request is related to.** #1469 **Summarize your change.** Fix an error on Windows platforms where a submitted job could not be picked up properly due to available processors incorrect detection. The `reserveHT` method of the RQD `Machine` class relies on a `__procs_by_physid_and_coreid` attribute that is not correctly filled when on a Windows platform. See: - `reserveHT` relying on `__procs_by_physid_and_coreid`: https://github.com/AcademySoftwareFoundation/OpenCue/blob/master/rqd/rqd/rqmachine.py#L842 - `__procs_by_physid_and_coreid` being filled only if on a Linux platform: https://github.com/AcademySoftwareFoundation/OpenCue/blob/master/rqd/rqd/rqmachine.py#L613 --------- Signed-off-by: Diego Tavares Co-authored-by: Diego Tavares Co-authored-by: Kern Attila GERMAIN <5556461+KernAttila@users.noreply.github.com> --- rqd/rqd/rqmachine.py | 75 +++++++++++++++++++++++++++++++++++--------- rqd/setup.py | 3 +- 2 files changed, 63 insertions(+), 15 deletions(-) diff --git a/rqd/rqd/rqmachine.py b/rqd/rqd/rqmachine.py index a6d9a6317..8694afee4 100644 --- a/rqd/rqd/rqmachine.py +++ b/rqd/rqd/rqmachine.py @@ -670,20 +670,8 @@ def __initMachineStats(self, pathCpuInfo=None): hyperthreadingMultiplier = 1 if platform.system() == 'Windows': - # Windows memory information - stat = self.getWindowsMemory() - TEMP_DEFAULT = 1048576 - self.__renderHost.total_mcp = TEMP_DEFAULT - self.__renderHost.total_mem = int(stat.ullTotalPhys / 1024) - self.__renderHost.total_swap = int(stat.ullTotalPageFile / 1024) - - # Windows CPU information - logical_core_count = psutil.cpu_count(logical=True) - actual_core_count = psutil.cpu_count(logical=False) - hyperthreadingMultiplier = logical_core_count // actual_core_count - - __totalCores = logical_core_count * rqd.rqconstants.CORE_VALUE - __numProcs = 1 # TODO: figure out how to count sockets in Python + logicalCoreCount, __numProcs, hyperthreadingMultiplier = self.__initStatsFromWindows() + __totalCores = logicalCoreCount * rqd.rqconstants.CORE_VALUE # All other systems will just have one proc/core if not __numProcs or not __totalCores: @@ -713,6 +701,65 @@ def __initMachineStats(self, pathCpuInfo=None): if hyperthreadingMultiplier >= 1: self.__renderHost.attributes['hyperthreadingMultiplier'] = str(hyperthreadingMultiplier) + def __initStatsFromWindows(self): + """Init machine stats for Windows platforms. + + @rtype: tuple + @return: A 3-items tuple containing: + - the number of logical cores + - the number of physical processors + - the hyper-threading multiplier + """ + # Windows memory information + stat = self.getWindowsMemory() + TEMP_DEFAULT = 1048576 + self.__renderHost.total_mcp = TEMP_DEFAULT + self.__renderHost.total_mem = int(stat.ullTotalPhys / 1024) + self.__renderHost.total_swap = int(stat.ullTotalPageFile / 1024) + + # Windows CPU information + self.__updateProcsMappingsFromWindows() + + logicalCoreCount = psutil.cpu_count(logical=True) + actualCoreCount = psutil.cpu_count(logical=False) + hyperThreadingMultiplier = logicalCoreCount // actualCoreCount + + physicalProcessorCount = len(self.__procs_by_physid_and_coreid) + + return logicalCoreCount, physicalProcessorCount, hyperThreadingMultiplier + + def __updateProcsMappingsFromWindows(self): + """ + Update `__procs_by_physid_and_coreid` and `__physid_and_coreid_by_proc` mappings + for Windows platforms. + """ + # Windows-specific + import wmi # pylint:disable=import-outside-toplevel,import-error + + # Reset mappings + self.__procs_by_physid_and_coreid = {} + self.__physid_and_coreid_by_proc = {} + + # Connect to the Windows Management Instrumentation (WMI) interface + wmiInstance = wmi.WMI() + + # Retrieve CPU information using WMI + for physicalId, processor in enumerate(wmiInstance.Win32_Processor()): + + threadPerCore = processor.NumberOfLogicalProcessors // processor.NumberOfCores + procId = 0 + + for coreId in range(processor.NumberOfCores): + for _ in range(threadPerCore): + self.__procs_by_physid_and_coreid.setdefault( + str(physicalId), {} + ).setdefault(str(coreId), set()).add(str(procId)) + self.__physid_and_coreid_by_proc[str(procId)] = ( + str(physicalId), + str(coreId), + ) + procId += 1 + def getWindowsMemory(self): """Gets information on system memory, Windows compatible version.""" # From diff --git a/rqd/setup.py b/rqd/setup.py index a9735b142..69c88c706 100644 --- a/rqd/setup.py +++ b/rqd/setup.py @@ -59,7 +59,8 @@ 'grpcio', 'grpcio-tools', 'psutil', - 'pywin32; platform_system == "Windows"' + 'pywin32==224; platform_system == "Windows"', + 'wmi==1.5.1; platform_system == "Windows"' ] ) From 33bde086c1fa6ac2d53563799347edb0fbe95990 Mon Sep 17 00:00:00 2001 From: Nuwan Jayawardene Date: Thu, 5 Dec 2024 01:08:35 +0530 Subject: [PATCH 4/4] [integration-test] [ci/cd] Fix install-client-sources script (#1588) **Link the Issue(s) this Pull Request is related to.** N/A **Summarize your change.** Fixes broken filepath of ci/fix_compiled_proto.py directory. Identified as it broke the integration test script. --- sandbox/install-client-sources.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/sandbox/install-client-sources.sh b/sandbox/install-client-sources.sh index 80ed1f39e..2ce711681 100755 --- a/sandbox/install-client-sources.sh +++ b/sandbox/install-client-sources.sh @@ -10,7 +10,7 @@ python -m grpc_tools.protoc -I=. \ --python_out=../pycue/opencue/compiled_proto \ --grpc_python_out=../pycue/opencue/compiled_proto ./*.proto cd .. -python ../ci/fix_compiled_proto.py pycue/opencue/compiled_proto +python ci/fix_compiled_proto.py pycue/opencue/compiled_proto # Install all client packages. pip install pycue/ pyoutline/ cueadmin/ cuesubmit/ cuegui/