You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ignite.apache.org by il...@apache.org on 2020/02/20 13:59:52 UTC

[ignite] branch master updated: IGNITE-12697 More detailed YARN log when checking container - Fixes #7437.

This is an automated email from the ASF dual-hosted git repository.

ilyak pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/ignite.git


The following commit(s) were added to refs/heads/master by this push:
     new 6eaa1dd  IGNITE-12697 More detailed YARN log when checking container - Fixes #7437.
6eaa1dd is described below

commit 6eaa1dd14003ef312a25163d1dcc38c446adb3ad
Author: Valeriy Shinkevich <v....@gmail.com>
AuthorDate: Thu Feb 20 16:56:51 2020 +0300

    IGNITE-12697 More detailed YARN log when checking container - Fixes #7437.
    
    Signed-off-by: Ilya Kasnacheev <il...@gmail.com>
---
 .../org/apache/ignite/yarn/ApplicationMaster.java  | 25 ++++++++++++++++------
 1 file changed, 19 insertions(+), 6 deletions(-)

diff --git a/modules/yarn/src/main/java/org/apache/ignite/yarn/ApplicationMaster.java b/modules/yarn/src/main/java/org/apache/ignite/yarn/ApplicationMaster.java
index f42edb1..886f2d7 100644
--- a/modules/yarn/src/main/java/org/apache/ignite/yarn/ApplicationMaster.java
+++ b/modules/yarn/src/main/java/org/apache/ignite/yarn/ApplicationMaster.java
@@ -110,6 +110,8 @@ public class ApplicationMaster implements AMRMClientAsync.CallbackHandler {
     @Override public synchronized void onContainersAllocated(List<Container> conts) {
         for (Container c : conts) {
             if (checkContainer(c)) {
+                log.log(Level.INFO, "Container {0} allocated", c.getId());
+
                 try {
                     ContainerLaunchContext ctx = Records.newRecord(ContainerLaunchContext.class);
 
@@ -174,8 +176,11 @@ public class ApplicationMaster implements AMRMClientAsync.CallbackHandler {
                     log.log(Level.WARNING, "Error launching container " + c.getId(), ex);
                 }
             }
-            else
+            else {
+                log.log(Level.WARNING, "Container {0} check failed. Releasing...", c.getId());
+
                 rmClient.releaseAssignedContainer(c.getId());
+            }
         }
     }
 
@@ -185,20 +190,28 @@ public class ApplicationMaster implements AMRMClientAsync.CallbackHandler {
      */
     private boolean checkContainer(Container cont) {
         // Check limit on running nodes.
-        if (props.instances() <= containers.size())
+        if (props.instances() <= containers.size()) {
+            log.log(Level.WARNING, "Limit on running nodes exceeded. ({0} of {1} max)",
+                new Object[] {containers.size(), props.instances()});
+
             return false;
+        }
 
         // Check host name
         if (props.hostnameConstraint() != null
-                && props.hostnameConstraint().matcher(cont.getNodeId().getHost()).matches())
+                && props.hostnameConstraint().matcher(cont.getNodeId().getHost()).matches()) {
+            log.log(Level.WARNING, "Wrong host name '{0}'. It didn't match to '{1}' pattern.",
+                new Object[] {cont.getNodeId().getHost(), props.hostnameConstraint().toString()});
+
             return false;
+        }
 
         // Check that slave satisfies min requirements.
         if (cont.getResource().getVirtualCores() < props.cpusPerNode()
             || cont.getResource().getMemory() < props.totalMemoryPerNode()) {
-            log.log(Level.FINE, "Container resources not sufficient requirements. Host: {0}, cpu: {1}, mem: {2}",
-                new Object[]{cont.getNodeId().getHost(), cont.getResource().getVirtualCores(),
-                   cont.getResource().getMemory()});
+            log.log(Level.WARNING, "Container resources not sufficient requirements. Host: {0}, cpu: {1}, mem: {2}",
+                new Object[] {cont.getNodeId().getHost(), cont.getResource().getVirtualCores(),
+                cont.getResource().getMemory()});
 
             return false;
         }