diff --git a/docker/kubernetes/dolphinscheduler/values.yaml b/docker/kubernetes/dolphinscheduler/values.yaml index 52431f9cad..d87f09e34a 100644 --- a/docker/kubernetes/dolphinscheduler/values.yaml +++ b/docker/kubernetes/dolphinscheduler/values.yaml @@ -104,6 +104,9 @@ common: HIVE_HOME: "/opt/soft/hive" FLINK_HOME: "/opt/soft/flink" DATAX_HOME: "/opt/soft/datax" + SESSION_TIMEOUT_MS: 60000 + ORG_QUARTZ_THREADPOOL_THREADCOUNT: "25" + ORG_QUARTZ_SCHEDULER_BATCHTRIGGERACQUISTITIONMAXCOUNT: "1" ## Shared storage persistence mounted into api, master and worker, such as Hadoop, Spark, Flink and DataX binary package sharedStoragePersistence: enabled: false @@ -165,7 +168,6 @@ master: MASTER_KILL_YARN_JOB_WHEN_HANDLE_FAILOVER: "true" ORG_QUARTZ_THREADPOOL_THREADCOUNT: "25" ORG_QUARTZ_SCHEDULER_BATCHTRIGGERACQUISTITIONMAXCOUNT: "1" - SESSION_TIMEOUT_MS: 60000 MASTER_PERSIST_EVENT_STATE_THREADS: 10 ## Periodic probe of container liveness. Container will be restarted if the probe fails. Cannot be updated. ## More info: https://kubernetes.io/docs/concepts/workloads/pods/pod-lifecycle#container-probes @@ -234,7 +236,6 @@ worker: WORKER_MAX_CPULOAD_AVG: "-1" WORKER_RESERVED_MEMORY: "0.3" WORKER_GROUPS: "default" - SESSION_TIMEOUT_MS: 60000 WORKER_RETRY_REPORT_TASK_STATUS_INTERVAL: 600 ## Periodic probe of container liveness. Container will be restarted if the probe fails. Cannot be updated. ## More info: https://kubernetes.io/docs/concepts/workloads/pods/pod-lifecycle#container-probes diff --git a/dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/registry/WorkerRegistryClient.java b/dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/registry/WorkerRegistryClient.java index 326fcb2bb6..74af482e5b 100644 --- a/dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/registry/WorkerRegistryClient.java +++ b/dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/registry/WorkerRegistryClient.java @@ -133,14 +133,13 @@ public class WorkerRegistryClient { public void handleConnectionState(ConnectionState state) { switch (state) { case CONNECTED: - logger.info("registry connection state is {}", state); + logger.debug("registry connection state is {}", state); break; case SUSPENDED: - logger.info("registry connection state is {}, ready to stop myself", state); - registryClient.getStoppable().stop("registry connection state is SUSPENDED, stop myself"); + logger.warn("registry connection state is {}, ready to retry connection", state); break; case RECONNECTED: - logger.info("registry connection state is {}, clean the node info", state); + logger.debug("registry connection state is {}, clean the node info", state); String address = NetUtils.getAddr(workerConfig.getListenPort()); Set workerZkPaths = getWorkerZkPaths(); for (String workerZKPath : workerZkPaths) { @@ -149,7 +148,7 @@ public class WorkerRegistryClient { } break; case DISCONNECTED: - logger.info("registry connection state is {}, ready to stop myself", state); + logger.warn("registry connection state is {}, ready to stop myself", state); registryClient.getStoppable().stop("registry connection state is DISCONNECTED, stop myself"); break; default: