Browse Source

[Improvement][Worker] Task log may be lost #5775 (#5907)

Wenjun Ruan 3 years ago committed by GitHub
parent
commit
f40e795f10
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
  1. 5
      dolphinscheduler-common/src/main/java/org/apache/dolphinscheduler/common/Constants.java
  2. 63
      dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/AbstractCommandExecutor.java
  3. 25
      dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/AbstractTask.java
  4. 3
      dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/PythonCommandExecutor.java
  5. 4
      dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/ShellCommandExecutor.java
  6. 41
      dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/sql/SqlTask.java
  7. 23
      dolphinscheduler-server/src/test/java/org/apache/dolphinscheduler/server/worker/task/sqoop/SqoopTaskTest.java

5
dolphinscheduler-common/src/main/java/org/apache/dolphinscheduler/common/Constants.java

@ -388,6 +388,11 @@ public final class Constants {
*/ */
public static final int DEFAULT_LOG_FLUSH_INTERVAL = 1000; public static final int DEFAULT_LOG_FLUSH_INTERVAL = 1000;
/**
* default log buffer size in AbstractCommandExecutor
*/
public static final int DEFAULT_LOG_BUFFER_SIZE = 128;
/** /**
* time unit secong to minutes * time unit secong to minutes

63
dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/AbstractCommandExecutor.java

@ -41,6 +41,7 @@ import java.util.Collections;
import java.util.LinkedList; import java.util.LinkedList;
import java.util.List; import java.util.List;
import java.util.concurrent.ExecutorService; import java.util.concurrent.ExecutorService;
import java.util.concurrent.LinkedBlockingQueue;
import java.util.concurrent.TimeUnit; import java.util.concurrent.TimeUnit;
import java.util.function.Consumer; import java.util.function.Consumer;
import java.util.regex.Matcher; import java.util.regex.Matcher;
@ -67,7 +68,7 @@ public abstract class AbstractCommandExecutor {
/** /**
* log handler * log handler
*/ */
protected Consumer<List<String>> logHandler; protected Consumer<LinkedBlockingQueue<String>> logHandler;
/** /**
* logger * logger
@ -75,9 +76,9 @@ public abstract class AbstractCommandExecutor {
protected Logger logger; protected Logger logger;
/** /**
* log list * log collection
*/ */
protected final List<String> logBuffer; protected final LinkedBlockingQueue<String> logBuffer;
/** /**
* taskExecutionContext * taskExecutionContext
@ -92,13 +93,13 @@ public abstract class AbstractCommandExecutor {
*/ */
private TaskExecutionContextCacheManager taskExecutionContextCacheManager; private TaskExecutionContextCacheManager taskExecutionContextCacheManager;
public AbstractCommandExecutor(Consumer<List<String>> logHandler, public AbstractCommandExecutor(Consumer<LinkedBlockingQueue<String>> logHandler,
TaskExecutionContext taskExecutionContext , TaskExecutionContext taskExecutionContext,
Logger logger){ Logger logger) {
this.logHandler = logHandler; this.logHandler = logHandler;
this.taskExecutionContext = taskExecutionContext; this.taskExecutionContext = taskExecutionContext;
this.logger = logger; this.logger = logger;
this.logBuffer = Collections.synchronizedList(new ArrayList<>()); this.logBuffer = new LinkedBlockingQueue<>(Constants.DEFAULT_LOG_BUFFER_SIZE);
this.taskExecutionContextCacheManager = SpringApplicationContext.getBean(TaskExecutionContextCacheManagerImpl.class); this.taskExecutionContextCacheManager = SpringApplicationContext.getBean(TaskExecutionContextCacheManagerImpl.class);
} }
@ -331,15 +332,14 @@ public abstract class AbstractCommandExecutor {
*/ */
private void clear() { private void clear() {
List<String> markerList = new ArrayList<>(); LinkedBlockingQueue<String> markerLog = new LinkedBlockingQueue<>(1);
markerList.add(ch.qos.logback.classic.ClassicConstants.FINALIZE_SESSION_MARKER.toString()); markerLog.add(ch.qos.logback.classic.ClassicConstants.FINALIZE_SESSION_MARKER.toString());
if (!logBuffer.isEmpty()) { if (!logBuffer.isEmpty()) {
// log handle // log handle
logHandler.accept(logBuffer); logHandler.accept(logBuffer);
logBuffer.clear();
} }
logHandler.accept(markerList); logHandler.accept(markerLog);
} }
/** /**
@ -350,9 +350,7 @@ public abstract class AbstractCommandExecutor {
String threadLoggerInfoName = String.format(LoggerUtils.TASK_LOGGER_THREAD_NAME + "-%s", taskExecutionContext.getTaskAppId()); String threadLoggerInfoName = String.format(LoggerUtils.TASK_LOGGER_THREAD_NAME + "-%s", taskExecutionContext.getTaskAppId());
ExecutorService getOutputLogService = ThreadUtils.newDaemonSingleThreadExecutor(threadLoggerInfoName + "-" + "getOutputLogService"); ExecutorService getOutputLogService = ThreadUtils.newDaemonSingleThreadExecutor(threadLoggerInfoName + "-" + "getOutputLogService");
getOutputLogService.submit(() -> { getOutputLogService.submit(() -> {
BufferedReader inReader = null; try (BufferedReader inReader = new BufferedReader(new InputStreamReader(process.getInputStream()))) {
try {
inReader = new BufferedReader(new InputStreamReader(process.getInputStream()));
String line; String line;
while ((line = inReader.readLine()) != null) { while ((line = inReader.readLine()) != null) {
logBuffer.add(line); logBuffer.add(line);
@ -361,7 +359,6 @@ public abstract class AbstractCommandExecutor {
logger.error(e.getMessage(), e); logger.error(e.getMessage(), e);
} finally { } finally {
logOutputIsSuccess = true; logOutputIsSuccess = true;
close(inReader);
} }
}); });
getOutputLogService.shutdown(); getOutputLogService.shutdown();
@ -450,31 +447,20 @@ public abstract class AbstractCommandExecutor {
* @return line list * @return line list
*/ */
private List<String> convertFile2List(String filename) { private List<String> convertFile2List(String filename) {
List lineList = new ArrayList<String>(100); List<String> lineList = new ArrayList<>(100);
File file=new File(filename); File file = new File(filename);
if (!file.exists()){ if (!file.exists()){
return lineList; return lineList;
} }
BufferedReader br = null; try (BufferedReader br = new BufferedReader(new InputStreamReader(new FileInputStream(filename), StandardCharsets.UTF_8))) {
try {
br = new BufferedReader(new InputStreamReader(new FileInputStream(filename), StandardCharsets.UTF_8));
String line = null; String line = null;
while ((line = br.readLine()) != null) { while ((line = br.readLine()) != null) {
lineList.add(line); lineList.add(line);
} }
} catch (Exception e) { } catch (Exception e) {
logger.error(String.format("read file: %s failed : ",filename),e); logger.error(String.format("read file: %s failed : ", filename), e);
} finally {
if(br != null){
try {
br.close();
} catch (IOException e) {
logger.error(e.getMessage(),e);
}
}
} }
return lineList; return lineList;
} }
@ -551,27 +537,10 @@ public abstract class AbstractCommandExecutor {
lastFlushTime = now; lastFlushTime = now;
/** log handle */ /** log handle */
logHandler.accept(logBuffer); logHandler.accept(logBuffer);
logBuffer.clear();
} }
return lastFlushTime; return lastFlushTime;
} }
/**
* close buffer reader
*
* @param inReader in reader
*/
private void close(BufferedReader inReader) {
if (inReader != null) {
try {
inReader.close();
} catch (IOException e) {
logger.error(e.getMessage(), e);
}
}
}
protected List<String> commandOptions() { protected List<String> commandOptions() {
return Collections.emptyList(); return Collections.emptyList();
} }

25
dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/AbstractTask.java

@ -42,8 +42,9 @@ import org.apache.dolphinscheduler.server.utils.ParamUtils;
import org.apache.commons.lang.StringUtils; import org.apache.commons.lang.StringUtils;
import java.util.List;
import java.util.Map; import java.util.Map;
import java.util.StringJoiner;
import java.util.concurrent.LinkedBlockingQueue;
import org.slf4j.Logger; import org.slf4j.Logger;
@ -58,13 +59,13 @@ public abstract class AbstractTask {
TaskExecutionContext taskExecutionContext; TaskExecutionContext taskExecutionContext;
/** /**
* log record * log record
*/ */
protected Logger logger; protected Logger logger;
/** /**
* SHELL process pid * SHELL process pid
*/ */
protected int processId; protected int processId;
@ -80,14 +81,15 @@ public abstract class AbstractTask {
protected volatile boolean cancel = false; protected volatile boolean cancel = false;
/** /**
* exit code * exit code
*/ */
protected volatile int exitStatusCode = -1; protected volatile int exitStatusCode = -1;
/** /**
* constructor * constructor
*
* @param taskExecutionContext taskExecutionContext * @param taskExecutionContext taskExecutionContext
* @param logger logger * @param logger logger
*/ */
protected AbstractTask(TaskExecutionContext taskExecutionContext, Logger logger) { protected AbstractTask(TaskExecutionContext taskExecutionContext, Logger logger) {
this.taskExecutionContext = taskExecutionContext; this.taskExecutionContext = taskExecutionContext;
@ -96,6 +98,7 @@ public abstract class AbstractTask {
/** /**
* init task * init task
*
* @throws Exception exception * @throws Exception exception
*/ */
public void init() throws Exception { public void init() throws Exception {
@ -103,13 +106,14 @@ public abstract class AbstractTask {
/** /**
* task handle * task handle
*
* @throws Exception exception * @throws Exception exception
*/ */
public abstract void handle() throws Exception; public abstract void handle() throws Exception;
/** /**
* cancel application * cancel application
*
* @param status status * @param status status
* @throws Exception exception * @throws Exception exception
*/ */
@ -119,14 +123,19 @@ public abstract class AbstractTask {
/** /**
* log handle * log handle
*
* @param logs log list * @param logs log list
*/ */
public void logHandle(List<String> logs) { public void logHandle(LinkedBlockingQueue<String> logs) {
// note that the "new line" is added here to facilitate log parsing // note that the "new line" is added here to facilitate log parsing
if (logs.contains(FINALIZE_SESSION_MARKER.toString())) { if (logs.contains(FINALIZE_SESSION_MARKER.toString())) {
logger.info(FINALIZE_SESSION_MARKER, FINALIZE_SESSION_MARKER.toString()); logger.info(FINALIZE_SESSION_MARKER, FINALIZE_SESSION_MARKER.toString());
} else { } else {
logger.info(" -> {}", String.join("\n\t", logs)); StringJoiner joiner = new StringJoiner("\n\t");
while (!logs.isEmpty()) {
joiner.add(logs.poll());
}
logger.info(" -> {}", joiner);
} }
} }

3
dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/PythonCommandExecutor.java

@ -30,6 +30,7 @@ import java.nio.file.Paths;
import java.util.Collections; import java.util.Collections;
import java.util.Date; import java.util.Date;
import java.util.List; import java.util.List;
import java.util.concurrent.LinkedBlockingQueue;
import java.util.function.Consumer; import java.util.function.Consumer;
/** /**
@ -54,7 +55,7 @@ public class PythonCommandExecutor extends AbstractCommandExecutor {
* @param taskExecutionContext taskExecutionContext * @param taskExecutionContext taskExecutionContext
* @param logger logger * @param logger logger
*/ */
public PythonCommandExecutor(Consumer<List<String>> logHandler, public PythonCommandExecutor(Consumer<LinkedBlockingQueue<String>> logHandler,
TaskExecutionContext taskExecutionContext, TaskExecutionContext taskExecutionContext,
Logger logger) { Logger logger) {
super(logHandler,taskExecutionContext,logger); super(logHandler,taskExecutionContext,logger);

4
dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/ShellCommandExecutor.java

@ -26,7 +26,7 @@ import java.io.IOException;
import java.nio.charset.StandardCharsets; import java.nio.charset.StandardCharsets;
import java.nio.file.Files; import java.nio.file.Files;
import java.nio.file.Paths; import java.nio.file.Paths;
import java.util.List; import java.util.concurrent.LinkedBlockingQueue;
import java.util.function.Consumer; import java.util.function.Consumer;
/** /**
@ -50,7 +50,7 @@ public class ShellCommandExecutor extends AbstractCommandExecutor {
* @param taskExecutionContext taskExecutionContext * @param taskExecutionContext taskExecutionContext
* @param logger logger * @param logger logger
*/ */
public ShellCommandExecutor(Consumer<List<String>> logHandler, public ShellCommandExecutor(Consumer<LinkedBlockingQueue<String>> logHandler,
TaskExecutionContext taskExecutionContext, TaskExecutionContext taskExecutionContext,
Logger logger) { Logger logger) {
super(logHandler,taskExecutionContext,logger); super(logHandler,taskExecutionContext,logger);

41
dolphinscheduler-server/src/main/java/org/apache/dolphinscheduler/server/worker/task/sql/SqlTask.java

@ -16,9 +16,14 @@
*/ */
package org.apache.dolphinscheduler.server.worker.task.sql; package org.apache.dolphinscheduler.server.worker.task.sql;
import com.alibaba.fastjson.JSONArray; import static org.apache.dolphinscheduler.common.Constants.COMMA;
import com.alibaba.fastjson.JSONObject; import static org.apache.dolphinscheduler.common.Constants.HIVE_CONF;
import org.apache.commons.lang.StringUtils; import static org.apache.dolphinscheduler.common.Constants.PASSWORD;
import static org.apache.dolphinscheduler.common.Constants.SEMICOLON;
import static org.apache.dolphinscheduler.common.Constants.STATUS;
import static org.apache.dolphinscheduler.common.Constants.USER;
import static org.apache.dolphinscheduler.common.enums.DbType.HIVE;
import org.apache.dolphinscheduler.alert.utils.MailUtils; import org.apache.dolphinscheduler.alert.utils.MailUtils;
import org.apache.dolphinscheduler.common.Constants; import org.apache.dolphinscheduler.common.Constants;
import org.apache.dolphinscheduler.common.enums.CommandType; import org.apache.dolphinscheduler.common.enums.CommandType;
@ -30,7 +35,11 @@ import org.apache.dolphinscheduler.common.task.AbstractParameters;
import org.apache.dolphinscheduler.common.task.sql.SqlBinds; import org.apache.dolphinscheduler.common.task.sql.SqlBinds;
import org.apache.dolphinscheduler.common.task.sql.SqlParameters; import org.apache.dolphinscheduler.common.task.sql.SqlParameters;
import org.apache.dolphinscheduler.common.task.sql.SqlType; import org.apache.dolphinscheduler.common.task.sql.SqlType;
import org.apache.dolphinscheduler.common.utils.*; import org.apache.dolphinscheduler.common.utils.CollectionUtils;
import org.apache.dolphinscheduler.common.utils.CommonUtils;
import org.apache.dolphinscheduler.common.utils.EnumUtils;
import org.apache.dolphinscheduler.common.utils.JSONUtils;
import org.apache.dolphinscheduler.common.utils.ParameterUtils;
import org.apache.dolphinscheduler.dao.AlertDao; import org.apache.dolphinscheduler.dao.AlertDao;
import org.apache.dolphinscheduler.dao.datasource.BaseDataSource; import org.apache.dolphinscheduler.dao.datasource.BaseDataSource;
import org.apache.dolphinscheduler.dao.datasource.DataSourceFactory; import org.apache.dolphinscheduler.dao.datasource.DataSourceFactory;
@ -41,16 +50,30 @@ import org.apache.dolphinscheduler.server.utils.ParamUtils;
import org.apache.dolphinscheduler.server.utils.UDFUtils; import org.apache.dolphinscheduler.server.utils.UDFUtils;
import org.apache.dolphinscheduler.server.worker.task.AbstractTask; import org.apache.dolphinscheduler.server.worker.task.AbstractTask;
import org.apache.dolphinscheduler.service.bean.SpringApplicationContext; import org.apache.dolphinscheduler.service.bean.SpringApplicationContext;
import org.slf4j.Logger;
import java.sql.*; import org.apache.commons.lang.StringUtils;
import java.util.*;
import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.PreparedStatement;
import java.sql.ResultSet;
import java.sql.ResultSetMetaData;
import java.sql.SQLException;
import java.sql.Statement;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.Properties;
import java.util.regex.Matcher; import java.util.regex.Matcher;
import java.util.regex.Pattern; import java.util.regex.Pattern;
import java.util.stream.Collectors; import java.util.stream.Collectors;
import static org.apache.dolphinscheduler.common.Constants.*; import org.slf4j.Logger;
import static org.apache.dolphinscheduler.common.enums.DbType.HIVE;
import com.alibaba.fastjson.JSONArray;
import com.alibaba.fastjson.JSONObject;
/** /**
* sql task * sql task
*/ */

23
dolphinscheduler-server/src/test/java/org/apache/dolphinscheduler/server/worker/task/sqoop/SqoopTaskTest.java

@ -26,6 +26,8 @@ import org.apache.dolphinscheduler.service.bean.SpringApplicationContext;
import org.apache.dolphinscheduler.service.process.ProcessService; import org.apache.dolphinscheduler.service.process.ProcessService;
import java.util.Date; import java.util.Date;
import java.util.List;
import java.util.concurrent.LinkedBlockingQueue;
import org.junit.Assert; import org.junit.Assert;
import org.junit.Before; import org.junit.Before;
@ -199,4 +201,25 @@ public class SqoopTaskTest {
} }
} }
@Test
public void testLogHandler() throws InterruptedException {
LinkedBlockingQueue<String> loggerBuffer = new LinkedBlockingQueue<>();
Thread thread1 = new Thread(() -> {
for (int i = 0; i < 10; i++) {
loggerBuffer.add("test add log");
}
});
Thread thread2 = new Thread(() -> {
for (int i = 0; i < 10; i++) {
sqoopTask.logHandle(loggerBuffer);
}
});
thread1.start();
thread2.start();
thread1.join();
thread2.join();
// if no exception throw, assert true
Assert.assertTrue(true);
}
} }

Loading…
Cancel
Save