datahub/wherehows-backend/app/actors/EtlJobActor.java
Mars Lan 5f5c0937d1 Rename web, backend-service (#490)
* Rename web to wherehows-api and update README.

* Rename backend-service to wherehows-backend

* Rename metadata-etl to wherehows-etl

* Rename hadoop-dataset-extractor-standalone to wherehows-hadoop
2017-07-10 13:42:56 -07:00

160 lines
5.3 KiB
Java

/**
* Copyright 2015 LinkedIn Corp. All rights reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
*/
package actors;
import akka.actor.UntypedActor;
import java.net.UnknownHostException;
import java.util.List;
import metadata.etl.models.EtlJobStatus;
import models.daos.EtlJobDao;
import models.daos.EtlJobPropertyDao;
import msgs.EtlJobMessage;
import play.Logger;
import play.Play;
import shared.Global;
import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.lang.reflect.Field;
import java.util.Properties;
import wherehows.common.Constant;
/**
* Created by zechen on 9/4/15.
*/
public class EtlJobActor extends UntypedActor {
private Process process;
private static final String ETL_TEMP_DIR = Play.application().configuration().getString("etl.temp_dir");
@Override
public void onReceive(Object message)
throws Exception {
Properties props = null;
if (message instanceof EtlJobMessage) {
EtlJobMessage msg = (EtlJobMessage) message;
try {
props = EtlJobPropertyDao.getJobProperties(msg.getEtlJobName(), msg.getRefId());
Properties whProps = EtlJobPropertyDao.getWherehowsProperties();
props.putAll(whProps);
props.setProperty(Constant.WH_APP_FOLDER_KEY, ETL_TEMP_DIR);
EtlJobDao.startRun(msg.getWhEtlExecId(), "Job started!");
// start a new process here
final ProcessBuilder pb = ConfigUtil.buildProcess(
msg.getEtlJobName(), msg.getWhEtlExecId(), msg.getCmdParam(), props);
Logger.debug("run command : " + pb.command());
ConfigUtil.generateProperties(msg.getEtlJobName(), msg.getRefId(), msg.getWhEtlExecId(), props);
int retry = 0;
int execResult = 0;
String line;
while (retry < 3) {
long startTime = System.currentTimeMillis();
process = pb.start();
// update process id and hostname for started job
EtlJobDao.updateJobProcessInfo(msg.getWhEtlExecId(), getPid(process), getHostname());
// wait until this process finished.
execResult = process.waitFor();
long elapsedTime = System.currentTimeMillis() - startTime;
// For process error such as ImportError or ArgumentError happening shortly after starting, retry
if (execResult == 2 && elapsedTime < 10000) {
retry++;
Logger.error("*** Process + " + getPid(process) + " failed, status: " + execResult + ". Retry " + retry);
if (process.isAlive()) {
process.destroy();
}
Thread.sleep(10000);
} else {
break;
}
}
// if the process failed, log the error and throw exception
if (execResult > 0) {
BufferedReader br = new BufferedReader(new InputStreamReader(process.getErrorStream()));
String errString = "Error Details:\n";
while ((line = br.readLine()) != null)
errString = errString.concat(line).concat("\n");
Logger.error("*** Process + " + getPid(process) + " failed, status: " + execResult);
Logger.error(errString);
throw new Exception("Process + " + getPid(process) + " failed");
}
EtlJobDao.endRun(msg.getWhEtlExecId(), EtlJobStatus.SUCCEEDED, "Job succeed!");
Logger.info("ETL job {} finished", msg.toDebugString());
if (msg.getEtlJobName().affectDataset()) {
ActorRegistry.treeBuilderActor.tell("dataset", getSelf());
}
if (msg.getEtlJobName().affectFlow()) {
ActorRegistry.treeBuilderActor.tell("flow", getSelf());
}
} catch (Throwable e) { // catch all throwable at the highest level.
e.printStackTrace();
Logger.error("ETL job {} got a problem", msg.toDebugString());
if (process.isAlive()) {
process.destroy();
}
EtlJobDao.endRun(msg.getWhEtlExecId(), EtlJobStatus.ERROR, e.getMessage());
} finally {
Global.removeRunningJob(((EtlJobMessage) message).getWhEtlJobId());
if (!Logger.isDebugEnabled()) // if debug enable, won't delete the config files.
ConfigUtil.deletePropertiesFile(props, msg.getWhEtlExecId());
}
}
}
/**
* Reflection to get the pid
*
* @param process {@code Process}
* @return pid, -1 if not found
*/
private static int getPid(Process process) {
try {
Class<?> cProcessImpl = process.getClass();
Field fPid = cProcessImpl.getDeclaredField("pid");
if (!fPid.isAccessible()) {
fPid.setAccessible(true);
}
return fPid.getInt(process);
} catch (Exception e) {
return -1;
}
}
/**
* Return the hostname of the machine
* @return hostname, null if unknown
*/
private static String getHostname() {
try {
return java.net.InetAddress.getLocalHost().getHostName();
} catch (UnknownHostException ex) {
return null;
}
}
}