package io.dataease.service.dataset;

import com.google.gson.Gson;
import io.dataease.base.domain.*;
import io.dataease.base.mapper.DatasetTableMapper;
import io.dataease.base.mapper.DatasetTableTaskMapper;
import io.dataease.base.mapper.DatasourceMapper;
import io.dataease.base.mapper.ext.ExtChartViewMapper;
import io.dataease.commons.constants.*;
import io.dataease.commons.model.AuthURD;
import io.dataease.commons.utils.*;
import io.dataease.datasource.constants.DatasourceTypes;
import io.dataease.datasource.dto.*;
import io.dataease.datasource.provider.DatasourceProvider;
import io.dataease.datasource.provider.JdbcProvider;
import io.dataease.datasource.provider.ProviderFactory;
import io.dataease.datasource.request.DatasourceRequest;
import io.dataease.dto.dataset.DataTableInfoDTO;
import io.dataease.exception.DataEaseException;
import io.dataease.listener.util.CacheUtils;
import io.dataease.provider.QueryProvider;
import io.dataease.service.message.DeMsgutil;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.io.FileUtils;
import org.apache.commons.lang3.ObjectUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.http.HttpResponse;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.poi.hssf.usermodel.HSSFSheet;
import org.apache.poi.hssf.usermodel.HSSFWorkbook;
import org.apache.poi.xssf.usermodel.XSSFSheet;
import org.apache.poi.xssf.usermodel.XSSFWorkbook;
import org.pentaho.di.cluster.SlaveServer;
import org.pentaho.di.core.database.DatabaseMeta;
import org.pentaho.di.core.row.ValueMetaInterface;
import org.pentaho.di.core.util.HttpClientManager;
import org.pentaho.di.job.Job;
import org.pentaho.di.job.JobExecutionConfiguration;
import org.pentaho.di.job.JobHopMeta;
import org.pentaho.di.job.JobMeta;
import org.pentaho.di.job.entries.shell.JobEntryShell;
import org.pentaho.di.job.entries.special.JobEntrySpecial;
import org.pentaho.di.job.entries.success.JobEntrySuccess;
import org.pentaho.di.job.entries.trans.JobEntryTrans;
import org.pentaho.di.job.entry.JobEntryCopy;
import org.pentaho.di.repository.RepositoryDirectoryInterface;
import org.pentaho.di.repository.filerep.KettleFileRepository;
import org.pentaho.di.trans.TransHopMeta;
import org.pentaho.di.trans.TransMeta;
import org.pentaho.di.trans.step.StepMeta;
import org.pentaho.di.trans.steps.excelinput.ExcelInputField;
import org.pentaho.di.trans.steps.excelinput.ExcelInputMeta;
import org.pentaho.di.trans.steps.excelinput.SpreadSheetType;
import org.pentaho.di.trans.steps.tableinput.TableInputMeta;
import org.pentaho.di.trans.steps.textfileoutput.TextFileField;
import org.pentaho.di.trans.steps.textfileoutput.TextFileOutputMeta;
import org.pentaho.di.trans.steps.userdefinedjavaclass.UserDefinedJavaClassDef;
import org.pentaho.di.trans.steps.userdefinedjavaclass.UserDefinedJavaClassMeta;
import org.pentaho.di.www.SlaveServerJobStatus;
import org.quartz.JobExecutionContext;
import org.springframework.beans.factory.annotation.Value;
import org.springframework.context.annotation.Lazy;
import org.springframework.stereotype.Service;

import javax.annotation.Resource;
import java.io.File;
import java.io.FileInputStream;
import java.io.InputStream;
import java.net.InetAddress;
import java.util.*;
import java.util.stream.Collectors;

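/**
 * Synchronizes dataset data into Doris: builds Kettle (PDI) transformation and
 * job files on disk, runs them on a remote Carte server, and stream-loads the
 * resulting text files into Doris via a generated shell step.
 */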
@Service
public class ExtractDataService {

    @Resource
    @Lazy
    private DataSetTableService dataSetTableService;
    @Resource
    private DataSetTableFieldsService dataSetTableFieldsService;
    @Resource
    @Lazy
    private DataSetTableTaskLogService dataSetTableTaskLogService;
    @Resource
    @Lazy
    private DataSetTableTaskService dataSetTableTaskService;
    @Resource
    private DatasourceMapper datasourceMapper;
    @Resource
    private DatasetTableMapper datasetTableMapper;
    @Resource
    private DatasetTableTaskMapper datasetTableTaskMapper;

    @Resource
    private ExtChartViewMapper extChartViewMapper;

    // Placeholders replaced with concrete timestamps when building incremental SQL
    private static final String lastUpdateTime = "${__last_update_time__}";
    private static final String currentUpdateTime = "${__current_update_time__}";
    // Column separator and file extension of the intermediate text files
    private static final String separator = "|DE|";
    private static final String extention = "txt";
    private static final String root_path = "/opt/dataease/data/kettle/";

    @Value("${carte.host:127.0.0.1}")
    private String carte;
    @Value("${carte.port:8080}")
    private String port;
    @Value("${carte.user:cluster}")
    private String user;
    @Value("${carte.passwd:cluster}")
    private String passwd;

    private static final String creatTableSql = "CREATE TABLE IF NOT EXISTS `TABLE_NAME`" +
            "Column_Fields" +
            "UNIQUE KEY(dataease_uuid)\n" +
            "DISTRIBUTED BY HASH(dataease_uuid) BUCKETS 10\n" +
            "PROPERTIES(\"replication_num\" = \"1\");";

    private static final String dropTableSql = "DROP TABLE IF EXISTS TABLE_NAME;";

    // Shell template for Doris Stream Load: uploads the generated file via curl
    // and fails the job entry when Doris reports "Status": "Fail".
    private static final String shellScript = "result=`curl --location-trusted -u %s:%s -H \"label:%s\" -H \"column_separator:%s\" -H \"columns:%s\" -H \"merge_type: %s\" -T %s -XPUT http://%s:%s/api/%s/%s/_stream_load`\n" +
            "if [ $? == 0 ] ; then\n" +
            "  failstatus=$(echo $result | grep '\"Status\": \"Fail\"')\n" +
            "  if [[ \"$failstatus\" != \"\" ]]; then\n" +
            "    echo $result\n" +
            "    exit 1\n" +
            "  fi\n" +
            "else\n" +
            "  echo $result\n" +
            "  exit 1\n" +
            "fi\n" +
            "rm -rf %s\n";

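    /**
     * Atomically flips the dataset's syncStatus to Underway. Returns true when
     * another sync already holds the Underway status (the caller should skip this
     * run) unless the running log entry was custom-triggered; returns false when
     * this call won the status update and the task may proceed.
     */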
    public synchronized boolean existSyncTask(DatasetTable datasetTable, DatasetTableTask datasetTableTask) {
        datasetTable.setSyncStatus(JobStatus.Underway.name());
        DatasetTableExample example = new DatasetTableExample();
        example.createCriteria().andIdEqualTo(datasetTable.getId()).andSyncStatusNotEqualTo(JobStatus.Underway.name());
        example.or(example.createCriteria().andIdEqualTo(datasetTable.getId()).andSyncStatusIsNull());
        boolean existSyncTask = datasetTableMapper.updateByExampleSelective(datasetTable, example) == 0;
        if (existSyncTask) {
            DatasetTableTaskLog datasetTableTaskLog = new DatasetTableTaskLog();
            datasetTableTaskLog.setTaskId(datasetTableTask.getId());
            datasetTableTaskLog.setTableId(datasetTable.getId());
            datasetTableTaskLog.setStatus(JobStatus.Underway.name());
            List<DatasetTableTaskLog> datasetTableTaskLogs = dataSetTableTaskLogService.select(datasetTableTaskLog);
            // A manually triggered run that is still underway is allowed to proceed
            if (CollectionUtils.isNotEmpty(datasetTableTaskLogs) && datasetTableTaskLogs.get(0).getTriggerType().equalsIgnoreCase(TriggerType.Custom.name())) {
                return false;
            }
            return true;
        } else {
            datasetTableTask.setLastExecTime(System.currentTimeMillis());
            datasetTableTask.setLastExecStatus(JobStatus.Underway.name());
            dataSetTableTaskService.update(datasetTableTask);
            return false;
        }
    }

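    /**
     * Extracts data from an uploaded Excel file into Doris, either as a full
     * refresh (all_scope) or as an incremental append (add_scope).
     */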
    public void extractExcelData(String datasetTableId, String type) {
        Datasource datasource = new Datasource();
        datasource.setType("excel");
        DatasetTable datasetTable = getDatasetTable(datasetTableId);
        if (datasetTable == null) {
            LogUtil.error("Can not find DatasetTable: " + datasetTableId);
            return;
        }
        UpdateType updateType = UpdateType.valueOf(type);
        DatasetTableTaskLog datasetTableTaskLog = new DatasetTableTaskLog();
        List<DatasetTableField> datasetTableFields = dataSetTableFieldsService.list(DatasetTableField.builder().tableId(datasetTable.getId()).build());
        // Fields without a column index sort first
        datasetTableFields.sort((o1, o2) -> {
            if (o1.getColumnIndex() == null) {
                return -1;
            }
            if (o2.getColumnIndex() == null) {
                return 1;
            }
            return o1.getColumnIndex().compareTo(o2.getColumnIndex());
        });
        String dorisTablColumnSql = createDorisTablColumnSql(datasetTableFields);
        switch (updateType) {
            case all_scope: // full refresh
                try {
                    datasetTableTaskLog = writeDatasetTableTaskLog(datasetTableTaskLog, datasetTableId, null);
                    createDorisTable(DorisTableUtils.dorisName(datasetTableId), dorisTablColumnSql);
                    createDorisTable(DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTableId)), dorisTablColumnSql);
                    generateTransFile("all_scope", datasetTable, datasource, datasetTableFields, null);
                    if (datasetTable.getType().equalsIgnoreCase("sql")) {
                        generateJobFile("all_scope", datasetTable, fetchSqlField(new Gson().fromJson(datasetTable.getInfo(), DataTableInfoDTO.class).getSql(), datasource));
                    } else {
                        generateJobFile("all_scope", datasetTable, String.join(",", datasetTableFields.stream().map(DatasetTableField::getDataeaseName).collect(Collectors.toList())));
                    }
                    Long execTime = System.currentTimeMillis();
                    extractData(datasetTable, "all_scope");
                    replaceTable(DorisTableUtils.dorisName(datasetTableId));
                    saveSucessLog(datasetTableTaskLog);
                    sendWebMsg(datasetTable, null, true);
                    deleteFile("all_scope", datasetTableId);
                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Completed, execTime);
                } catch (Exception e) {
                    saveErrorLog(datasetTableId, null, e);
                    sendWebMsg(datasetTable, null, false);
                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Error, null);
                    dropDorisTable(DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTableId)));
                    deleteFile("all_scope", datasetTableId);
                }
                break;

            case add_scope: // incremental update
                try {
                    datasetTableTaskLog = writeDatasetTableTaskLog(datasetTableTaskLog, datasetTableId, null);
                    generateTransFile("incremental_add", datasetTable, datasource, datasetTableFields, null);
                    generateJobFile("incremental_add", datasetTable, String.join(",", datasetTableFields.stream().map(DatasetTableField::getDataeaseName).collect(Collectors.toList())));
                    Long execTime = System.currentTimeMillis();
                    extractData(datasetTable, "incremental_add");
                    saveSucessLog(datasetTableTaskLog);
                    sendWebMsg(datasetTable, null, true);
                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Completed, execTime);
                } catch (Exception e) {
                    saveErrorLog(datasetTableId, null, e);
                    sendWebMsg(datasetTable, null, false);
                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Error, null);
                    deleteFile("incremental_add", datasetTableId);
                    deleteFile("incremental_delete", datasetTableId);
                }
                break;
        }
        // Invasively evict the caches of views that depend on this dataset
        List<String> viewIds = extChartViewMapper.allViewIds(datasetTableId);
        if (CollectionUtils.isNotEmpty(viewIds)) {
            viewIds.forEach(viewId -> CacheUtils.remove(JdbcConstants.VIEW_CACHE_KEY, viewId));
        }
    }

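    /**
     * Scheduled entry point (invoked by Quartz): runs the sync task identified by
     * taskId against the dataset's datasource, with full-refresh or incremental
     * semantics depending on the update type.
     */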
    public void extractData(String datasetTableId, String taskId, String type, JobExecutionContext context) {
        DatasetTable datasetTable = getDatasetTable(datasetTableId);
        if (datasetTable == null) {
            LogUtil.error("Can not find DatasetTable: " + datasetTableId);
            return;
        }
        DatasetTableTask datasetTableTask = datasetTableTaskMapper.selectByPrimaryKey(taskId);
        if (datasetTableTask == null) {
            return;
        }
        if (datasetTableTask.getStatus().equalsIgnoreCase(TaskStatus.Stopped.name())) {
            LogUtil.info("Skip synchronization task, task ID : " + datasetTableTask.getId());
            return;
        }
        if (existSyncTask(datasetTable, datasetTableTask)) {
            LogUtil.info("Skip synchronization task for dataset, dataset ID : " + datasetTableId);
            return;
        }

        DatasetTableTaskLog datasetTableTaskLog = new DatasetTableTaskLog();
        UpdateType updateType = UpdateType.valueOf(type);
        if (context != null) {
            datasetTable.setQrtzInstance(context.getFireInstanceId());
            datasetTableMapper.updateByPrimaryKeySelective(datasetTable);
        }
        Datasource datasource = new Datasource();
        if (StringUtils.isNotEmpty(datasetTable.getDataSourceId())) {
            datasource = datasourceMapper.selectByPrimaryKey(datasetTable.getDataSourceId());
        } else {
            datasource.setType(datasetTable.getType());
        }
        List<DatasetTableField> datasetTableFields = dataSetTableFieldsService.list(DatasetTableField.builder().tableId(datasetTable.getId()).build());
        // Fields without a column index sort first
        datasetTableFields.sort((o1, o2) -> {
            if (o1.getColumnIndex() == null) {
                return -1;
            }
            if (o2.getColumnIndex() == null) {
                return 1;
            }
            return o1.getColumnIndex().compareTo(o2.getColumnIndex());
        });
        String dorisTablColumnSql = createDorisTablColumnSql(datasetTableFields);

        switch (updateType) {
            case all_scope: // full refresh
                try {
                    if (datasetTableTask.getRate().equalsIgnoreCase(ScheduleType.CRON.toString())) {
                        datasetTableTaskLog = writeDatasetTableTaskLog(datasetTableTaskLog, datasetTableId, taskId);
                    }
                    if (datasetTableTask.getRate().equalsIgnoreCase(ScheduleType.SIMPLE.toString())) {
                        datasetTableTaskLog = getDatasetTableTaskLog(datasetTableTaskLog, datasetTableId, taskId);
                    }
                    createDorisTable(DorisTableUtils.dorisName(datasetTableId), dorisTablColumnSql);
                    createDorisTable(DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTableId)), dorisTablColumnSql);
                    generateTransFile("all_scope", datasetTable, datasource, datasetTableFields, null);
                    if (datasetTable.getType().equalsIgnoreCase("sql")) {
                        generateJobFile("all_scope", datasetTable, fetchSqlField(new Gson().fromJson(datasetTable.getInfo(), DataTableInfoDTO.class).getSql(), datasource));
                    } else {
                        generateJobFile("all_scope", datasetTable, String.join(",", datasetTableFields.stream().map(DatasetTableField::getDataeaseName).collect(Collectors.toList())));
                    }
                    Long execTime = System.currentTimeMillis();
                    extractData(datasetTable, "all_scope");
                    replaceTable(DorisTableUtils.dorisName(datasetTableId));
                    saveSucessLog(datasetTableTaskLog);

                    sendWebMsg(datasetTable, datasetTableTask, true);

                    deleteFile("all_scope", datasetTableId);

                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Completed, execTime);
                    datasetTableTask.setLastExecStatus(JobStatus.Completed.name());
                    dataSetTableTaskService.update(datasetTableTask);
                } catch (Exception e) {
                    saveErrorLog(datasetTableId, taskId, e);
                    datasetTableTask.setLastExecStatus(JobStatus.Error.name());
                    dataSetTableTaskService.update(datasetTableTask);

                    sendWebMsg(datasetTable, datasetTableTask, false);
                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Error, null);
                    dropDorisTable(DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTableId)));
                    deleteFile("all_scope", datasetTableId);
                }
                break;

            case add_scope: // incremental update
                try {
                    DatasetTableIncrementalConfig datasetTableIncrementalConfig = dataSetTableService.incrementalConfig(datasetTableId);
                    if (datasetTableIncrementalConfig == null || StringUtils.isEmpty(datasetTableIncrementalConfig.getTableId())) {
                        updateTableStatus(datasetTableId, datasetTable, JobStatus.Completed, null);
                        return;
                    }

                    // Null check must come first to avoid unboxing a null Long
                    if (datasetTable.getLastUpdateTime() == null || datasetTable.getLastUpdateTime() == 0) {
                        updateTableStatus(datasetTableId, datasetTable, JobStatus.Completed, null);
                        return;
                    }

                    if (datasetTableTask.getRate().equalsIgnoreCase(ScheduleType.CRON.toString())) {
                        datasetTableTaskLog = writeDatasetTableTaskLog(datasetTableTaskLog, datasetTableId, taskId);
                    }
                    if (datasetTableTask.getRate().equalsIgnoreCase(ScheduleType.SIMPLE.toString())) {
                        datasetTableTaskLog = getDatasetTableTaskLog(datasetTableTaskLog, datasetTableId, taskId);
                    }
                    Long execTime = System.currentTimeMillis();
                    if (StringUtils.isNotEmpty(datasetTableIncrementalConfig.getIncrementalAdd()) && StringUtils.isNotEmpty(datasetTableIncrementalConfig.getIncrementalAdd().replace(" ", ""))) { // incremental insert
                        String sql = datasetTableIncrementalConfig.getIncrementalAdd().replace(lastUpdateTime, datasetTable.getLastUpdateTime().toString())
                                .replace(currentUpdateTime, Long.valueOf(System.currentTimeMillis()).toString());
                        generateTransFile("incremental_add", datasetTable, datasource, datasetTableFields, sql);
                        generateJobFile("incremental_add", datasetTable, fetchSqlField(sql, datasource));
                        extractData(datasetTable, "incremental_add");
                    }

                    if (StringUtils.isNotEmpty(datasetTableIncrementalConfig.getIncrementalDelete()) && StringUtils.isNotEmpty(datasetTableIncrementalConfig.getIncrementalDelete().replace(" ", ""))) { // incremental delete
                        String sql = datasetTableIncrementalConfig.getIncrementalDelete().replace(lastUpdateTime, datasetTable.getLastUpdateTime().toString())
                                .replace(currentUpdateTime, Long.valueOf(System.currentTimeMillis()).toString());
                        generateTransFile("incremental_delete", datasetTable, datasource, datasetTableFields, sql);
                        generateJobFile("incremental_delete", datasetTable, fetchSqlField(sql, datasource));
                        extractData(datasetTable, "incremental_delete");
                    }
                    saveSucessLog(datasetTableTaskLog);

                    sendWebMsg(datasetTable, datasetTableTask, true);

                    deleteFile("incremental_add", datasetTableId);
                    deleteFile("incremental_delete", datasetTableId);

                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Completed, execTime);
                    datasetTableTask.setLastExecStatus(JobStatus.Completed.name());
                    dataSetTableTaskService.update(datasetTableTask);
                } catch (Exception e) {
                    saveErrorLog(datasetTableId, taskId, e);
                    sendWebMsg(datasetTable, datasetTableTask, false);
                    updateTableStatus(datasetTableId, datasetTable, JobStatus.Error, null);
                    datasetTableTask.setLastExecStatus(JobStatus.Error.name());
                    dataSetTableTaskService.update(datasetTableTask);
                    deleteFile("incremental_add", datasetTableId);
                    deleteFile("incremental_delete", datasetTableId);
                }
                break;
        }
        // Invasively evict the caches of views that depend on this dataset
        List<String> viewIds = extChartViewMapper.allViewIds(datasetTableId);
        if (CollectionUtils.isNotEmpty(viewIds)) {
            viewIds.forEach(viewId -> CacheUtils.remove(JdbcConstants.VIEW_CACHE_KEY, viewId));
        }
    }

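    /**
     * Notifies every user with access to the dataset about the sync result via
     * the in-app message service.
     */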
    private void sendWebMsg(DatasetTable datasetTable, DatasetTableTask datasetTableTask, Boolean status) {
        // datasetTableTask is null when called from the Excel extraction path
        String taskId = datasetTableTask == null ? null : datasetTableTask.getId();
        String msg = status ? "成功" : "失败";
        Long typeId = status ? 5L : 6L;
        String id = datasetTable.getId();
        AuthURD authURD = AuthUtils.authURDR(id);
        Set<Long> userIds = AuthUtils.userIdsByURD(authURD);
        Gson gson = new Gson();
        userIds.forEach(userId -> {
            Map<String, Object> param = new HashMap<>();
            param.put("tableId", id);
            if (StringUtils.isNotEmpty(taskId)) {
                param.put("taskId", taskId);
            }
            String content = "数据集【" + datasetTable.getName() + "】同步" + msg;
            if (ObjectUtils.isNotEmpty(datasetTableTask) && ObjectUtils.isNotEmpty(datasetTableTask.getName())) {
                content += " 任务名称【" + datasetTableTask.getName() + "】";
            }
            DeMsgutil.sendMsg(userId, typeId, 1L, content, gson.toJson(param));
        });
    }

    private void updateTableStatus(String datasetTableId, DatasetTable datasetTable, JobStatus jobStatus, Long execTime) {
        datasetTable.setSyncStatus(jobStatus.name());
        if (execTime != null) {
            datasetTable.setLastUpdateTime(execTime);
        }
        DatasetTableExample example = new DatasetTableExample();
        example.createCriteria().andIdEqualTo(datasetTableId);
        datasetTableMapper.updateByExampleSelective(datasetTable, example);
    }

    private void saveSucessLog(DatasetTableTaskLog datasetTableTaskLog) {
        datasetTableTaskLog.setStatus(JobStatus.Completed.name());
        datasetTableTaskLog.setEndTime(System.currentTimeMillis());
        dataSetTableTaskLogService.save(datasetTableTaskLog);
    }

    private void saveErrorLog(String datasetTableId, String taskId, Exception e) {
        LogUtil.error("Extract data error: " + datasetTableId, e);
        // Find the Underway log entry for this table/task and mark it as failed
        DatasetTableTaskLog datasetTableTaskLog = new DatasetTableTaskLog();
        datasetTableTaskLog.setTableId(datasetTableId);
        datasetTableTaskLog.setStatus(JobStatus.Underway.name());
        if (StringUtils.isNotEmpty(taskId)) {
            datasetTableTaskLog.setTaskId(taskId);
        }
        List<DatasetTableTaskLog> datasetTableTaskLogs = dataSetTableTaskLogService.select(datasetTableTaskLog);
        if (CollectionUtils.isNotEmpty(datasetTableTaskLogs)) {
            datasetTableTaskLog = datasetTableTaskLogs.get(0);
            datasetTableTaskLog.setStatus(JobStatus.Error.name());
            datasetTableTaskLog.setInfo(e.getMessage());
            datasetTableTaskLog.setEndTime(System.currentTimeMillis());
            dataSetTableTaskLogService.save(datasetTableTaskLog);
        }
    }

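    /**
     * Maps dataset fields (by deExtractType) to Doris column definitions, always
     * prepending the dataease_uuid key column used for deduplication.
     */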
    private String createDorisTablColumnSql(List<DatasetTableField> datasetTableFields) {
        // Builds "(dataease_uuid varchar(50), `col` type, ...)" for the CREATE TABLE template
        StringBuilder columnFields = new StringBuilder("dataease_uuid varchar(50), `");
        for (DatasetTableField datasetTableField : datasetTableFields) {
            columnFields.append(datasetTableField.getDataeaseName()).append("` ");
            switch (datasetTableField.getDeExtractType()) {
                case 0: // text: reserve 3 bytes per character, capped at Doris' varchar limit
                    if (datasetTableField.getSize() > 65533 || datasetTableField.getSize() * 3 > 65533) {
                        columnFields.append("varchar(65533)").append(",`");
                    } else {
                        columnFields.append("varchar(").append(datasetTableField.getSize() * 3).append(")").append(",`");
                    }
                    break;
                case 1: // time, stored as varchar
                    columnFields.append("varchar(").append(datasetTableField.getSize()).append(")").append(",`");
                    break;
                case 2: // integer
                    columnFields.append("bigint(").append(datasetTableField.getSize()).append(")").append(",`");
                    break;
                case 3: // float
                    columnFields.append("DOUBLE").append(",`");
                    break;
                case 4: // boolean
                    columnFields.append("TINYINT(").append(datasetTableField.getSize()).append(")").append(",`");
                    break;
                default:
                    columnFields.append("varchar(").append(datasetTableField.getSize()).append(")").append(",`");
                    break;
            }
        }

        // Strip the trailing ",`" and wrap in parentheses
        String result = columnFields.substring(0, columnFields.length() - 2);
        return "(" + result + ")\n";
    }

    private void createDorisTable(String dorisTableName, String dorisTablColumnSql) throws Exception {
        Datasource dorisDatasource = (Datasource) CommonBeanFactory.getBean("DorisDatasource");
        JdbcProvider jdbcProvider = CommonBeanFactory.getBean(JdbcProvider.class);
        DatasourceRequest datasourceRequest = new DatasourceRequest();
        datasourceRequest.setDatasource(dorisDatasource);
        datasourceRequest.setQuery(creatTableSql.replace("TABLE_NAME", dorisTableName).replace("Column_Fields", dorisTablColumnSql));
        jdbcProvider.exec(datasourceRequest);
    }

    private void dropDorisTable(String dorisTableName) {
        try {
            Datasource dorisDatasource = (Datasource) CommonBeanFactory.getBean("DorisDatasource");
            JdbcProvider jdbcProvider = CommonBeanFactory.getBean(JdbcProvider.class);
            DatasourceRequest datasourceRequest = new DatasourceRequest();
            datasourceRequest.setDatasource(dorisDatasource);
            datasourceRequest.setQuery(dropTableSql.replace("TABLE_NAME", dorisTableName));
            jdbcProvider.exec(datasourceRequest);
        } catch (Exception ignore) {
        }
    }

    private void replaceTable(String dorisTableName) throws Exception {
        // Atomically swap the freshly loaded tmp table into place, dropping the old data
        Datasource dorisDatasource = (Datasource) CommonBeanFactory.getBean("DorisDatasource");
        JdbcProvider jdbcProvider = CommonBeanFactory.getBean(JdbcProvider.class);
        DatasourceRequest datasourceRequest = new DatasourceRequest();
        datasourceRequest.setDatasource(dorisDatasource);
        datasourceRequest.setQuery("ALTER TABLE DORIS_TABLE REPLACE WITH TABLE DORIS_TMP_TABLE PROPERTIES('swap' = 'false');".replace("DORIS_TABLE", dorisTableName).replace("DORIS_TMP_TABLE", DorisTableUtils.dorisTmpName(dorisTableName)));
        jdbcProvider.exec(datasourceRequest);
    }

    private DatasetTable getDatasetTable(String datasetTableId) {
        // Retry a few times: the record may not be visible yet right after creation
        for (int i = 0; i < 5; i++) {
            DatasetTable datasetTable = dataSetTableService.get(datasetTableId);
            if (datasetTable == null) {
                try {
                    Thread.sleep(1000);
                } catch (Exception ignore) {
                }
            } else {
                return datasetTable;
            }
        }
        return null;
    }

    private DatasetTableTaskLog writeDatasetTableTaskLog(DatasetTableTaskLog datasetTableTaskLog, String datasetTableId, String taskId) {
        datasetTableTaskLog.setTableId(datasetTableId);
        datasetTableTaskLog.setTaskId(taskId);
        datasetTableTaskLog.setStatus(JobStatus.Underway.name());
        datasetTableTaskLog.setTriggerType(TriggerType.Cron.name());
        List<DatasetTableTaskLog> datasetTableTaskLogs = dataSetTableTaskLogService.select(datasetTableTaskLog);
        if (CollectionUtils.isEmpty(datasetTableTaskLogs)) {
            datasetTableTaskLog.setStartTime(System.currentTimeMillis());
            dataSetTableTaskLogService.save(datasetTableTaskLog);
            return datasetTableTaskLog;
        } else {
            return datasetTableTaskLogs.get(0);
        }
    }

    private DatasetTableTaskLog getDatasetTableTaskLog(DatasetTableTaskLog datasetTableTaskLog, String datasetTableId, String taskId) {
        datasetTableTaskLog.setTableId(datasetTableId);
        datasetTableTaskLog.setTaskId(taskId);
        datasetTableTaskLog.setStatus(JobStatus.Underway.name());
        // Poll for the log entry created by the scheduler; fall back to creating one
        for (int i = 0; i < 5; i++) {
            List<DatasetTableTaskLog> datasetTableTaskLogs = dataSetTableTaskLogService.select(datasetTableTaskLog);
            if (CollectionUtils.isNotEmpty(datasetTableTaskLogs)) {
                return datasetTableTaskLogs.get(0);
            }
            try {
                Thread.sleep(1000);
            } catch (Exception ignore) {
            }
        }
        datasetTableTaskLog.setStartTime(System.currentTimeMillis());
        dataSetTableTaskLogService.save(datasetTableTaskLog);
        return datasetTableTaskLog;
    }

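    /**
     * Loads the generated Kettle job from the file repository, submits it to the
     * remote Carte server, and blocks until it finishes; throws when the job does
     * not end in the "Finished" state.
     */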
    private void extractData(DatasetTable datasetTable, String extractType) throws Exception {
        KettleFileRepository repository = CommonBeanFactory.getBean(KettleFileRepository.class);
        RepositoryDirectoryInterface repositoryDirectoryInterface = repository.loadRepositoryDirectoryTree();
        JobMeta jobMeta = null;
        switch (extractType) {
            case "all_scope":
                jobMeta = repository.loadJob("job_" + DorisTableUtils.dorisName(datasetTable.getId()), repositoryDirectoryInterface, null, null);
                break;
            case "incremental_add":
                jobMeta = repository.loadJob("job_add_" + DorisTableUtils.dorisName(datasetTable.getId()), repositoryDirectoryInterface, null, null);
                break;
            case "incremental_delete":
                jobMeta = repository.loadJob("job_delete_" + DorisTableUtils.dorisName(datasetTable.getId()), repositoryDirectoryInterface, null, null);
                break;
            default:
                break;
        }

        // Submit the job to the remote Carte server and poll until it finishes
        SlaveServer remoteSlaveServer = getSlaveServer();
        JobExecutionConfiguration jobExecutionConfiguration = new JobExecutionConfiguration();
        jobExecutionConfiguration.setRemoteServer(remoteSlaveServer);
        jobExecutionConfiguration.setRepository(repository);
        String lastCarteObjectId = Job.sendToSlaveServer(jobMeta, jobExecutionConfiguration, repository, null);
        SlaveServerJobStatus jobStatus;
        while (true) {
            jobStatus = remoteSlaveServer.getJobStatus(jobMeta.getName(), lastCarteObjectId, 0);
            if (!jobStatus.isRunning() && !jobStatus.isWaiting()) {
                break;
            }
            Thread.sleep(1000);
        }
        if (!jobStatus.getStatusDescription().equals("Finished")) {
            DataEaseException.throwException(jobStatus.getLoggingString());
        }
    }

    private boolean isExitFile(String fileName) {
        File file = new File(root_path + fileName);
        return file.exists();
    }

    private SlaveServer getSlaveServer() {
        SlaveServer remoteSlaveServer = new SlaveServer();
        remoteSlaveServer.setHostname(carte); // remote Carte host
        remoteSlaveServer.setPort(port); // Carte port
        remoteSlaveServer.setUsername(user);
        remoteSlaveServer.setPassword(passwd);
        return remoteSlaveServer;
    }

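    /**
     * Writes a Kettle job (.kjb) to disk: START -> transformation (extract to a
     * text file) -> shell (Doris Stream Load) -> success.
     */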
    private void generateJobFile(String extractType, DatasetTable datasetTable, String columnFeilds) throws Exception {
        String outFile = null;
        String jobName = null;
        String script = null;
        Datasource dorisDatasource = (Datasource) CommonBeanFactory.getBean("DorisDatasource");
        DorisConfigration dorisConfigration = new Gson().fromJson(dorisDatasource.getConfiguration(), DorisConfigration.class);
        String columns = columnFeilds + ",dataease_uuid";
        String transName = null;
        switch (extractType) {
            case "all_scope":
                // Full refresh: APPEND into the tmp table, which later replaces the live table
                transName = "trans_" + DorisTableUtils.dorisName(datasetTable.getId());
                outFile = DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTable.getId()));
                jobName = "job_" + DorisTableUtils.dorisName(datasetTable.getId());
                script = String.format(shellScript, dorisConfigration.getUsername(), dorisConfigration.getPassword(), String.valueOf(System.currentTimeMillis()), separator, columns, "APPEND", root_path + outFile + "." + extention, dorisConfigration.getHost(), dorisConfigration.getHttpPort(), dorisConfigration.getDataBase(), DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTable.getId())), root_path + outFile + "." + extention);
                break;
            case "incremental_add":
                // Incremental insert: APPEND directly into the live table
                transName = "trans_add_" + DorisTableUtils.dorisName(datasetTable.getId());
                outFile = DorisTableUtils.dorisAddName(datasetTable.getId());
                jobName = "job_add_" + DorisTableUtils.dorisName(datasetTable.getId());
                script = String.format(shellScript, dorisConfigration.getUsername(), dorisConfigration.getPassword(), String.valueOf(System.currentTimeMillis()), separator, columns, "APPEND", root_path + outFile + "." + extention, dorisConfigration.getHost(), dorisConfigration.getHttpPort(), dorisConfigration.getDataBase(), DorisTableUtils.dorisName(datasetTable.getId()), root_path + outFile + "." + extention);
                break;
            case "incremental_delete":
                // Incremental delete: stream load with merge_type DELETE
                transName = "trans_delete_" + DorisTableUtils.dorisName(datasetTable.getId());
                outFile = DorisTableUtils.dorisDeleteName(DorisTableUtils.dorisName(datasetTable.getId()));
                script = String.format(shellScript, dorisConfigration.getUsername(), dorisConfigration.getPassword(), String.valueOf(System.currentTimeMillis()), separator, columns, "DELETE", root_path + outFile + "." + extention, dorisConfigration.getHost(), dorisConfigration.getHttpPort(), dorisConfigration.getDataBase(), DorisTableUtils.dorisName(datasetTable.getId()), root_path + outFile + "." + extention);
                jobName = "job_delete_" + DorisTableUtils.dorisName(datasetTable.getId());
                break;
            default:
                break;
        }

        JobMeta jobMeta = new JobMeta();
        jobMeta.setName(jobName);

        // START entry
        JobEntrySpecial start = new JobEntrySpecial();
        start.setName("START");
        start.setStart(true);
        JobEntryCopy startEntry = new JobEntryCopy(start);
        startEntry.setDrawn(true);
        startEntry.setLocation(100, 100);
        jobMeta.addJobEntry(startEntry);

        // Transformation entry that produces the text file
        JobEntryTrans transrans = new JobEntryTrans();
        transrans.setTransname(transName);
        transrans.setName("Transformation");
        JobEntryCopy transEntry = new JobEntryCopy(transrans);
        transEntry.setDrawn(true);
        transEntry.setLocation(300, 100);
        jobMeta.addJobEntry(transEntry);

        jobMeta.addJobHop(new JobHopMeta(startEntry, transEntry));

        // Shell entry that stream-loads the file into Doris
        JobEntryShell shell = new JobEntryShell();
        shell.setScript(script);
        shell.insertScript = true;
        shell.setName("shell");
        JobEntryCopy shellEntry = new JobEntryCopy(shell);
        shellEntry.setDrawn(true);
        shellEntry.setLocation(500, 100);
        jobMeta.addJobEntry(shellEntry);

        JobHopMeta transHop = new JobHopMeta(transEntry, shellEntry);
        transHop.setEvaluation(true);
        jobMeta.addJobHop(transHop);

        // Success entry
        JobEntrySuccess success = new JobEntrySuccess();
        success.setName("Success");
        JobEntryCopy successEntry = new JobEntryCopy(success);
        successEntry.setDrawn(true);
        successEntry.setLocation(700, 100);
        jobMeta.addJobEntry(successEntry);

        JobHopMeta greenHop = new JobHopMeta(shellEntry, successEntry);
        greenHop.setEvaluation(true);
        jobMeta.addJobHop(greenHop);

        String jobXml = jobMeta.getXML();
        File file = new File(root_path + jobName + ".kjb");
        FileUtils.writeStringToFile(file, jobXml, "UTF-8");
    }

    private String fetchSqlField(String sql, Datasource ds) throws Exception {
        // Run the (wrapped) SQL once to discover the result fields, then map them
        // to Doris column names
        QueryProvider qp = ProviderFactory.getQueryProvider(ds.getType());
        DatasourceProvider datasourceProvider = ProviderFactory.getProvider(ds.getType());
        DatasourceRequest datasourceRequest = new DatasourceRequest();
        datasourceRequest.setDatasource(ds);
        datasourceRequest.setQuery(qp.wrapSql(sql));
        List<String> dorisFields = new ArrayList<>();
        datasourceProvider.fetchResultField(datasourceRequest).stream().map(TableFiled::getFieldName).forEach(field ->
                dorisFields.add(DorisTableUtils.columnName(field)));
        return String.join(",", dorisFields);
    }

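    /**
     * Writes a Kettle transformation (.ktr) to disk: a datasource-specific input
     * step, a UserDefinedJavaClass step that adds the dataease_uuid row hash, and
     * a text file output step.
     */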
    private void generateTransFile(String extractType, DatasetTable datasetTable, Datasource datasource, List<DatasetTableField> datasetTableFields, String selectSQL) throws Exception {
        TransMeta transMeta = new TransMeta();
        String outFile = null;
        DatasourceTypes datasourceType = DatasourceTypes.valueOf(datasource.getType());
        DatabaseMeta dataMeta = null;
        StepMeta inputStep = null;
        StepMeta outputStep = null;
        StepMeta udjcStep = null;
        TransHopMeta hi1 = null;
        TransHopMeta hi2 = null;
        String transName = null;

        switch (datasourceType) {
            case mysql:
                MysqlConfigration mysqlConfigration = new Gson().fromJson(datasource.getConfiguration(), MysqlConfigration.class);
                dataMeta = new DatabaseMeta("db", "MYSQL", "Native", mysqlConfigration.getHost(), mysqlConfigration.getDataBase(), mysqlConfigration.getPort().toString(), mysqlConfigration.getUsername(), mysqlConfigration.getPassword());
                dataMeta.addExtraOption("MYSQL", "characterEncoding", "UTF-8");
                transMeta.addDatabase(dataMeta);
                selectSQL = getSelectSQL(extractType, datasetTable, datasource, datasetTableFields, selectSQL);
                inputStep = inputStep(transMeta, selectSQL);
                udjcStep = udjc(datasetTableFields, DatasourceTypes.mysql);
                break;
            case sqlServer:
                SqlServerConfigration sqlServerConfigration = new Gson().fromJson(datasource.getConfiguration(), SqlServerConfigration.class);
                dataMeta = new DatabaseMeta("db", "MSSQLNATIVE", "Native", sqlServerConfigration.getHost(), sqlServerConfigration.getDataBase(), sqlServerConfigration.getPort().toString(), sqlServerConfigration.getUsername(), sqlServerConfigration.getPassword());
                transMeta.addDatabase(dataMeta);
                selectSQL = getSelectSQL(extractType, datasetTable, datasource, datasetTableFields, selectSQL);
                inputStep = inputStep(transMeta, selectSQL);
                udjcStep = udjc(datasetTableFields, DatasourceTypes.sqlServer);
                break;
            case oracle:
                OracleConfigration oracleConfigration = new Gson().fromJson(datasource.getConfiguration(), OracleConfigration.class);
                if (oracleConfigration.getConnectionType().equalsIgnoreCase("serviceName")) {
                    // Service-name connections pass a full TNS descriptor as the "database"
                    String database = "(DESCRIPTION =(ADDRESS = (PROTOCOL = TCP)(HOST = ORACLE_HOSTNAME)(PORT = ORACLE_PORT))(CONNECT_DATA = (SERVER = DEDICATED)(SERVICE_NAME = ORACLE_SERVICE_NAME )))".replace("ORACLE_HOSTNAME", oracleConfigration.getHost()).replace("ORACLE_PORT", oracleConfigration.getPort().toString()).replace("ORACLE_SERVICE_NAME", oracleConfigration.getDataBase());
                    dataMeta = new DatabaseMeta("db", "ORACLE", "Native", "", database, "-1", oracleConfigration.getUsername(), oracleConfigration.getPassword());
                } else {
                    dataMeta = new DatabaseMeta("db", "ORACLE", "Native", oracleConfigration.getHost(), oracleConfigration.getDataBase(), oracleConfigration.getPort().toString(), oracleConfigration.getUsername(), oracleConfigration.getPassword());
                }
                transMeta.addDatabase(dataMeta);

                selectSQL = getSelectSQL(extractType, datasetTable, datasource, datasetTableFields, selectSQL);
                inputStep = inputStep(transMeta, selectSQL);
                udjcStep = udjc(datasetTableFields, DatasourceTypes.oracle);
                break;
            case excel:
                String filePath = new Gson().fromJson(datasetTable.getInfo(), DataTableInfoDTO.class).getData();
                inputStep = excelInputStep(filePath, datasetTableFields);
                udjcStep = udjc(datasetTableFields, DatasourceTypes.excel);
                break;
            default:
                break;
        }

        switch (extractType) {
            case "all_scope":
                transName = "trans_" + DorisTableUtils.dorisName(datasetTable.getId());
                outFile = DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(datasetTable.getId()));
                transMeta.setName(transName);
                break;
            case "incremental_add":
                transName = "trans_add_" + DorisTableUtils.dorisName(datasetTable.getId());
                outFile = DorisTableUtils.dorisAddName(datasetTable.getId());
                transMeta.setName(transName);
                break;
            case "incremental_delete":
                transName = "trans_delete_" + DorisTableUtils.dorisName(datasetTable.getId());
                outFile = DorisTableUtils.dorisDeleteName(DorisTableUtils.dorisName(datasetTable.getId()));
                transMeta.setName(transName);
                break;
            default:
                break;
        }

        // Wire input -> UDJC (row hashing) -> text file output
        outputStep = outputStep(outFile);
        hi1 = new TransHopMeta(inputStep, udjcStep);
        hi2 = new TransHopMeta(udjcStep, outputStep);
        transMeta.addTransHop(hi1);
        transMeta.addTransHop(hi2);
        transMeta.addStep(inputStep);
        transMeta.addStep(udjcStep);
        transMeta.addStep(outputStep);

        String transXml = transMeta.getXML();
        File file = new File(root_path + transName + ".ktr");
        FileUtils.writeStringToFile(file, transXml, "UTF-8");
    }

    private String getSelectSQL(String extractType, DatasetTable datasetTable, Datasource datasource, List<DatasetTableField> datasetTableFields, String selectSQL) {
        if (extractType.equalsIgnoreCase("all_scope") && datasetTable.getType().equalsIgnoreCase("db")) {
            String tableName = new Gson().fromJson(datasetTable.getInfo(), DataTableInfoDTO.class).getTable();
            QueryProvider qp = ProviderFactory.getQueryProvider(datasource.getType());
            selectSQL = qp.createRawQuerySQL(tableName, datasetTableFields);
        }

        if (extractType.equalsIgnoreCase("all_scope") && datasetTable.getType().equalsIgnoreCase("sql")) {
            selectSQL = new Gson().fromJson(datasetTable.getInfo(), DataTableInfoDTO.class).getSql();
            QueryProvider qp = ProviderFactory.getQueryProvider(datasource.getType());
            selectSQL = qp.createRawQuerySQLAsTmp(selectSQL, datasetTableFields);
        }
        if (!extractType.equalsIgnoreCase("all_scope")) {
            QueryProvider qp = ProviderFactory.getQueryProvider(datasource.getType());
            selectSQL = qp.createRawQuerySQLAsTmp(selectSQL, datasetTableFields);
        }
        return selectSQL;
    }

    private StepMeta inputStep(TransMeta transMeta, String selectSQL) {
        TableInputMeta tableInput = new TableInputMeta();
        DatabaseMeta database = transMeta.findDatabase("db");
        tableInput.setDatabaseMeta(database);
        tableInput.setSQL(selectSQL);
        StepMeta fromStep = new StepMeta("TableInput", "Data Input", tableInput);
        fromStep.setDraw(true);
        fromStep.setLocation(100, 100);
        return fromStep;
    }

    private StepMeta excelInputStep(String filePath, List<DatasetTableField> datasetTableFields) {
        String suffix = filePath.substring(filePath.lastIndexOf(".") + 1);
        ExcelInputMeta excelInputMeta = new ExcelInputMeta();
        if (StringUtils.equalsIgnoreCase(suffix, "xlsx")) {
            excelInputMeta.setSpreadSheetType(SpreadSheetType.SAX_POI);
            try (InputStream inputStream = new FileInputStream(filePath);
                 XSSFWorkbook xssfWorkbook = new XSSFWorkbook(inputStream)) {
                XSSFSheet sheet0 = xssfWorkbook.getSheetAt(0);
                excelInputMeta.setSheetName(new String[]{sheet0.getSheetName()});
            } catch (Exception e) {
                e.printStackTrace();
            }
        }
        if (StringUtils.equalsIgnoreCase(suffix, "xls")) {
            excelInputMeta.setSpreadSheetType(SpreadSheetType.JXL);
            try (InputStream inputStream = new FileInputStream(filePath);
                 HSSFWorkbook workbook = new HSSFWorkbook(inputStream)) {
                HSSFSheet sheet0 = workbook.getSheetAt(0);
                excelInputMeta.setSheetName(new String[]{sheet0.getSheetName()});
            } catch (Exception e) {
                e.printStackTrace();
            }
        }
        excelInputMeta.setPassword("Encrypted");
        excelInputMeta.setFileName(new String[]{filePath});
        excelInputMeta.setStartsWithHeader(true);
        excelInputMeta.setIgnoreEmptyRows(true);
        ExcelInputField[] fields = new ExcelInputField[datasetTableFields.size()];
        for (int i = 0; i < datasetTableFields.size(); i++) {
            ExcelInputField field = new ExcelInputField();
            field.setName(datasetTableFields.get(i).getOriginName());
            // All columns are read as strings; time columns additionally carry a date format
            if (datasetTableFields.get(i).getDeExtractType() == 1) {
                field.setType("String");
                field.setFormat("yyyy-MM-dd HH:mm:ss");
            } else {
                field.setType("String");
            }
            fields[i] = field;
        }

        excelInputMeta.setField(fields);
        StepMeta fromStep = new StepMeta("ExcelInput", "Data Input", excelInputMeta);
        fromStep.setDraw(true);
        fromStep.setLocation(100, 100);
        return fromStep;
    }

    private StepMeta outputStep(String dorisOutputTable) {
        TextFileOutputMeta textFileOutputMeta = new TextFileOutputMeta();
        textFileOutputMeta.setEncoding("UTF-8");
        textFileOutputMeta.setHeaderEnabled(false);
        textFileOutputMeta.setFilename(root_path + dorisOutputTable);
        textFileOutputMeta.setSeparator(separator);
        textFileOutputMeta.setExtension(extention);
        textFileOutputMeta.setOutputFields(new TextFileField[0]);
        StepMeta outputStep = new StepMeta("TextFileOutput", "TextFileOutput", textFileOutputMeta);
        outputStep.setLocation(600, 100);
        outputStep.setDraw(true);
        return outputStep;
    }

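    /**
     * Builds the UserDefinedJavaClass step from the "code" template: per row it
     * cleans line breaks, optionally normalizes Excel numeric strings, and emits
     * an MD5 hash of the concatenated column values as dataease_uuid.
     */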
    private StepMeta udjc(List<DatasetTableField> datasetTableFields, DatasourceTypes datasourceType) {
        String needToChangeColumnType = "";

        UserDefinedJavaClassMeta userDefinedJavaClassMeta = new UserDefinedJavaClassMeta();
        List<UserDefinedJavaClassMeta.FieldInfo> fields = new ArrayList<>();
        UserDefinedJavaClassMeta.FieldInfo fieldInfo = new UserDefinedJavaClassMeta.FieldInfo("dataease_uuid", ValueMetaInterface.TYPE_STRING, -1, -1);
        fields.add(fieldInfo);
        userDefinedJavaClassMeta.setFieldInfo(fields);
        List<UserDefinedJavaClassDef> definitions = new ArrayList<>();
        // Instantiate the class template: splice in the column-handling snippets
        // and the comma-separated column list
        String tmp_code = code.replace("alterColumnTypeCode", needToChangeColumnType);

        tmp_code = tmp_code.replace("handleWraps", handleWraps);
        String Column_Fields;
        if (datasourceType.equals(DatasourceTypes.excel) || datasourceType.equals(DatasourceTypes.oracle)) {
            Column_Fields = String.join(",", datasetTableFields.stream().map(DatasetTableField::getOriginName).collect(Collectors.toList()));
        } else {
            Column_Fields = String.join(",", datasetTableFields.stream().map(DatasetTableField::getDataeaseName).collect(Collectors.toList()));
        }
        if (datasourceType.equals(DatasourceTypes.excel)) {
            tmp_code = tmp_code.replace("handleExcelIntColumn", handleExcelIntColumn).replace("Column_Fields", Column_Fields);
        } else {
            tmp_code = tmp_code.replace("handleExcelIntColumn", "").replace("Column_Fields", Column_Fields);
        }
        UserDefinedJavaClassDef userDefinedJavaClassDef = new UserDefinedJavaClassDef(UserDefinedJavaClassDef.ClassType.TRANSFORM_CLASS, "Processor", tmp_code);

        userDefinedJavaClassDef.setActive(true);
        definitions.add(userDefinedJavaClassDef);
        userDefinedJavaClassMeta.replaceDefinitions(definitions);

        StepMeta userDefinedJavaClassStep = new StepMeta("UserDefinedJavaClass", "UserDefinedJavaClass", userDefinedJavaClassMeta);
        userDefinedJavaClassStep.setLocation(300, 100);
        userDefinedJavaClassStep.setDraw(true);
        return userDefinedJavaClassStep;
    }

    public void deleteFile(String type, String dataSetTableId) {
        String transName = null;
        String jobName = null;
        String fileName = null;

        switch (type) {
            case "all_scope":
                transName = "trans_" + DorisTableUtils.dorisName(dataSetTableId);
                jobName = "job_" + DorisTableUtils.dorisName(dataSetTableId);
                // Must match the outFile naming used in generateTransFile/generateJobFile
                fileName = DorisTableUtils.dorisTmpName(DorisTableUtils.dorisName(dataSetTableId));
                break;
            case "incremental_add":
                transName = "trans_add_" + DorisTableUtils.dorisName(dataSetTableId);
                jobName = "job_add_" + DorisTableUtils.dorisName(dataSetTableId);
                fileName = DorisTableUtils.dorisAddName(dataSetTableId);
                break;
            case "incremental_delete":
                transName = "trans_delete_" + DorisTableUtils.dorisName(dataSetTableId);
                jobName = "job_delete_" + DorisTableUtils.dorisName(dataSetTableId);
                fileName = DorisTableUtils.dorisDeleteName(DorisTableUtils.dorisName(dataSetTableId));
                break;
            default:
                break;
        }
        FileUtils.deleteQuietly(new File(root_path + fileName + "." + extention));
        FileUtils.deleteQuietly(new File(root_path + jobName + ".kjb"));
        FileUtils.deleteQuietly(new File(root_path + transName + ".ktr"));
    }

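    /**
     * Health check for the remote Carte server: verifies the host is reachable
     * and its HTTP endpoint answers with a non-error status.
     */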
    public boolean isKettleRunning() {
        try {
            if (!InetAddress.getByName(carte).isReachable(1000)) {
                return false;
            }
        } catch (Exception e) {
            return false;
        }

        // Probe the Carte status page with the configured credentials
        HttpGet getMethod = new HttpGet("http://" + carte + ":" + port);
        HttpClientManager.HttpClientBuilderFacade clientBuilder = HttpClientManager.getInstance().createBuilder();
        clientBuilder.setConnectionTimeout(1);
        clientBuilder.setCredentials(user, passwd);
        CloseableHttpClient httpClient = clientBuilder.build();
        try {
            HttpResponse httpResponse = httpClient.execute(getMethod);
            int statusCode = httpResponse.getStatusLine().getStatusCode();
            if (statusCode != -1 && statusCode < 400) {
                httpResponse.getEntity().getContent().close();
                return true;
            } else {
                return false;
            }
        } catch (Exception e) {
            return false;
        }
    }

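    // ---- Code templates for the UserDefinedJavaClass step ----
    // The placeholders handleWraps / alterColumnTypeCode / handleExcelIntColumn /
    // Column_Fields in "code" are substituted in udjc() before the class is compiled.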
    // "FILED" is replaced with a concrete column name when a boolean column must
    // be converted to 0/1.
    private static final String alterColumnTypeCode = "    if(\"FILED\".equalsIgnoreCase(filed)){\n" +
            "        if(tmp != null && tmp.equalsIgnoreCase(\"Y\")){\n" +
            "            get(Fields.Out, filed).setValue(r, 1);\n" +
            "            get(Fields.Out, filed).getValueMeta().setType(2);\n" +
            "        }else{\n" +
            "            get(Fields.Out, filed).setValue(r, 0);\n" +
            "            get(Fields.Out, filed).getValueMeta().setType(2);\n" +
            "        }\n" +
            "    }\n";

    // Normalizes Excel numeric strings like "42.0" to the integer "42"
    private static final String handleExcelIntColumn = "        if(tmp != null && tmp.endsWith(\".0\")){\n" +
            "            try {\n" +
            "                Long.valueOf(tmp.substring(0, tmp.length()-2));\n" +
            "                get(Fields.Out, filed).setValue(r, tmp.substring(0, tmp.length()-2));\n" +
            "                get(Fields.Out, filed).getValueMeta().setType(2);\n" +
            "            }catch (Exception e){}\n" +
            "        }";

    // Replaces carriage returns and line feeds, which would break the separator-delimited output file
    private static final String handleWraps = "        if(tmp != null && ( tmp.contains(\"\\r\") || tmp.contains(\"\\n\"))){\n" +
            "            tmp = tmp.trim();\n" +
            "            tmp = tmp.replaceAll(\"\\r\",\" \");\n" +
            "            tmp = tmp.replaceAll(\"\\n\",\" \");\n" +
            "            get(Fields.Out, filed).setValue(r, tmp);\n" +
            "        } ";

    // UDJC row-processing template: concatenates all column values and emits
    // their MD5 hash as the dataease_uuid column
    private static final String code = "import org.pentaho.di.core.row.ValueMetaInterface;\n" +
            "import java.util.List;\n" +
            "import java.io.File;\n" +
            "import java.security.MessageDigest;\n" +
            "import java.util.ArrayList;\n" +
            "import java.util.Arrays;\n" +
            "import java.util.concurrent.ExecutorService;\n" +
            "import java.util.concurrent.Executors;\n" +
            "import org.pentaho.di.core.util.StringUtil;\n" +
            "\n" +
            "public boolean processRow(StepMetaInterface smi, StepDataInterface sdi) throws KettleException {\n" +
            "    if (first) {\n" +
            "        first = false;\n" +
            "    }\n" +
            "\n" +
            "    Object[] r = getRow();\n" +
            "\n" +
            "    if (r == null) {\n" +
            "        setOutputDone();\n" +
            "        return false;\n" +
            "    }\n" +
            "\n" +
            "    r = createOutputRow(r, data.outputRowMeta.size());\n" +
            "    String str = \"\";\n" +
            "\n" +
            "    List<String> fileds = Arrays.asList(\"Column_Fields\".split(\",\"));\n" +
            "    for (String filed : fileds) {\n" +
            "        String tmp = get(Fields.In, filed).getString(r);\n" +
            "handleWraps \n" +
            "alterColumnTypeCode \n" +
            "handleExcelIntColumn \n" +
            "        str = str + tmp;\n" +
            "    }\n" +
            "\n" +
            "    String md5 = md5(str);\n" +
            "    get(Fields.Out, \"dataease_uuid\").setValue(r, md5);\n" +
            "\n" +
            "    putRow(data.outputRowMeta, r);\n" +
            "\n" +
            "    return true;\n" +
            "}\n" +
            "\n" +
            "    private static final char[] HEX_DIGITS = {'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'a', 'b', 'c', 'd', 'e', 'f'};\n" +
            "    private static final String UTF_8 = \"UTF-8\";\n" +
            "    public static String md5(String src) {\n" +
            "        return md5(src, UTF_8);\n" +
            "    }\n" +
            "    public static String md5(String src, String charset) {\n" +
            "        try {\n" +
            "            byte[] strTemp = charset == null || charset.equals(\"\") ? src.getBytes() : src.getBytes(charset);\n" +
            "            MessageDigest mdTemp = MessageDigest.getInstance(\"MD5\");\n" +
            "            mdTemp.update(strTemp);\n" +
            "\n" +
            "            byte[] md = mdTemp.digest();\n" +
            "            int j = md.length;\n" +
            "            char[] str = new char[j * 2];\n" +
            "            int k = 0;\n" +
            "\n" +
            "            for (byte byte0 : md) {\n" +
            "                str[k++] = HEX_DIGITS[byte0 >>> 4 & 0xf];\n" +
            "                str[k++] = HEX_DIGITS[byte0 & 0xf];\n" +
            "            }\n" +
            "\n" +
            "            return new String(str);\n" +
            "        } catch (Exception e) {\n" +
            "            throw new RuntimeException(\"MD5 encrypt error:\", e);\n" +
            "        }\n" +
            "    }\n" +
            "\n" +
            "    public String generateStr(int size, String[] d ){\n" +
            "        String str = \"\";\n" +
            "        for(int i=0;i<size;i++){\n" +
            "            str = str + d[i];\n" +
            "        }\n" +
            "        return str;\n" +
            "    }";
}