使用Kettle API实现数据的迁移

利用kettle的api,将一个数据源中的信息导入到另外一个数据源中:

package cn.com.saidi.job;
 
import org.apache.commons.io.FileUtils;
import org.pentaho.di.core.KettleEnvironment;
import org.pentaho.di.core.database.DatabaseMeta;
import org.pentaho.di.core.exception.KettleDatabaseException;
import org.pentaho.di.core.exception.KettleXMLException;
import org.pentaho.di.core.plugins.PluginRegistry;
import org.pentaho.di.core.plugins.StepPluginType;
import org.pentaho.di.trans.TransHopMeta;
import org.pentaho.di.trans.TransMeta;
import org.pentaho.di.trans.step.StepMeta;
import org.pentaho.di.trans.steps.insertupdate.InsertUpdateMeta;
import org.pentaho.di.trans.steps.tableinput.TableInputMeta;
 
import java.io.File;

/**
 * Demo that builds a two-step Kettle transformation in code and saves its XML
 * to a .ktr file. The first step is a table input, the second is an
 * insert/update step; a hop connects them.
 */
public class TransDemo {

	/** Instance created by {@link #main(String[])}. */
	public static TransDemo transDemo;

	/** Table read by the table-input step through the "bjdt" connection. */
	public static String bjdt_tablename = "test1";
	/** Table written by the insert/update step through the "kettle" connection. */
	public static String kettle_tablename = "test2";

	/**
	 * Database connection definitions as XML, the form accepted by the
	 * {@code DatabaseMeta(String xml)} constructor. The {@code <name>} of each
	 * entry is what {@link #generateMyOwnTrans()} looks the connection up by.
	 */
	public static final String[] databasesXML = {

			"<?xml version=\"1.0\" encoding=\"UTF-8\"?>" +
					"<connection>" +
					"<name>bjdt</name>" +
					"<server>192.168.1.122</server>" +
					"<type>Mysql</type>" +
					"<access>Native</access>" +
					"<database>daiqiaobing</database>" +
					"<port>3306</port>" +
					"<username>root</username>" +
					"<password>root</password>" +
					"</connection>",
			"<?xml version=\"1.0\" encoding=\"UTF-8\"?>" +
					"<connection>" +
					"<name>kettle</name>" +
					"<server>192.168.1.122</server>" +
					"<type>Mysql</type>" +
					"<access>Native</access>" +
					"<database>daiqiaobing</database>" +
					"<port>3306</port>" +
					"<username>root</username>" +
					"<password>root</password>" +
					"</connection>"

	};

	/**
	 * Initialises Kettle, generates the transformation and writes its XML to
	 * {@code etl/update_insert_Trans.ktr}. Any failure is reported by printing
	 * the stack trace.
	 *
	 * @param args command-line arguments (unused)
	 */
	public static void main(String[] args) {
		try {
			KettleEnvironment.init();
			transDemo = new TransDemo();
			TransMeta transMeta = transDemo.generateMyOwnTrans();
			String transXml = transMeta.getXML();
			File file = new File("etl/update_insert_Trans.ktr");
			FileUtils.writeStringToFile(file, transXml, "UTF-8");
			// NOTE(review): this echoes the connection XML, including the
			// username/password entries, to standard output.
			System.out.println(databasesXML.length+"\n"+databasesXML[0]+"\n"+databasesXML[1]);
		} catch (Exception e) {
			e.printStackTrace();
		}
	}

	/**
	 * Builds a transformation that moves data from one database to another.
	 * It has exactly two steps: a table input followed by an insert/update.
	 *
	 * @return the assembled transformation metadata
	 * @throws KettleXMLException propagated from parsing an entry of {@link #databasesXML}
	 * @throws KettleDatabaseException if the "bjdt" or "kettle" connection is not
	 *         registered on the transformation
	 */
	public TransMeta generateMyOwnTrans() throws KettleXMLException, KettleDatabaseException {
		System.out.println("************start to generate my own transformation***********");
		TransMeta transMeta = new TransMeta();
		// Name of the transformation.
		transMeta.setName("insert_update");
		// Register every configured database connection on the transformation.
		for (String connectionXml : databasesXML) {
			transMeta.addDatabase(new DatabaseMeta(connectionXml));
		}
		// The registry supplies the plugin id each step is created with.
		PluginRegistry registry = PluginRegistry.getInstance();

		StepMeta tableInputStep = buildTableInputStep(transMeta, registry);
		transMeta.addStep(tableInputStep);

		StepMeta insertUpdateStep = buildInsertUpdateStep(transMeta, registry);
		transMeta.addStep(insertUpdateStep);

		// The hop links the two steps together.
		transMeta.addTransHop(new TransHopMeta(tableInputStep, insertUpdateStep));
		System.out.println("***********the end************");
		return transMeta;
	}

	/** Creates the table-input step that selects {@code name} from the source table. */
	private StepMeta buildTableInputStep(TransMeta transMeta, PluginRegistry registry)
			throws KettleDatabaseException {
		TableInputMeta tableInput = new TableInputMeta();
		String pluginId = registry.getPluginId(StepPluginType.class, tableInput);
		tableInput.setDatabaseMeta(requireDatabase(transMeta, "bjdt"));
		tableInput.setSQL("SELECT name  FROM "+bjdt_tablename);

		StepMeta step = new StepMeta(pluginId,"table input",tableInput);
		// Position at which the step is drawn in the Spoon tool.
		step.setDraw(true);
		step.setLocation(100, 100);
		return step;
	}

	/** Creates the insert/update step that writes {@code name} into the target table. */
	private StepMeta buildInsertUpdateStep(TransMeta transMeta, PluginRegistry registry)
			throws KettleDatabaseException {
		InsertUpdateMeta insertUpdate = new InsertUpdateMeta();
		String pluginId = registry.getPluginId(StepPluginType.class,insertUpdate);
		insertUpdate.setDatabaseMeta(requireDatabase(transMeta, "kettle"));
		// Table the step operates on.
		insertUpdate.setTableName(kettle_tablename);
		// Lookup key: table column "name" compared with stream field "name" using "=".
		insertUpdate.setKeyLookup(new String[]{"name"});
		insertUpdate.setKeyStream(new String[]{"name"});
		// The original author notes this must be set even though it is empty;
		// presumably the step expects one entry per key -- confirm against Kettle.
		insertUpdate.setKeyStream2(new String[]{""});
		insertUpdate.setKeyCondition(new String[]{"="});

		// Fields to update: table column "name" from stream field "name", update enabled.
		insertUpdate.setUpdateLookup(new String[]{"name"});
		insertUpdate.setUpdateStream(new String[]{"name"});
		insertUpdate.setUpdate(new Boolean[]{true});

		StepMeta step = new StepMeta(pluginId,"insert_update",insertUpdate);
		step.setDraw(true);
		step.setLocation(250,100);
		return step;
	}

	/**
	 * Looks up a registered connection by name and fails fast when it is absent,
	 * so a step is never configured with a null connection.
	 */
	private static DatabaseMeta requireDatabase(TransMeta transMeta, String name)
			throws KettleDatabaseException {
		DatabaseMeta databaseMeta = transMeta.findDatabase(name);
		if (databaseMeta == null) {
			throw new KettleDatabaseException(
					"Database connection '" + name + "' is not defined in databasesXML");
		}
		return databaseMeta;
	}

}

上述代码会生成一个ktr文件,接下来加载该ktr文件并执行其中定义的转换:

/**
 * Loads the previously generated .ktr file and runs the transformation it
 * defines, printing a failure message when the run reports errors.
 *
 * @param args command-line arguments (unused)
 * @throws KettleException propagated from the Kettle calls below
 */
public static void main(String[] args) throws KettleException {
		// Initialise the Kettle environment before any other Kettle call.
		KettleEnvironment.init();

		// Build the transformation metadata from the saved .ktr file.
		final String ktrPath = "etl/update_insert_Trans.ktr";
		TransMeta transformationMeta = new TransMeta(ktrPath);

		// Prepare with no arguments, start the run, then wait for it to finish.
		Trans runner = new Trans(transformationMeta);
		runner.prepareExecution(null);
		runner.startThreads();
		runner.waitUntilFinished();

		// A non-zero error count is reported as a failed run.
		boolean failed = runner.getErrors() != 0;
		if (failed) {
			System.out.println("执行失败!");
		}
	}

猜你喜欢

转载自blog.csdn.net/kone0611/article/details/83650883