1. 版本
Ubuntu 20.04
JDK 1.8
Kettle 8.3
2.下载Kettle 8.3
https://sourceforge.net/projects/pentaho/files/Pentaho%208.3/client-tools/pdi-ce-8.3.0.0-371.zip/download
3. 安装JDK 1.8 (如已安装可忽略)
4.解压 pdi-ce-8.3.0.0-371.zip
mkdir /usr/local/kettle
cd /usr/local/kettle/
unzip ~/Downloads/pdi-ce-8.3.0.0-371.zip
wget http://li.nux.ro/download/nux/dextop/el7/x86_64/nux-dextop-release-0-5.el7.nux.noarch.rpm
sudo alien nux-dextop-release-0-5.el7.nux.noarch.rpm # 将rpm转换为deb,完成后会生成对应的deb文件(nux-dextop-release_0-6_all.deb)
sudo dpkg -i nux-dextop-release_0-6_all.deb #安装
sudo nano /etc/apt/sources.list
deb http://cz.archive.ubuntu.com/ubuntu bionic main universe # 将此条目添加到文件并保存
sudo apt-get update
sudo apt-get install libwebkitgtk-1.0-0 # 安装libwebkitgtk
sudo apt-get install libcanberra-gtk-module
5. 运行
rm -rf /usr/local/kettle/data-integration/system/karaf/caches
rm -rf /usr/local/kettle/data-integration/system/karaf/data
/usr/local/kettle/data-integration/spoon.sh
6. 连接hadoop集群前准备配置文件
cp /usr/local/hadoop/etc/hadoop/core-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hadoop/etc/hadoop/hdfs-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hadoop/etc/hadoop/mapred-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hadoop/etc/hadoop/yarn-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hive/conf/hive-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hive/jdbc/hive-jdbc-3.1.2-standalone.jar /usr/local/kettle/data-integration/lib
cp /usr/local/hive/jdbc/hive-jdbc-3.1.2-standalone.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
cp ~/Downloads/mysql-connector-java-8.0.27/mysql-connector-java-8.0.27.jar /usr/local/kettle/data-integration/lib
cp ~/Downloads/mysql-connector-java-8.0.27/mysql-connector-java-8.0.27.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
cp /usr/local/hive/lib/hive*.jar /usr/local/kettle/data-integration/lib
cp /usr/local/hive/lib/hive*.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
cp /usr/local/hive/lib/http*.jar /usr/local/kettle/data-integration/lib/
cp /usr/local/hive/lib/http*.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
7.连接hadoop集群(pending)
8. 连接hive
