1. 版本
Ubuntu 20.04
JDK 1.8
Kettle 8.3
2.下載Kettle 8.3
https://sourceforge.net/projects/pentaho/files/Pentaho%208.3/client-tools/pdi-ce-8.3.0.0-371.zip/download
3. 安裝JDK 1.8 (如已安裝可忽略)
4.解壓 pdi-ce-8.3.0.0-371.zip
mkdir /usr/local/kettle
cd /usr/local/kettle/
unzip ~/Downloads/pdi-ce-8.3.0.0-371.zip
wget http://li.nux.ro/download/nux/dextop/el7/x86_64/nux-dextop-release-0-5.el7.nux.noarch.rpm
sudo alien nux-dextop-release-0-5.el7.nux.noarch.rpm #將rpm轉換為deb,完成後會生成對應的.deb檔(檔名為 nux-dextop-release_0-6_all.deb)
sudo dpkg -i nux-dextop-release_0-6_all.deb #安裝
sudo nano /etc/apt/sources.list
deb http://cz.archive.ubuntu.com/ubuntu bionic main universe # 將此條目添加到文件並保存
sudo apt-get update
sudo apt-get install libwebkitgtk-1.0-0 # 安裝libwebkitgtk
sudo apt-get install libcanberra-gtk-module
5. 運行
rm -rf /usr/local/kettle/data-integration/system/karaf/caches
rm -rf /usr/local/kettle/data-integration/system/karaf/data
/usr/local/kettle/data-integration/spoon.sh
6. 連接hadoop集群前準備配置文件
cp /usr/local/hadoop/etc/hadoop/core-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hadoop/etc/hadoop/hdfs-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hadoop/etc/hadoop/mapred-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hadoop/etc/hadoop/yarn-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hive/conf/hive-site.xml /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/
cp /usr/local/hive/jdbc/hive-jdbc-3.1.2-standalone.jar /usr/local/kettle/data-integration/lib
cp /usr/local/hive/jdbc/hive-jdbc-3.1.2-standalone.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
cp ~/Downloads/mysql-connector-java-8.0.27/mysql-connector-java-8.0.27.jar /usr/local/kettle/data-integration/lib
cp ~/Downloads/mysql-connector-java-8.0.27/mysql-connector-java-8.0.27.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
cp /usr/local/hive/lib/hive*.jar /usr/local/kettle/data-integration/lib
cp /usr/local/hive/lib/hive*.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
cp /usr/local/hive/lib/http*.jar /usr/local/kettle/data-integration/lib/
cp /usr/local/hive/lib/http*.jar /usr/local/kettle/data-integration/plugins/pentaho-big-data-plugin/hadoop-configurations/mapr60/lib
7.連接hadoop集群(pending)
8. 連接hive