一、MySQL 配置
1. 清除原有 MariaDB
# Remove any existing MariaDB packages before installing MySQL.
# The pattern is quoted so the shell hands it to apt unchanged: unquoted, zsh
# aborts with "no matches found" and bash may expand it against local files.
sudo apt remove --purge 'mariadb-*' --fix-missing
sudo apt autoremove -y
# WARNING: the next two commands permanently delete all existing database
# data and server configuration. Back up anything you need first.
sudo rm -rf /var/lib/mysql/
sudo rm -rf /etc/mysql/
2. 下载并安装 MySQL
# Download the mysql-apt-config package and install it with dpkg.
mysql_apt_deb=mysql-apt-config_0.8.33-1_all.deb
sudo wget "https://repo.mysql.com//${mysql_apt_deb}"
sudo dpkg --install "${mysql_apt_deb}"
# Refresh the package lists, then install the MySQL server package.
sudo apt update
sudo apt install --fix-missing mysql-community-server
3. 启动服务并创建 Hive 元数据库和用户
# Enable the mysql unit at boot and start it right away in one step.
sudo systemctl enable --now mysql
# Open a MySQL shell as root; -p prompts for the password.
sudo mysql --user=root -p
-- Run these statements at the mysql> prompt opened by the previous command.
-- IF NOT EXISTS keeps the step re-runnable when the guide is repeated.
-- Database that will hold the Hive metastore (named in the JDBC URL in hive-site.xml).
CREATE DATABASE IF NOT EXISTS hive_metastore;
-- Account Hive connects with. The user name and password must match
-- javax.jdo.option.ConnectionUserName / ConnectionPassword in hive-site.xml.
-- '123' is only suitable for a local sandbox; if you change it, change both places.
CREATE USER IF NOT EXISTS 'hiveuser'@'localhost' IDENTIFIED BY '123';
-- Limit the account to the metastore database only.
GRANT ALL PRIVILEGES ON hive_metastore.* TO 'hiveuser'@'localhost';
FLUSH PRIVILEGES;
EXIT;
二、Hive 配置
1. 下载解压 Hive
# Download and unpack Hive under /soft so the result is /soft/hive-4.0.1,
# the path exported as HIVE_HOME in the next step.
sudo mkdir -p /soft
cd /soft
sudo wget https://dlcdn.apache.org/hive/hive-4.0.1/apache-hive-4.0.1-bin.tar.gz
sudo tar -xzvf apache-hive-4.0.1-bin.tar.gz
# The archive was unpacked with sudo, so the rename needs sudo as well.
sudo mv apache-hive-4.0.1-bin hive-4.0.1
# Hand the tree to the current user: the later steps write into conf/ and
# lib/ without sudo.
sudo chown -R "$(id -un):$(id -gn)" hive-4.0.1
2. 配置环境变量
# Append the Hive environment settings to the zsh startup file in one write.
# Single quotes keep $PATH and $HIVE_HOME literal so they are expanded when
# the file is sourced, not now.
printf '%s\n' \
  'export HIVE_HOME=/soft/hive-4.0.1' \
  'export PATH=$PATH:$HIVE_HOME/bin' >> ~/.zshrc
# Load the new settings into the current shell session.
source ~/.zshrc
3. 配置 hive-site.xml 和 hive-env.sh
# Create hive-site.xml and hive-env.sh inside Hive's conf directory.
# ${HIVE_HOME:?} makes the cd fail with a message when HIVE_HOME is unset,
# instead of silently changing to /conf.
cd "${HIVE_HOME:?HIVE_HOME is not set}/conf"
# hive-site.xml is written from scratch: copying hive-default.xml.template
# first is pointless because the redirection below replaces the whole file.
# The quoted 'EOF' delimiter writes the content literally, with no shell expansion.
cat > hive-site.xml <<'EOF'
<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<configuration>
<!-- 连接元数据库的配置 -->
<property>
<name>javax.jdo.option.ConnectionURL</name>
<value>jdbc:mysql://localhost:3306/hive_metastore?createDatabaseIfNotExist=true</value>
<description>JDBC connect string for a JDBC metastore</description>
</property>
<property>
<name>javax.jdo.option.ConnectionDriverName</name>
<value>com.mysql.cj.jdbc.Driver</value>
<description>Driver class name for a JDBC metastore</description>
</property>
<property>
<name>javax.jdo.option.ConnectionUserName</name>
<value>hiveuser</value>
<description>Username to use against metastore database</description>
</property>
<property>
<name>javax.jdo.option.ConnectionPassword</name>
<value>123</value>
<description>Password to use against metastore database</description>
</property>
<!-- Hive数据在HDFS上的存储路径 -->
<property>
<name>hive.metastore.warehouse.dir</name>
<value>/user/hive/warehouse</value>
<description>Location of default database for the warehouse</description>
</property>
<!-- Hive临时目录配置 -->
<property>
<name>hive.exec.scratchdir</name>
<value>/user/hive/tmp</value>
</property>
</configuration>
EOF
# hive-env.sh starts as a copy of the shipped template; the Hadoop and Hive
# configuration paths are then appended to it.
cp hive-env.sh.template hive-env.sh
echo 'export HADOOP_HOME=/soft/hadoop-3.4.1/ ' >> ./hive-env.sh
echo 'export HIVE_CONF_DIR=/soft/hive-4.0.1/conf/' >> ./hive-env.sh
4. 安装 MySQL JDBC 驱动
# List the MySQL-related packages the configured repositories offer.
# Listing needs no root; stderr is dropped to hide apt's
# "unstable CLI interface" warning when its output is piped.
apt list 2>/dev/null | grep mysql
sudo apt install mysql-connector-j
# Copy whichever connector version apt installed. A hard-coded version in the
# file name breaks as soon as the repository ships a newer release.
cp /usr/share/java/mysql-connector-j-*.jar "$HIVE_HOME/lib/"
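5. 指定代理用户(将以下属性添加到 Hadoop 的 $HADOOP_HOME/etc/hadoop/core-site.xml 的 <configuration> 标签内;若 Hadoop 已在运行,修改后需重启使其生效)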
<!-- Proxy-user (impersonation) settings for the user "wgs".
     The hadoop.proxyuser.* keys are Hadoop properties, so they belong in
     Hadoop's core-site.xml inside <configuration>, not in hive-site.xml. -->
<property>
<name>hadoop.proxyuser.wgs.hosts</name>
<value>*</value> <!-- host(s) where HiveServer2 runs; * means all hosts -->
</property>
<property>
<name>hadoop.proxyuser.wgs.groups</name>
<value>*</value> <!-- user groups that may be proxied; * means all groups -->
</property>
<property>
<name>hadoop.proxyuser.wgs.users</name>
<value>*</value> <!-- specific users that may be proxied; * means all (including wgs) -->
</property>
三、Hadoop 服务启动
# Start HDFS first, then YARN.
start-dfs.sh
start-yarn.sh
# Create the HDFS directories named in hive-site.xml: the warehouse
# directory and the scratch directory.
for hdfs_dir in /user/hive/warehouse /user/hive/tmp; do
  hdfs dfs -mkdir -p "$hdfs_dir"
done
四、初始化与启动
# Create the metastore schema in the MySQL database configured in
# hive-site.xml. Run this once, before the first start.
schematool -dbType mysql -initSchema
# hiveserver2 does not return while the server is running, so start it in
# the background (nohup keeps it alive after the terminal closes) and send
# its output to a log file. Otherwise the beeline command below could never
# be entered in the same terminal.
nohup hiveserver2 > ~/hiveserver2.log 2>&1 &
# HiveServer2 needs some time before it accepts connections on port 10000.
# If beeline reports "connection refused", wait a little and retry.
beeline -u 'jdbc:hive2://hadoop:10000' -n wgs
五、测试验证(在 beeline 提示符下执行以下 SQL)
-- Smoke test, run at the beeline prompt.
-- List the databases visible through this connection.
SHOW DATABASES;
-- Create a one-column table, insert a single row and read it back.
-- The SELECT should return the row with id = 1.
CREATE TABLE test(id INT);
INSERT INTO test VALUES(1);
SELECT * FROM test;