Control-Algorithm/demo_lqr_pendulum.py at master · zhaohaojie1998/Control-Algorithm · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
"""LQR倒立摆控制"""
import time
import numpy as np
import gymnasium as gym
from controller import LQR, LTISystem
from controller.utils import matplotlib_context, setup_seed, tic, toc

def lqr_pendulum_control():
    # 仿真参数
    dt = 0.05  # 与gym环境的dt保持一致, 必须0.05
    total_time = 50.0
    time_steps = int(total_time / dt)

    # 倒立摆系统参数（与gym环境一致）
    m = 1.0  # 摆杆质量
    l = 1.0  # 摆杆长度
    g = 10  # 重力加速度

    # 系统矩阵（线性化模型，平衡点在竖直向上位置）
    # 状态向量：[theta, theta_dot]^T，其中theta是摆杆与竖直方向的夹角
    # 控制量：u是施加在摆杆上的力矩
    # 线性化动力学方程：theta'' = (3*g/(2*l))*theta + (3/(m*l**2))*u
    A = [[0, 1],
         [3*g/(2*l), 0]]
    B = [[0],
         [3/(m*l**2)]]

    sys = LTISystem(A, B)
    print("能控性:", sys.is_controllable())
    print("能观性:", sys.is_observable())
    print("可镇定性:", sys.is_stabilizable())
    print("可检测性:", sys.is_detectable())
    print("开环稳定:", sys.is_stable())
    print("Laypunov开环稳定:", sys.is_lyapunov_stable(np.eye(2)))

    # 权重矩阵
    Q = np.diag([1000, 100]) # 角度误差处罚, 角速度误差处罚
    R = 0.01 # 控制惩罚

    # 初始化LQR控制器
    lqr_controller = LQR(sys, Q, R, dt)
    print("LQR倒立摆控制器参数:")
    print(lqr_controller)
    print("LQR闭环稳定:", lqr_controller.stable)

    # 仿真
    time.sleep(5)
    print("\n====================仿真开始====================")
    env = gym.make("Pendulum-v1", g=g, max_episode_steps=time_steps, render_mode="human")
    # 初始状态需要接近线性化平衡点的位置，否则LQR控制器无法收敛
    obs, info = env.reset(options={"x_init": 0.1, "y_init": 0.01}) # 平衡状态为 0

    tic()
    for _ in range(time_steps):
        tic()
        x = np.array(env.unwrapped.state) # 状态向量：[theta, theta_dot]
        u = lqr_controller(x)
        toc("LQR控制律求解")

        obs, reward, terminated, truncated, info = env.step(u)
        if terminated or truncated:
            break
    toc("仿真")

    # 获取最终状态
    θf, dθf = env.unwrapped.state
    env.close()

    # 输出
    lqr_controller.show(name='Pendulum-v1')
    print('倒立摆控制最终状态:')
    print(f'  摆杆角度: {θf:.4f}')
    print(f'  摆杆角速度: {dθf:.4f}')
    print('LQR性能指标J:')
    print(f'  J = {lqr_controller.J:.4f}')

    # 计算控制精度
    angle_error = np.abs(θf)
    angular_velocity_error = np.abs(dθf)
    print('控制精度:')
    print(f'  角度误差: {angle_error:.4f}')
    print(f'  角速度误差: {angular_velocity_error:.4f}')


if __name__ == '__main__':
    setup_seed(114514)
    with matplotlib_context():
        lqr_pendulum_control()