feat: 添加聚类算法和 Q 学习算法

- 新增 clustering_algorithms.py 文件，实现 K 均值和 K 中心点聚类算法 - 新增 route.py 文件，实现基于 Q学习的路径规划算法 - 添加分析聚类结果和可视化功能 - 实现并行 Q学习训练，提高训练效率
2025-03-30 02:52:03 +08:00 · 2025-03-30 02:52:03 +08:00 · 161b7a0eea
commit 161b7a0eea
4 changed files with 174 additions and 0 deletions
--- a/clustering_algorithms.py
+++ b/clustering_algorithms.py
@ -0,0 +1,77 @@
 # 导入必要的库
 import numpy as np
 from sklearn.datasets import load_iris
 from sklearn.cluster import KMeans
 from sklearn_extra.cluster import KMedoids
 from sklearn.metrics import silhouette_score
 import matplotlib.pyplot as plt
 import matplotlib
 import os
 import psutil
 # 设置环境变量以消除Joblib警告
 os.environ['LOKY_MAX_CPU_COUNT'] = str(psutil.cpu_count(logical=False))
 # 设置Matplotlib支持中文的字体
 matplotlib.rcParams['font.sans-serif'] = ['SimHei']  # 使用黑体
 matplotlib.rcParams['axes.unicode_minus'] = False  # 解决负号显示问题
 # 加载Iris数据集
 iris = load_iris()
 X = iris.data  # 特征数据
 y = iris.target  # 目标标签
 # K均值聚类算法
 def kmeans_clustering(X, n_clusters=3):
    """
    使用K均值算法对数据进行聚类
    :param X: 输入数据
    :param n_clusters: 聚类数量
    :return: 聚类标签
    """
    kmeans = KMeans(n_clusters=n_clusters, random_state=42)  # 初始化KMeans对象
    kmeans.fit(X)  # 拟合数据
    labels = kmeans.labels_  # 获取聚类标签
    return labels
 # K中心点聚类算法
 def kmedoids_clustering(X, n_clusters=3):
    """
    使用K中心点算法对数据进行聚类
    :param X: 输入数据
    :param n_clusters: 聚类数量
    :return: 聚类标签
    """
    kmedoids = KMedoids(n_clusters=n_clusters, random_state=42)  # 初始化KMedoids对象
    kmedoids.fit(X)  # 拟合数据
    labels = kmedoids.labels_  # 获取聚类标签
    return labels
 # 分析聚类结果
 def analyze_clustering(X, labels, algorithm_name):
    """
    分析聚类结果并可视化
    :param X: 输入数据
    :param labels: 聚类标签
    :param algorithm_name: 算法名称
    """
    silhouette_avg = silhouette_score(X, labels)  # 计算轮廓系数
    print(f"{algorithm_name} 轮廓系数: {silhouette_avg}")
    # 可视化聚类结果
    plt.scatter(X[:, 0], X[:, 1], c=labels, cmap='viridis')
    plt.title(f"{algorithm_name} 聚类结果")
    plt.show()
 # 主函数
 def main():
    # 使用K均值算法进行聚类
    kmeans_labels = kmeans_clustering(X)
    analyze_clustering(X, kmeans_labels, "K均值")
    # 使用K中心点算法进行聚类
    kmedoids_labels = kmedoids_clustering(X)
    analyze_clustering(X, kmedoids_labels, "K中心点")
 if __name__ == "__main__":
    main()
--- a/myplot-1.png
+++ b/myplot-1.png
--- a/myplot-2.png
+++ b/myplot-2.png
--- a/route.py
+++ b/route.py
@ -0,0 +1,97 @@
 import numpy as np  # Import NumPy for numerical operations
 import random  # Import random module for exploration
 import multiprocessing as mp  # Import multiprocessing for parallel computing
 #import cupy as cp
 try:
    import cupy as cp  # Import CuPy for GPU acceleration
    GPU_AVAILABLE = True  # Set flag if CuPy is available
 except ImportError:
    GPU_AVAILABLE = False  # Set flag if CuPy is not available
 # Define the environment
 grid_size = (4, 4)  # Grid size (4x4)
 start = (0, 0)  # Start position
 end = (3, 3)  # End position
 obstacles = {(1, 0), (2, 1), (1, 2), (0, 3), (3, 2)}  # Set of obstacles
 # Define possible actions and their effects on position
 actions = {'up': (-1, 0), 'down': (1, 0), 'left': (0, -1), 'right': (0, 1)}
 def is_valid(state):
    """Check if a state is within the grid and not an obstacle."""
    return (0 <= state[0] < grid_size[0]) and (0 <= state[1] < grid_size[1]) and (state not in obstacles)
 def get_next_state(state, action):
    """Get the next state based on the current state and action."""
    new_state = (state[0] + actions[action][0], state[1] + actions[action][1])
    return new_state if is_valid(new_state) else state
 # Q-Learning parameters
 alpha = 0.5  # Learning rate
 gamma = 0.9  # Discount factor
 epsilon = 0.1  # Increased exploration rate for better exploration
 episodes = 5000  # Increased total training episodes for better learning
 np.random.seed(42)  # Set random seed for reproducibility
 random.seed(42)
 # Initialize the Q-table with all states and actions
 grid_states = [(i, j) for i in range(grid_size[0]) for j in range(grid_size[1]) if (i, j) not in obstacles]
 Q = {state: {action: 0 for action in actions} for state in grid_states}
 # GPU acceleration setup (if available)
 if GPU_AVAILABLE:
    Q = {state: {action: 0.0 for action in actions} for state in grid_states}   # Initialize Q-table on GPU
    actions_list = list(actions.keys())  # Store actions as a list
 def train_q_learning(_):
    """Function to train Q-learning in parallel using multiple processes."""
    local_Q = {state: Q[state].copy() for state in grid_states}  # Create a local copy of Q-table
    for _ in range(episodes // mp.cpu_count()):  # Each process handles a fraction of episodes
        state = start  # Start at the initial position
        while state != end:  # Run until reaching the goal
            # Choose an action using ε-greedy policy
            action = max(local_Q[state], key=local_Q[state].get) if random.uniform(0, 1) > epsilon else random.choice(
                list(actions))
            next_state = get_next_state(state, action)  # Get the next state
            reward = 1 if next_state == end else -0.1  # Define rewards
            # Update Q-value using the Bellman equation
            local_Q[state][action] += alpha * (
                        reward + gamma * max(local_Q[next_state].values()) - local_Q[state][action])
            state = next_state  # Move to next state
    return local_Q  # Return the updated local Q-table
 # Parallel Q-learning training
 if __name__ == "__main__":
    num_processes = max(1, mp.cpu_count() // 2)  # Use half the available CPU cores
    with mp.Pool(num_processes) as pool:  # Create a process pool with reduced number of CPU cores
        results = pool.map(train_q_learning, range(num_processes))  # Distribute training across multiple processes
    # Merge Q-tables from all processes
    for state in grid_states:
        for action in actions:
            Q[state][action] = sum(r[state][action] for r in results) / len(results)  # Average Q-values
 # Compute the optimal path from start to end
 def get_best_path():
    """Find the best path using the learned Q-values."""
    state = start  # Start at the initial position
    path = [state]  # Initialize path
    visited = set()  # Track visited states to avoid loops
    while state != end:
        if state in visited:
            break  # Avoid infinite loops
        visited.add(state)  # Mark state as visited
        action = max(Q[state], key=Q[state].get)  # Choose the best action based on Q-values
        state = get_next_state(state, action)  # Move to the next state
        path.append(state)  # Append to path
    return path  # Return the computed path
 print(get_best_path())  # Print the optimal path