23-05-21

pso 기본 알고리즘을 이용한 tensorflow model의 pso 알고리즘화 - xor 문제, mnist 분류 성공
2025-12-20 04:50:45 +09:00 · 2023-05-21 14:00:03 +09:00
commit 7c5f3a53a3
6 changed files with 1251 additions and 0 deletions
--- a/pso_tf.py
+++ b/pso_tf.py
@@ -0,0 +1,261 @@
+import numpy as np
+import tensorflow as tf
+from tensorflow import keras
+from tqdm import tqdm
+
+
+class PSO(object):
+    """
+    Class implementing PSO algorithm
+    """
+
+    def __init__(self, model, loss_method=keras.losses.MeanSquaredError(), optimizer=keras.optimizers.SGD(), n_particles=5):
+        """
+        Initialize the key variables.
+
+        Args:
+            model : 학습할 모델 객체 (Sequential)
+            loss_method : 손실 함수
+            optimizer : 최적화 함수
+            n_particles(int) : 파티클의 개수
+        """
+        self.model = model                      # 모델
+        self.n_particles = n_particles          # 파티클의 개수
+        self.loss_method = loss_method          # 손실 함수
+        self.optimizer = optimizer              # 최적화 함수
+        self.model_structure = self.model.to_json()  # 모델의 구조
+        self.init_weights = self.model.get_weights()          # 검색할 차원
+        self.particle_depth = len(self.model.get_weights())    # 검색할 차원의 깊이
+        self.particles_weights = [None] * n_particles                 # 파티클의 위치
+        for _ in tqdm(range(self.n_particles), desc="init particles position"):
+            # particle_node = []
+            m = keras.models.model_from_json(self.model_structure)
+            m.compile(loss=self.loss_method, optimizer=self.optimizer)
+
+            self.particles_weights[_] = m.get_weights()
+
+            # self.particles_weights.append(particle_node)
+
+        # print(f"particles_weights > {self.particles_weights}")
+        # self.particles_weights = np.random.uniform(size=(n_particles, self.particle_depth)) \
+            # * self.init_pos
+        # 입력받은 파티클의 개수 * 검색할 차원의 크기 만큼의 균등한 위치를 생성
+        # self.velocities = [None] * self.n_particles
+        self.velocities = [
+            [0 for i in range(self.particle_depth)] for n in range(n_particles)]
+        for i in tqdm(range(n_particles), desc="init velocities"):
+            # print(i)
+            for index, layer in enumerate(self.init_weights):
+                # print(f"index > {index}")
+                # print(f"layer > {layer.shape}")
+                self.velocities[i][index] = np.random.rand(
+                    *layer.shape) / 5 - 0.10
+                # if layer.ndim == 1:
+                #     self.velocities[i][index] = np.random.uniform(
+                #         size=(layer.shape[0],))
+                # elif layer.ndim == 2:
+                #     self.velocities[i][index] = np.random.uniform(
+                #         size=(layer.shape[0], layer.shape[1]))
+                # elif layer.ndim == 3:
+                #     self.velocities[i][index] = np.random.uniform(
+                #         size=(layer.shape[0], layer.shape[1], layer.shape[2]))
+        # print(f"type > {type(self.velocities)}")
+        # print(f"velocities > {self.velocities}")
+
+        # print(f"velocities > {self.velocities}")
+        # for i, layer in enumerate(self.init_weights):
+        #     self.velocities[i] = np.random.rand(*layer.shape) / 5 - 0.10
+
+        # self.velocities = np.random.uniform(
+        #     size=(n_particles, self.particle_depth))
+        # 입력받은 파티클의 개수 * 검색할 차원의 크기 만큼의 속도를 무작위로 초기화
+        # 최대 사이즈로 전역 최적갑 저장 - global best
+        self.g_best = self.model.get_weights()      # 전역 최적값(최적의 가중치)
+        self.p_best = self.particles_weights            # 각 파티클의 최적값(최적의 가중치)
+        self.p_best_score = [np.inf for i in range(
+            n_particles)]  # 각 파티클의 최적값의 점수
+        self.g_best_score = np.inf                  # 전역 최적값의 점수(초기화 - 무한대)
+        self.g_history = []
+        self.history = []
+
+    def _update_weights(self, weights, v):
+        """
+        Update particle position
+
+        Args:
+            weights (array-like) : 파티클의 현재 가중치
+            v (array-like) : 가중치의 속도
+
+        Returns:
+            (array-like) : 파티클의 새로운 가중치(위치)
+        """
+        # w = np.array(w)  # 각 파티클의 위치
+        # v = np.array(v)  # 각 파티클의 속도(방향과 속력을 가짐)
+        # print(f"len(w) > {len(w)}")
+        # print(f"len(v) > {len(v)}")
+        new_weights = [0 for i in range(len(weights))]
+        for i in range(len(weights)):
+            # print(f"shape > w : {np.shape(w[i])}, v : {np.shape(v[i])}")
+            new_weights[i] = tf.add(weights[i], v[i])
+        # new_w = tf.add(w, v)   # 각 파티클을 랜덤한 속도만큼 진행
+        return new_weights    # 진행한 파티클들의 위치를 반환
+
+    def _update_velocity(self, weights, v, p_best, c0=0.5, c1=1.5, w=0.75):
+        """
+            Update particle velocity
+
+            Args:
+                weights (array-like) : 파티클의 현재 가중치
+                v (array-like) : 속도
+                p_best(array-like) : 각 파티클의 최적의 위치 (최적의 가중치)
+                c0 (float) : 인지 스케일링 상수 (가중치의 중요도 - 지역) - 지역 관성
+                c1 (float) : 사회 스케일링 상수 (가중치의 중요도 - 전역) - 전역 관성
+                w (float) : 관성 상수 (현재 속도의 중요도)
+
+            Returns:
+                (array-like) : 각 파티클의 새로운 속도
+        """
+        # x = np.array(x)
+        # v = np.array(v)
+        # assert np.shape(weights) == np.shape(v), "Position and velocity must have same shape."
+        # 두 데이터의 shape 이 같지 않으면 오류 출력
+        # 0에서 1사이의 숫자를 랜덤 생성
+        r0 = np.random.rand()
+        r1 = np.random.rand()
+        # print(f"type > weights : {type(weights)}")
+        # print(f"type > v : {type(v)}")
+        # print(
+        # f"shape > weights : {np.shape(weights[0])}, v : {np.shape(v[0])}")
+        # print(f"len > weights : {len(weights)}, v : {len(v)}")
+        # p_best = np.array(p_best)
+        # g_best = np.array(g_best)
+
+        # 가중치(상수)*속도 + \
+        # 스케일링 상수*랜덤 가중치*(나의 최적값 - 처음 위치) + \
+        # 전역 스케일링 상수*랜덤 가중치*(전체 최적값 - 처음 위치)
+        # for i, layer in enumerate(weights):
+        new_velocity = [None] * len(weights)
+        for i, layer in enumerate(weights):
+
+            new_v = w*v[i]
+            new_v = new_v + c0*r0*(p_best[i] - layer)
+            # m2 = tf.multiply(tf.multiply(c0, r0),
+            #  tf.subtract(p_best[i], layer))
+            new_v = new_v + c1*r1*(self.g_best[i] - layer)
+            # m3 = tf.multiply(tf.multiply(c1, r1),
+            #  tf.subtract(g_best[i], layer))
+            new_velocity[i] = new_v
+            # new_v[i] = tf.add(m1, tf.add(m2, m3))
+            # new_v[i] = tf.add_n([m1, m2, m3])
+            # new_v[i] = tf.add_n(
+            # tf.multiply(w, v[i]),
+            # tf.multiply(tf.multiply(c0, r0),
+            # tf.subtract(p_best[i], layer)),
+            # tf.multiply(tf.multiply(c1, r1),
+            # tf.subtract(g_best[i], layer)))
+        # new_v = w*v + c0*r0*(p_best - weights) + c1*r1*(g_best - weights)
+        return new_velocity
+
+    def _get_score(self, x, y):
+        """
+        Compute the score of the current position of the particles.
+
+        Args:
+            x (array-like): The current position of the particles
+            y (array-like): The current position of the particles
+        Returns:
+            (array-like) : 추론에 대한 점수
+        """
+        #  = self.model
+        # model.set_weights(weights)
+        score = self.model.evaluate(x, y, verbose=0)
+
+        return score
+
+    def optimize(self, x_train, y_train, x_test, y_test, maxiter=20, epoch=10, verbose=0):
+        """
+        Run the PSO optimization process utill the stoping critera is met.
+        Cas for minization. The aim is to minimize the cost function
+
+        Args:
+            maxiter (int): the maximum number of iterations before stopping the optimization
+            파티클의 최종 위치를 위한 반복 횟수
+        Returns:
+            The best solution found (array-like)
+        """
+        for _ in range(maxiter):
+            loss = 0
+            acc = 0
+            for i in tqdm(range(self.n_particles), desc=f"Iteration {_} / {maxiter}", ascii=True):
+                weights = self.particles_weights[i]  # 각 파티클 추출
+                v = self.velocities[i]    # 각 파티클의 다음 속도 추출
+                p_best = self.p_best[i]   # 결과치 저장할 변수 지정
+                self.velocities[i] = self._update_velocity(
+                    weights, v, p_best)
+                # 다음에 움직일 속도 = 최초 위치, 현재 속도, 현재 위치, 최종 위치
+                self.particles_weights[i] = self._update_weights(weights, v)
+                # 현재 위치 = 최초 위치 현재 속도
+                # Update the besst position for particle i
+                # 내 현재 위치가 내 위치의 최소치보다 작으면 갱신
+
+                self.model.set_weights(self.particles_weights[i])
+                self.model.fit(x_train, y_train, epochs=epoch,
+                               verbose=0, validation_data=(x_test, y_test))
+                self.particles_weights[i] = self.model.get_weights()
+
+                score = self._get_score(x_test, y_test)
+
+                # print(f"score : {score}")
+                # print(f"loss : {loss}")
+                # print(f"p_best_score : {self.p_best_score[i]}")
+
+                if score[0] < self.p_best_score[i]:
+                    self.p_best_score[i] = score[0]
+                    self.p_best[i] = self.particles_weights[i]
+                    if score[0] < self.g_best_score:
+                        self.g_best_score = score[0]
+                        self.g_best = self.particles_weights[i].copy()
+                        self.g_history.append(self.g_best.copy())
+
+                self.score = score[0]
+                loss = score[0]
+                acc = score[1]
+                # if self.func(self.particles_weights[i]) < self.func(p_best):
+                # self.p_best[i] = self.particles_weights[i]
+                # if self.
+                # Update the best position overall
+                # 내 현재 위치가 전체 위치 최소치보다 작으면 갱신
+                # if self.func(self.particles_weights[i]) < self.func(self.g_best):
+                # self.g_best = self.particles_weights[i]
+                # self.g_history.append(self.g_best)
+                # print(f"{i} particle score : {score[0]}")
+            print(f"loss : {loss} | acc : {acc}")
+
+            # self.history.append(self.particles_weights.copy())
+
+        # 전체 최소 위치, 전체 최소 벡터
+        return self.g_best, self._get_score(x_test, y_test)
+
+    """
+    Returns:
+        현재 전체 위치
+    """
+
+    def position(self):
+        return self.particles_weights.copy()
+
+    """
+    Returns:
+        전체 위치 벡터 history
+    """
+
+    def position_history(self):
+        return self.history.copy()
+
+    """
+    Returns:
+        global best 의 갱신된 값의 변화를 반환
+    """
+
+    def global_history(self):
+        return self.g_history.copy()