PSO/pso_tf.py

import numpy as np
import tensorflow as tf
from tensorflow import keras
from tqdm import tqdm


class PSO(object):
    """
    Class implementing PSO algorithm
    """

    def __init__(self, model: keras.models, loss_method=keras.losses.MeanSquaredError(), n_particles=5):
        """
        Initialize the key variables.

        Args:
            model : 학습할 모델 객체 (Sequential)
            loss_method : 손실 함수
            optimizer : 최적화 함수
            n_particles(int) : 파티클의 개수
        """
        self.model = model                      # 모델
        self.n_particles = n_particles          # 파티클의 개수
        self.loss_method = loss_method          # 손실 함수
        self.model_structure = self.model.to_json()  # 모델의 구조
        self.init_weights = self.model.get_weights()          # 검색할 차원
        self.particle_depth = len(self.model.get_weights())    # 검색할 차원의 깊이
        self.particles_weights = [None] * n_particles                 # 파티클의 위치
        for _ in tqdm(range(self.n_particles), desc="init particles position"):
            # particle_node = []
            m = keras.models.model_from_json(self.model_structure)
            m.compile(loss=self.loss_method,
                      optimizer="adam", metrics=["accuracy"])
            self.particles_weights[_] = m.get_weights()
            # print(f"shape > {self.particles_weights[_][0]}")

            # self.particles_weights.append(particle_node)

        # print(f"particles_weights > {self.particles_weights}")
        # self.particles_weights = np.random.uniform(size=(n_particles, self.particle_depth)) \
            # * self.init_pos
        # 입력받은 파티클의 개수 * 검색할 차원의 크기 만큼의 균등한 위치를 생성
        # self.velocities = [None] * self.n_particles
        self.velocities = [
            [0 for i in range(self.particle_depth)] for n in range(n_particles)]
        for i in tqdm(range(n_particles), desc="init velocities"):
            # print(i)
            for index, layer in enumerate(self.init_weights):
                # print(f"index > {index}")
                # print(f"layer > {layer.shape}")
                self.velocities[i][index] = np.random.rand(
                    *layer.shape) / 5 - 0.10
                # if layer.ndim == 1:
                #     self.velocities[i][index] = np.random.uniform(
                #         size=(layer.shape[0],))
                # elif layer.ndim == 2:
                #     self.velocities[i][index] = np.random.uniform(
                #         size=(layer.shape[0], layer.shape[1]))
                # elif layer.ndim == 3:
                #     self.velocities[i][index] = np.random.uniform(
                #         size=(layer.shape[0], layer.shape[1], layer.shape[2]))
        # print(f"type > {type(self.velocities)}")
        # print(f"velocities > {self.velocities}")

        # print(f"velocities > {self.velocities}")
        # for i, layer in enumerate(self.init_weights):
        #     self.velocities[i] = np.random.rand(*layer.shape) / 5 - 0.10

        # self.velocities = np.random.uniform(
        #     size=(n_particles, self.particle_depth))
        # 입력받은 파티클의 개수 * 검색할 차원의 크기 만큼의 속도를 무작위로 초기화
        # 최대 사이즈로 전역 최적갑 저장 - global best
        self.g_best = self.model.get_weights()      # 전역 최적값(최적의 가중치)
        self.p_best = self.particles_weights            # 각 파티클의 최적값(최적의 가중치)
        self.p_best_score = [0 for i in range(
            n_particles)]  # 각 파티클의 최적값의 점수
        self.g_best_score = 0                  # 전역 최적값의 점수(초기화 - 무한대)
        self.g_history = []
        self.loss_history = [[] for i in range(n_particles)]
        self.acc_history = [[] for i in range(n_particles)]
        self.g_best_score_history = []
        self.history = []

    def _update_weights(self, weights, v):
        """
        Update particle position

        Args:
            weights (array-like) : 파티클의 현재 가중치
            v (array-like) : 가중치의 속도

        Returns:
            (array-like) : 파티클의 새로운 가중치(위치)
        """
        # w = np.array(w)  # 각 파티클의 위치
        # v = np.array(v)  # 각 파티클의 속도(방향과 속력을 가짐)
        # print(f"len(w) > {len(w)}")
        # print(f"len(v) > {len(v)}")
        new_weights = [0 for i in range(len(weights))]
        for i in range(len(weights)):
            # print(f"shape > w : {np.shape(w[i])}, v : {np.shape(v[i])}")
            new_weights[i] = tf.add(weights[i], v[i])
        # new_w = tf.add(w, v)   # 각 파티클을 랜덤한 속도만큼 진행
        return new_weights    # 진행한 파티클들의 위치를 반환

    def _update_velocity(self, weights, v, p_best, c0=0.5, c1=1.5, w=0.75):
        """
            Update particle velocity

            Args:
                weights (array-like) : 파티클의 현재 가중치
                v (array-like) : 속도
                p_best(array-like) : 각 파티클의 최적의 위치 (최적의 가중치)
                c0 (float) : 인지 스케일링 상수 (가중치의 중요도 - 지역) - 지역 관성
                c1 (float) : 사회 스케일링 상수 (가중치의 중요도 - 전역) - 전역 관성
                w (float) : 관성 상수 (현재 속도의 중요도)

            Returns:
                (array-like) : 각 파티클의 새로운 속도
        """
        # x = np.array(x)
        # v = np.array(v)
        # assert np.shape(weights) == np.shape(v), "Position and velocity must have same shape."
        # 두 데이터의 shape 이 같지 않으면 오류 출력
        # 0에서 1사이의 숫자를 랜덤 생성
        r0 = np.random.rand()
        r1 = np.random.rand()
        # print(f"type > weights : {type(weights)}")
        # print(f"type > v : {type(v)}")
        # print(
        # f"shape > weights : {np.shape(weights[0])}, v : {np.shape(v[0])}")
        # print(f"len > weights : {len(weights)}, v : {len(v)}")
        # p_best = np.array(p_best)
        # g_best = np.array(g_best)

        # 가중치(상수)*속도 + \
        # 스케일링 상수*랜덤 가중치*(나의 최적값 - 처음 위치) + \
        # 전역 스케일링 상수*랜덤 가중치*(전체 최적값 - 처음 위치)
        # for i, layer in enumerate(weights):
        new_velocity = [None] * len(weights)
        for i, layer in enumerate(weights):

            new_v = w*v[i]
            new_v = new_v + c0*r0*(p_best[i] - layer)
            new_v = new_v + c1*r1*(self.g_best[i] - layer)
            new_velocity[i] = new_v

            # m2 = tf.multiply(tf.multiply(c0, r0),
            #  tf.subtract(p_best[i], layer))
            # m3 = tf.multiply(tf.multiply(c1, r1),
            #  tf.subtract(g_best[i], layer))
            # new_v[i] = tf.add(m1, tf.add(m2, m3))
            # new_v[i] = tf.add_n([m1, m2, m3])
            # new_v[i] = tf.add_n(
            # tf.multiply(w, v[i]),
            # tf.multiply(tf.multiply(c0, r0),
            # tf.subtract(p_best[i], layer)),
            # tf.multiply(tf.multiply(c1, r1),
            # tf.subtract(g_best[i], layer)))
        # new_v = w*v + c0*r0*(p_best - weights) + c1*r1*(g_best - weights)
        return new_velocity

    def _get_score(self, x, y):
        """
        Compute the score of the current position of the particles.

        Args:
            x (array-like): The current position of the particles
            y (array-like): The current position of the particles
        Returns:
            (array-like) : 추론에 대한 점수
        """
        #  = self.model
        # model.set_weights(weights)
        score = self.model.evaluate(x, y, verbose=0)

        return score

    def optimize(self, x_train, y_train, x_test, y_test, maxiter=10, c0=0.5, c1=1.5, w=0.75):
        """
        Run the PSO optimization process utill the stoping critera is met.
        Cas for minization. The aim is to minimize the cost function

        Args:
            maxiter (int): the maximum number of iterations before stopping the optimization
            파티클의 최종 위치를 위한 반복 횟수
        Returns:
            The best solution found (array-like)
        """
        for _ in range(maxiter):
            loss = 0
            acc = 0
            for i in tqdm(range(self.n_particles), desc=f"Iter {_}/{maxiter}", ascii=True):
                weights = self.particles_weights[i]  # 각 파티클 추출
                v = self.velocities[i]    # 각 파티클의 다음 속도 추출
                p_best = self.p_best[i]   # 결과치 저장할 변수 지정
                # 2. 속도 계산
                self.velocities[i] = self._update_velocity(
                    weights, v, p_best, c0, c1, w)
                # 다음에 움직일 속도 = 최초 위치, 현재 속도, 현재 위치, 최종 위치
                # 3. 위치 업데이트
                self.particles_weights[i] = self._update_weights(weights, v)
                # 현재 위치 = 최초 위치 현재 속도
                # Update the besst position for particle i
                # 내 현재 위치가 내 위치의 최소치보다 작으면 갱신
                self.model.set_weights(self.particles_weights[i].copy())
                # self.model.fit(x_train, y_train, epochs=epochs, batch_size=batch_size,
                #    verbose=0, validation_data=(x_test, y_test))
                # self.particles_weights[i] = self.model.get_weights()
                # 4. 평가
                self.model.compile(loss=self.loss_method,
                                   optimizer='adam', metrics=['accuracy'])
                score = self._get_score(x_test, y_test)
                # print(score)

                # print(f"score : {score}")
                # print(f"loss : {loss}")
                # print(f"p_best_score : {self.p_best_score[i]}")

                if score[1] > self.p_best_score[i]:
                    self.p_best_score[i] = score[1]
                    self.p_best[i] = self.particles_weights[i].copy()
                    if score[1] > self.g_best_score:
                        self.g_best_score = score[1]
                        self.g_best = self.particles_weights[i].copy()
                        self.g_history.append(self.g_best.copy())
                        self.g_best_score_history.append(
                            self.g_best_score)

                self.score = score
                self.loss_history[i].append(score[0])
                self.acc_history[i].append(score[1])
                # if self.func(self.particles_weights[i]) < self.func(p_best):
                # self.p_best[i] = self.particles_weights[i]
                # if self.
                # Update the best position overall
                # 내 현재 위치가 전체 위치 최소치보다 작으면 갱신
                # if self.func(self.particles_weights[i]) < self.func(self.g_best):
                # self.g_best = self.particles_weights[i]
                # self.g_history.append(self.g_best)
                # print(f"{i} particle score : {score[0]}")
            print(
                f"loss avg : {self.score[0]/self.n_particles} | acc avg : {self.score[1]/self.n_particles} | best score : {self.g_best_score}")

            # self.history.append(self.particles_weights.copy())

        # 전체 최소 위치, 전체 최소 벡터
        return self.g_best, self._get_score(x_test, y_test)

    """
    Returns:
        현재 전체 위치
    """

    def position(self):
        return self.particles_weights.copy()

    """
    Returns:
        전체 위치 벡터 history
    """

    def position_history(self):
        return self.history.copy()

    """
    Returns:
        global best 의 갱신된 값의 변화를 반환
    """

    def global_history(self):
        return self.g_history.copy()

    """
    Returns:
        global best score 의 갱신된 값의 변화를 반환
    """

    def global_score_history(self):
        return self.g_best_score_history.copy()

    def all_history(self):
        return self.loss_history, self.acc_history.copy()