seongahjo

Add code

.gitignore

# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
*$py.class
.idea

# C extensions
*.so

# Distribution / packaging
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST

# PyInstaller
# Usually these files are written by a python script from a template
# before PyInstaller builds the exe, so as to inject date/other infos into it.
*.manifest
*.spec

# Installer logs
pip-log.txt
pip-delete-this-directory.txt

# Unit test / coverage reports
htmlcov/
.tox/
.coverage
.coverage.*
.cache
nosetests.xml
coverage.xml
*.cover
.hypothesis/
.pytest_cache/

# Translations
*.mo
*.pot

# Django stuff:
*.log
local_settings.py
db.sqlite3

# Flask stuff:
instance/
.webassets-cache

# Scrapy stuff:
.scrapy

# Sphinx documentation
docs/_build/

# PyBuilder
target/

# Jupyter Notebook
.ipynb_checkpoints

# pyenv
.python-version

# celery beat schedule file
celerybeat-schedule

# SageMath parsed files
*.sage.py

# Environments
.env
.venv
env/
venv/
ENV/
env.bak/
venv.bak/

# Spyder project settings
.spyderproject
.spyproject

# Rope project settings
.ropeproject

# mkdocs documentation
/site

# mypy
.mypy_cache/
DNN/loss.py

import tensorflow as tf


def softmax_cross_entropy_with_logits(y_true, y_pred):
    """Cross-entropy over the policy head, ignoring illegal actions.

    Wherever the target policy y_true is exactly zero (an illegal action),
    the corresponding logit is replaced with -100 so that it contributes
    effectively nothing to the softmax.
    """
    p = y_pred
    pi = y_true

    zero = tf.zeros(shape=tf.shape(pi), dtype=tf.float32)
    where = tf.equal(pi, zero)

    negatives = tf.fill(tf.shape(pi), -100.0)
    p = tf.where(where, negatives, p)

    loss = tf.nn.softmax_cross_entropy_with_logits(labels=pi, logits=p)

    return loss
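For intuition, a minimal sketch of what the masking does (this assumes a TF 2.x eager session and running from the repository root; the code above was written against the TF 1.x-era API, where the same call would run inside a session):

```python
import tensorflow as tf
from DNN.loss import softmax_cross_entropy_with_logits

pi = tf.constant([[0.0, 0.7, 0.3]])  # target policy; action 0 is illegal (probability 0)
p = tf.constant([[5.0, 1.0, 2.0]])   # raw logits from the network

# Inside the loss, the illegal action's logit is replaced by -100 before the
# softmax, so the large spurious logit 5.0 barely affects the result.
loss = softmax_cross_entropy_with_logits(pi, p)
print(float(loss[0]))
```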
DNN/model.py

import config
import numpy as np

from keras.models import load_model, Model
from keras.layers import Input, Dense, Conv1D, Flatten, BatchNormalization, LeakyReLU, add
from keras.optimizers import SGD
from keras import regularizers

from DNN.loss import softmax_cross_entropy_with_logits


class GeneralModel(object):
    def __init__(self, reg_const, learning_rate, input_dim, output_dim):
        self.reg_const = reg_const
        self.learning_rate = learning_rate
        self.input_dim = input_dim
        self.output_dim = output_dim

    def predict(self, x):
        return self.model.predict(x)

    def fit(self, states, targets, epochs, verbose, validation_split, batch_size):
        return self.model.fit(states, targets, epochs=epochs, verbose=verbose,
                              validation_split=validation_split, batch_size=batch_size)

    def write(self, game, version):
        self.model.save('models/version' + "{0:0>4}".format(version) + '.h5')

    def read(self, game, run_number, version):
        return load_model(
            str(run_number).zfill(4) + '/models/version' + "{0:0>4}".format(version) + '.h5',
            custom_objects={'softmax_cross_entropy_with_logits': softmax_cross_entropy_with_logits})


class ResidualCNN(GeneralModel):
    def __init__(self, reg_const, learning_rate, input_dim, output_dim, hidden_layers):
        GeneralModel.__init__(self, reg_const, learning_rate, input_dim, output_dim)
        self.hidden_layers = hidden_layers
        self.num_layers = len(hidden_layers)
        self.model = self._build_model()

    def residual_layer(self, input_block, filters, kernel_size):
        x = self.conv_layer(input_block, filters, kernel_size)

        x = Conv1D(
            filters=filters
            , kernel_size=kernel_size
            , data_format="channels_last"
            , padding='same'
            , use_bias=False
            , activation='linear'
            , kernel_regularizer=regularizers.l2(self.reg_const)
        )(x)

        # with channels_last the features sit on the last axis
        x = BatchNormalization(axis=-1)(x)

        # skip connection
        x = add([input_block, x])

        x = LeakyReLU()(x)

        return x

    def conv_layer(self, x, filters, kernel_size):
        x = Conv1D(
            filters=filters
            , kernel_size=kernel_size
            , data_format="channels_last"
            , padding='same'
            , use_bias=False
            , activation='linear'
            , kernel_regularizer=regularizers.l2(self.reg_const)
        )(x)

        x = BatchNormalization(axis=-1)(x)
        x = LeakyReLU()(x)

        return x

    def value_head(self, x):
        x = Conv1D(
            filters=2
            , kernel_size=1
            , data_format="channels_last"
            , padding='same'
            , use_bias=False
            , activation='linear'
            , kernel_regularizer=regularizers.l2(self.reg_const)
        )(x)

        x = BatchNormalization(axis=-1)(x)
        x = LeakyReLU()(x)

        x = Flatten()(x)

        x = Dense(
            self.output_dim
            , use_bias=False
            , activation='linear'
            , kernel_regularizer=regularizers.l2(self.reg_const)
            , name='value_head'
        )(x)

        return x

    def policy_head(self, x):
        x = Conv1D(
            filters=2
            , kernel_size=1
            , data_format="channels_last"
            , padding='same'
            , use_bias=False
            , activation='linear'
            , kernel_regularizer=regularizers.l2(self.reg_const)
        )(x)

        x = BatchNormalization(axis=-1)(x)
        x = LeakyReLU()(x)

        x = Flatten()(x)

        x = Dense(
            self.output_dim
            , use_bias=False
            , activation='linear'
            , kernel_regularizer=regularizers.l2(self.reg_const)
            , name='policy_head'
        )(x)

        return x

    def _build_model(self):
        # the input is a plain (20, NUM_ACTIONS) array, not an image
        main_input = Input(shape=self.input_dim, name='main_input')

        x = self.conv_layer(main_input, self.hidden_layers[0]['filters'], self.hidden_layers[0]['kernel_size'])

        if len(self.hidden_layers) > 1:
            for h in self.hidden_layers[1:]:
                x = self.residual_layer(x, h['filters'], h['kernel_size'])

        vh = self.value_head(x)  # built but unused: only the policy head is trained
        ph = self.policy_head(x)

        model = Model(inputs=[main_input], outputs=[ph])
        model.compile(loss=softmax_cross_entropy_with_logits,
                      optimizer=SGD(lr=self.learning_rate, momentum=config.MOMENTUM),
                      loss_weights=[0.5]
                      )

        return model

    def convertToModelInput(self, state):
        # accept either a State object or its raw state_check array; Agent.replay
        # feeds the raw arrays stored in Memory back through this method
        board = state.state_check if hasattr(state, 'state_check') else state
        return np.reshape(board, self.input_dim)
LICENSE

MIT License

Copyright (c) 2019 seongahjo

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
MCTS.py

import numpy as np
import config


class Node(object):

    def __init__(self, state):
        self.state = state
        self.id = state.id
        self.edges = []

    def is_leaf(self):
        return len(self.edges) == 0


class Edge(object):

    def __init__(self, in_node, out_node, prior, action):
        self.id = in_node.state.id + '|' + out_node.state.id
        self.inNode = in_node
        self.outNode = out_node
        self.action = action

        # N: visit count, W: total value, Q: mean value (W / N),
        # P: prior probability from the policy network
        self.stats = {
            'N': 0,
            'W': 0,
            'Q': 0,
            'P': prior,
        }


class MCTS(object):

    def __init__(self, root, cpuct):
        self.root = root
        self.tree = {}
        self.cpuct = cpuct
        self.add_node(root)

    def __len__(self):
        return len(self.tree)

    def moveToLeaf(self):
        """Walk from the root to a leaf, at each node picking the edge that
        maximizes Q + U (the PUCT rule), with Dirichlet noise mixed into the
        priors at the root for exploration."""
        breadcrumbs = []
        current_node = self.root

        done = 0
        value = 0

        while not current_node.is_leaf():

            max_qu = -99999

            if current_node == self.root:
                epsilon = config.EPSILON
                nu = np.random.dirichlet([config.ALPHA] * len(current_node.edges))
            else:
                epsilon = 0
                nu = [0] * len(current_node.edges)

            # total visit count over all edges of this node
            Nb = 0
            for action, edge in current_node.edges:
                Nb = Nb + edge.stats['N']

            for idx, (action, edge) in enumerate(current_node.edges):

                # U = cpuct * ((1 - eps) * P + eps * nu) * sqrt(sum_b N_b) / (1 + N)
                U = self.cpuct * \
                    ((1 - epsilon) * edge.stats['P'] + epsilon * nu[idx]) * \
                    np.sqrt(Nb) / (1 + edge.stats['N'])

                Q = edge.stats['Q']

                if Q + U > max_qu:
                    max_qu = Q + U
                    simulation_action = action
                    simulation_edge = edge

            new_state, value, done = current_node.state.takeAction(simulation_action)
            current_node = simulation_edge.outNode
            breadcrumbs.append(simulation_edge)

        return current_node, value, done, breadcrumbs

    def back_fill(self, value, breadcrumbs):
        """Propagate the evaluated value back up the visited edges."""
        for edge in breadcrumbs:
            edge.stats['N'] = edge.stats['N'] + 1
            edge.stats['W'] = edge.stats['W'] + value
            edge.stats['Q'] = edge.stats['W'] / edge.stats['N']

    def add_node(self, node):
        self.tree[node.id] = node
README.md

## D.sAIgn
Web design automation from a screenshot by reinforcement learning.

**Currently only training is available.**
## Features
* Monte Carlo Tree Search
* DQN

## Installation
* `Python 3`
* `tensorflow`, `keras`, `numpy`, and `selenium` (with a matching ChromeDriver), as imported by the sources


## Usage
* configure `config.py` (see the sketch below)
* `python main.py`
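The main self-play and training knobs sit at the top of `config.py`. A minimal sketch of a reduced setup for a quick local smoke run (the names come from the shipped `config.py`; the values are illustrative, not tuned recommendations):

```python
# config.py -- illustrative overrides for a short local run
EPISODES = 5        # self-play episodes per iteration (shipped default: 30)
MCTS_SIMS = 10      # MCTS simulations per move (shipped default: 50)
MEMORY_SIZE = 1000  # replay-memory size that triggers retraining (shipped default: 30000)
```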

## Roadmap
- [ ] run D.sAIgn using a trained model
- [ ] produce a notable result
- [ ] speed up training with multiprocessing
- [ ] identify the most commonly used CSS properties
- [ ] offer a pretrained model

## License
D.sAIgn is released under the [MIT License].

[MIT License]: https://github.com/seongahjo/D.sAIgn/blob/master/LICENSE
__init__.py

__all__ = ['config']
agent.py

import numpy as np
import random
import config
import MCTS as mc

import time

from browser import Chrome
from similarity import Similarity
from state import State

# the 20 CSS class names of the target page (kakao.html)
CLASS_NAMES = ['screen_out', 'tit_white', 'desc_newsfeed', 'hide', 'mArticle', 'txt_date',
               'main_summary', 'service_info', 'ico_corp', 'tit_black',
               'summary_info', 'link_newsfeed', 'img_thumb', 'now_stock', 'kakaoWrap', 'kakaoContent',
               'main_service', 'num_stock', 'main_stock', 'tit_newsfeed']


class Agent(object):
    def __init__(self, name, state_size, action_size, mcts_simulations, cpuct, model=None):
        self.name = name
        self.action_size = action_size

        self.cpuct = cpuct
        self.similarity = Similarity('result.png')
        self.MCTSsimulations = mcts_simulations
        self.model = model
        self.browser = Chrome('kakao.html')
        self.mcts = None
        self.gameState = self.reset()

        self.state_size = state_size
        self.train_overall_loss = []
        self.train_value_loss = []
        self.train_policy_loss = []
        self.val_overall_loss = []
        self.val_value_loss = []
        self.val_policy_loss = []

    def simulate(self):
        # move to a leaf node
        leaf, value, done, breadcrumbs = self.mcts.moveToLeaf()
        # evaluate the leaf node
        value, breadcrumbs = self.evaluateLeaf(leaf, value, done, breadcrumbs)
        # back-fill the value through the tree
        self.mcts.back_fill(value, breadcrumbs)

    def act(self, state, tau):
        if self.mcts is None or state.id not in self.mcts.tree:
            self.buildMCTS(state)
        else:
            self.changeRootMCTS(state)

        # run the simulations
        for sim in range(self.MCTSsimulations):
            self.simulate()

        # get action values
        pi, values = self.getAV(1)

        # pick the action
        action, value = self.chooseAction(pi, values, tau)
        print('action {} '.format(action))
        nextState, _, _ = state.takeAction(action)

        return action, pi, value

    def get_preds(self, state):
        # query the policy network for the leaf state
        inputToModel = np.array([self.model.convertToModelInput(state)])
        preds = self.model.predict(inputToModel)
        logits = preds[0]
        allowedActions = state.allowedActions

        # mask out actions that are not allowed in this state
        mask = np.ones(config.NUM_ACTIONS, dtype=bool)
        mask[allowedActions] = False

        # alternative scoring that was tried: rate each action by the image
        # similarity of the state it leads to
        # sim = np.zeros(config.NUM_ACTIONS, dtype=np.float)
        # for act in allowedActions:
        #     new_state, _, _ = state.takeAction(act)
        #     sim[act] += new_state.similarity * 100
        # logits = sim

        logits[mask] = -100

        # softmax over the masked logits
        odds = np.exp(logits)
        probs = odds / np.sum(odds)

        return probs, allowedActions

    def evaluateLeaf(self, leaf, value, done, breadcrumbs):
        if done == 0:
            # expand the leaf: add an edge (with its prior) for every allowed action
            probs, allowedActions = self.get_preds(leaf.state)
            probs = probs[allowedActions]

            for idx, act in enumerate(allowedActions):
                newState, _, _ = leaf.state.takeAction(act)
                if newState.id not in self.mcts.tree:
                    node = mc.Node(newState)
                    self.mcts.add_node(node)
                else:
                    node = self.mcts.tree[newState.id]

                newEdge = mc.Edge(leaf, node, probs[idx], act)
                leaf.edges.append((act, newEdge))

        return value, breadcrumbs

    def getAV(self, tau):
        edges = self.mcts.root.edges
        # float, not integer: visit counts are raised to the power 1 / tau
        pi = np.zeros(self.action_size, dtype=np.float32)
        values = np.zeros(self.action_size, dtype=np.float32)

        for action, edge in edges:
            pi[action] = pow(edge.stats['N'], 1 / tau)
            values[action] = edge.stats['Q']

        pi = pi / (np.sum(pi) * 1.0)
        return pi, values

    def chooseAction(self, pi, values, tau):
        if tau == 0:
            # deterministic: pick (randomly among) the most visited action(s)
            actions = np.argwhere(pi == max(pi))
            action = random.choice(actions)[0]
        else:
            # stochastic: sample an action from pi
            action_idx = np.random.multinomial(1, pi)
            action = np.where(action_idx == 1)[0][0]
        value = values[action]
        return action, value

    def replay(self, ltmemory):
        for i in range(config.TRAINING_LOOPS):
            minibatch = random.sample(ltmemory, min(config.BATCH_SIZE, len(ltmemory)))

            training_states = np.array([self.model.convertToModelInput(row['state']) for row in minibatch])
            training_targets = np.array([row['AV'] for row in minibatch])

            fit = self.model.fit(training_states, training_targets, epochs=config.EPOCHS, verbose=1,
                                 validation_split=0, batch_size=32)
            time.sleep(1.0)
            print('\n')

    def predict(self, inputToModel):
        preds = self.model.predict(inputToModel)
        return preds

    def buildMCTS(self, state):
        self.root = mc.Node(state)
        self.mcts = mc.MCTS(self.root, self.cpuct)

    def changeRootMCTS(self, state):
        self.mcts.root = self.mcts.tree[state.id]

    def reset(self):
        self.gameState = State([set() for i in range(20)], 0,
                               np.ones((20, config.NUM_ACTIONS), dtype=int),
                               CLASS_NAMES, self.browser, self.similarity)
        return self.gameState

    def step(self, action):
        next_state, value, done = self.gameState.takeAction(action)
        self.gameState = next_state
        info = None
        return next_state, value, done, info
browser.py

import datetime
import os
from selenium import webdriver
from selenium.common.exceptions import WebDriverException
import config


class Browser(object):
    def __init__(self):
        pass

    def capture(self):
        pass


class Chrome(Browser):
    def __init__(self, html):
        self.html = html
        self.browser = self._runChrome()

    def _runChrome(self):
        options = webdriver.ChromeOptions()
        options.add_argument('headless')
        options.add_argument('no-sandbox')
        driver = webdriver.Chrome(options=options)
        driver.set_window_size(config.WIDTH, config.HEIGHT)
        return driver

    def capture(self):
        """
        Render the current page in headless Chrome and save a screenshot.
        :return: image_path of the captured screenshot
        """
        date_time = datetime.datetime.now()
        date_time = date_time.strftime('%Y-%m-%d-%H-%M-%S')
        file_path = 'image/' + str(date_time) + '.png'
        now_path = 'file://' + os.path.join(os.getcwd(), self.html)
        try:
            self.browser.get(now_path)
        except WebDriverException:
            # the headless browser can die between captures; restart and retry once
            self.browser = self._runChrome()
            self.browser.get(now_path)
        self.browser.save_screenshot(file_path)
        return file_path
config.py

#### SELF PLAY
EPISODES = 30
MCTS_SIMS = 50
MEMORY_SIZE = 30000
TURNS_UNTIL_TAU0 = 10  # turn on which it starts playing deterministically
CPUCT = 1
EPSILON = 0.2
ALPHA = 0.8

INPUT_SHAPE = (20, 21)

#### RETRAINING
BATCH_SIZE = 256
EPOCHS = 50
REG_CONST = 0.0001
LEARNING_RATE = 0.1
MOMENTUM = 0.9
TRAINING_LOOPS = 10

HIDDEN_CNN_LAYERS = [
    {'filters': 75, 'kernel_size': 4}
    , {'filters': 75, 'kernel_size': 4}
    , {'filters': 75, 'kernel_size': 4}
    , {'filters': 75, 'kernel_size': 4}
    , {'filters': 75, 'kernel_size': 4}
    , {'filters': 75, 'kernel_size': 4}
]

HIDDEN_2D_CNN_LAYERS = [
    {'filters': 75, 'kernel_size': (4, 4)}
    , {'filters': 75, 'kernel_size': (4, 4)}
    , {'filters': 75, 'kernel_size': (4, 4)}
    , {'filters': 75, 'kernel_size': (4, 4)}
    , {'filters': 75, 'kernel_size': (4, 4)}
    , {'filters': 75, 'kernel_size': (4, 4)}
]

#### EVALUATION
EVAL_EPISODES = 20
SCORING_THRESHOLD = 1.3

# each action applies a bundle of CSS declarations to the current class;
# the extra action with index LAST_ACTION moves on to the next class instead
ACTION_MEANING = {
    0: 'overflow: hidden; position: absolute; width: 0; height: 0; line-height: 0; text-indent: -9999px',
    1: 'position: absolute; top: 15px; left: 20px; color: #fff; font-weight: normal; font-size: 14px; font-family: "NotoSans Regular", "Malgun Gothic", "맑은 고딕", "Apple SD Gothic Neo", "돋움", dotum, sans-serif',
    2: 'padding-top: 8px; font-size: 14px; line-height: 22px; color: #666; display: -webkit-box; overflow: hidden; max-height: 66px; -webkit-box-orient: vertical; -webkit-line-clamp: 3',
    3: 'display: none',
    4: 'position: relative; width: 1160px; margin: 0 auto; padding-bottom: 180px; width: 100%',
    5: 'display: block; padding-top: 28px; font-size: 12px; clear: both',
    6: 'overflow: hidden; max-width: 1800px; margin: 0 auto; padding: 35px 60px 0; padding-left: 20px; padding-right: 20px',
    7: 'float: left; width: 33.33%; padding: 0 20px; box-sizing: border-box',
    8: 'margin: 22px 0 0 21px; width: 18px; height: 14px; margin-top: 21px; background-position: -40px 0; display: inline-block; background-position: -70px 0; width: 17px; height: 3px; margin: 20px 0 0 4px; background-position: -90px 0',
    9: 'position: absolute; top: 15px; left: 20px; color: #1e1e1e; font-weight: normal; font-size: 14px; font-family: "NotoSans Regular", "Malgun Gothic", "맑은 고딕", "Apple SD Gothic Neo", "돋움", dotum, sans-serif',
    10: 'float: left; width: 33.33%; padding: 0 20px; box-sizing: border-box',
    11: 'display: block; position: relative',
    12: 'width: 100%; margin-bottom: 14px',
    13: 'float: left',
    14: 'position: relative; min-width: 1320px; background-color: #fff',
    15: 'padding-top: 122px; padding-top: 0',
    16: 'overflow: hidden; max-width: 1800px; margin: 0 auto; padding: 76px 60px 0; padding-left: 20px; padding-right: 20px;',
    17: 'font-weight: bold; font-size: 28px; line-height: 45px; padding-left: 2px; color: #003cff; font-size: 32px; font-weight: bold; color: #1e1e1e; display: inline-block; font-size: 20px; vertical-align: top',
    18: 'padding-top: 33px; color: #1e1e1e',
    19: 'text-decoration: underline; display: block; padding-top: 18px; font-size: 20px; line-height: 32px; color: #1e1e1e',
}
WIDTH = 800
HEIGHT = 600

IMAGE_SIZE = (224, 224)

LAST_ACTION = len(ACTION_MEANING)
NUM_ACTIONS = len(ACTION_MEANING) + 1
main.py

import pickle
import random

from DNN.model import ResidualCNN
from agent import Agent
from memory import Memory
import config
import os


def playMatches(web, EPISODES, turns_until_tau0, memory=None):
    # scores = {player1.name: 0, "drawn": 0, player2.name: 0}
    # sp_scores = {'sp': 0, "drawn": 0, 'nsp': 0}
    # points = {player1.name: [], player2.name: []}

    for e in range(EPISODES):

        state = web.reset()

        done = 0
        web.mcts = None
        turn = 0
        while done == 0:
            turn = turn + 1

            # run the MCTS algorithm and return an action
            action, pi, value = web.act(state, 1)

            if memory is not None:
                # commit the move to short-term memory
                memory.commit_stmemory(state, pi)

            # take the action
            state, value, done, _ = web.step(action)

            if done == 1:
                print('done')
                if memory is not None:
                    # the game is finished: assign the final value to its moves
                    # and flush them into long-term memory
                    for move in memory.stmemory:
                        move['value'] = value
                    memory.commit_ltmemory()

    return memory


iteration = 0
cnn = ResidualCNN(config.REG_CONST, config.LEARNING_RATE, config.INPUT_SHAPE, config.NUM_ACTIONS,
                  config.HIDDEN_CNN_LAYERS)
current_player = Agent('current_player', 20, config.NUM_ACTIONS, config.MCTS_SIMS, config.CPUCT, cnn)
# the original assigned memory = None here, which crashes in the loop below;
# assuming the Memory class from memory.py is the intended replay buffer
memory = Memory(config.MEMORY_SIZE)
run_folder = './run/'
if not os.path.exists(run_folder):
    os.mkdir(run_folder)
os.makedirs(run_folder + 'memory', exist_ok=True)  # target directory of the pickle dump below

while True:
    iteration += 1
    print('ITERATION NUMBER ' + str(iteration))
    memory = playMatches(current_player, config.EPISODES, turns_until_tau0=config.TURNS_UNTIL_TAU0, memory=memory)
    memory.clear_stmemory()

    if len(memory.ltmemory) >= config.MEMORY_SIZE:

        ######## RETRAINING ########
        print('RETRAINING...')
        current_player.replay(memory.ltmemory)
        print('')

        if iteration % 5 == 0:
            pickle.dump(memory, open(run_folder + "memory/memory" + str(iteration).zfill(4) + ".p", "wb"))

        memory_samp = random.sample(memory.ltmemory, min(1000, len(memory.ltmemory)))

    else:
        print('MEMORY SIZE: ' + str(len(memory.ltmemory)))
memory.py

from collections import deque

import config


class Memory:
    def __init__(self, memory_size):
        # config.MEMORY_SIZE takes precedence over the constructor argument
        self.MEMORY_SIZE = config.MEMORY_SIZE or memory_size
        self.ltmemory = deque(maxlen=self.MEMORY_SIZE)
        self.stmemory = deque(maxlen=self.MEMORY_SIZE)

    # For training: the stored state_check array is the model input and
    # 'AV' (the action values, i.e. the MCTS policy pi) is the label.

    def commit_stmemory(self, state, action_value):
        self.stmemory.append({
            'state': state.state_check
            , 'AV': action_value
        })

    def commit_ltmemory(self):
        for i in self.stmemory:
            self.ltmemory.append(i)
        self.clear_stmemory()

    def clear_stmemory(self):
        self.stmemory = deque(maxlen=config.MEMORY_SIZE)
similarity.py

import keras
import numpy as np
from keras.applications.vgg16 import preprocess_input, VGG16
from keras.preprocessing import image
from numpy.linalg import norm

keras.backend.set_image_data_format('channels_first')


def preprocess_image(img_path):
    img = image.load_img(img_path, target_size=(224, 224))
    img_data = image.img_to_array(img, data_format='channels_first')
    img_data = np.expand_dims(img_data, axis=0)
    img_data = preprocess_input(img_data)
    return img_data


class Similarity(object):
    def __init__(self, dest_file_path):
        self.model = VGG16(weights='imagenet', include_top=False)
        self.dest = preprocess_image(dest_file_path)

    def _feature(self, img):
        # flatten the VGG16 conv features of a 224x224 input: (512, 7, 7) -> 25088
        image_features = self.model.predict(img)
        image_features = image_features.reshape(7 * 7 * 512)
        return image_features

    def similarity(self, before_image):
        """
        Cosine similarity between a captured screenshot and the target image.
        :return: similarity between the current image and the target image
        """
        before = self._feature(before_image)
        after = self._feature(self.dest)
        return np.dot(before, after) / (norm(before) * norm(after))
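A minimal usage sketch of the similarity check (it assumes `result.png` exists as the target screenshot; the capture path below is hypothetical, standing in for whatever `Chrome.capture` returned):

```python
from similarity import Similarity, preprocess_image

sim = Similarity('result.png')                   # target screenshot
current = preprocess_image('image/capture.png')  # hypothetical capture path
print(sim.similarity(current))                   # closer to 1.0 means more similar
```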
state.py

import base64
import config
import numpy as np
import copy

from similarity import preprocess_image


class State(object):
    def __init__(self, board, index, state_check, class_names, browser, sim_func):
        self.class_names = class_names  # CSS class names
        self.board = board  # current situation: one set of applied actions per class
        self.index = index  # index of the class currently being styled
        self.id = self._convertStateToId()  # id identifying this state
        self.state_check = state_check  # (len(board), NUM_ACTIONS) array; 1 marks an action still available
        self.allowedActions = self._available_action()
        self.browser = browser
        self._make_css(state_check)
        self.sim_func = sim_func
        self.now_image = preprocess_image(self.browser.capture())
        self.similarity = sim_func.similarity(self.now_image)

    def _available_action(self):
        return np.nonzero(self.state_check[self.index])[0]

    def _convertStateToId(self):
        id = '{}'.format(self.index).join(map(lambda f: str(f) if len(f) != 0 else '{}', self.board))
        b64 = base64.b64encode(id.encode('utf-8'))
        return str(b64)

    def _checkForEndGame(self):
        if self.index >= len(self.board) - 2:
            return True
        return False

    def takeAction(self, act):
        """
        Apply the action and produce the next state.
        :param act: action index
        :returns: newState, value, done
        """
        if act >= config.NUM_ACTIONS:
            raise IndexError

        newBoard = copy.deepcopy(self.board)
        newStateCheck = copy.deepcopy(self.state_check)
        value = 0
        done = 0
        index = self.index
        if act == config.LAST_ACTION:
            # the last action moves on to the next CSS class
            index += 1
        else:
            newBoard[index].add(act)
            newStateCheck[index][act] = 0
        newState = State(newBoard, index, newStateCheck, self.class_names, self.browser, self.sim_func)
        if newState._checkForEndGame():
            print('done')
            done = 1
        if newState.similarity >= 0.8:
            done = 1
            value = 1
            print('good')

        return newState, value, done

    def _make_css(self, state_check):
        """
        Write main.css from state_check.
        :return: file_name
        """
        file_name = 'main.css'
        with open(file_name, 'w') as f:
            for class_index, actions in enumerate(state_check):
                class_index = int(class_index)
                f.write(".{}".format(self.class_names[class_index]))
                f.write("{")
                for action_index, action in enumerate(actions):
                    if action == 0:
                        # an entry of 0 means the action has been applied to this class
                        f.write(" {}; ".format(config.ACTION_MEANING[action_index]))
                f.write("}\n")

        return file_name

    def reset(self):
        """
        Reset the state.
        :return:
        """
        self.index = 0
        self.state_check = np.ones((len(self.board), config.NUM_ACTIONS))