1880e8fb67b7cbcb6e75c743d45cebf7cba3f876,contents/9_Deep_Deterministic_Policy_Gradient_DDPG/DDPG_update.py,DDPG,__init__,#DDPG#,36

Before Change


        self.ct_params = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope="Critic/target")

        # target net replacement
        self.soft_replace = [[tf.assign(ta, (1 - TAU) * ta + TAU * ea), tf.assign(tc, (1 - TAU) * tc + TAU * ec)]
                             for ta, ea, tc, ec in zip(self.at_params, self.ae_params, self.ct_params, self.ce_params)]

        q_target = self.R + GAMMA * q_

After Change


        self.ct_params = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope="Critic/target")

        # target net replacement
        self.soft_replace = [tf.assign(t, (1 - TAU) * t + TAU * e)
                             for t, e in zip(self.at_params + self.ct_params, self.ae_params + self.ce_params)]

        q_target = self.R + GAMMA * q_
        # in the feed_dict for the td_error, self.a should be changed to the actions in memory

In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 2

Instances

Link

Project Name: MorvanZhou/Reinforcement-learning-with-tensorflow

Commit Name: 1880e8fb67b7cbcb6e75c743d45cebf7cba3f876

Time: 2018-11-16

Author: morvanzhou@gmail.com

File Name: contents/9_Deep_Deterministic_Policy_Gradient_DDPG/DDPG_update.py

Class Name: DDPG

Method Name: __init__

Link

Project Name: QUANTAXIS/QUANTAXIS

Commit Name: 94db34e6f69f7874cb47b9a08a2a2ccbd6ac9079

Time: 2019-02-09

Author: yutiansut@qq.com

File Name: QUANTAXIS/QAARP/QARisk.py

Class Name: QA_Performance

Method Name: pnl_fifo

Link

Project Name: datascienceinc/Skater

Commit Name: 2ae494d00ce9fcf11fe85517c7136d205be4d545

Time: 2018-02-18

Author: pramitchoudhary@ip-172-30-0-2.us-west-2.compute.internal

File Name: skater/core/global_interpretation/interpretable_models/rule_lists.py

Class Name: BayesianRuleLists

Method Name: fit

1880e8fb67b7cbcb6e75c743d45cebf7cba3f876,contents/9_Deep_Deterministic_Policy_Gradient_DDPG/DDPG_update.py,DDPG,__init__,#DDPG#,36

Before Change

After Change

Instances

1880e8fb67b7cbcb6e75c743d45cebf7cba3f876,contents/9_Deep_Deterministic_Policy_Gradient_DDPG/DDPG_update.py,DDPG,__init__,#DDPG#,36