gymcts 1.4.3__py3-none-any.whl → 1.4.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gymcts/gymcts_neural_agent.py +2 -0
- {gymcts-1.4.3.dist-info → gymcts-1.4.4.dist-info}/METADATA +1 -1
- {gymcts-1.4.3.dist-info → gymcts-1.4.4.dist-info}/RECORD +6 -6
- {gymcts-1.4.3.dist-info → gymcts-1.4.4.dist-info}/WHEEL +0 -0
- {gymcts-1.4.3.dist-info → gymcts-1.4.4.dist-info}/licenses/LICENSE +0 -0
- {gymcts-1.4.3.dist-info → gymcts-1.4.4.dist-info}/top_level.txt +0 -0
gymcts/gymcts_neural_agent.py
CHANGED
|
@@ -168,6 +168,8 @@ class GymctsNeuralNode(GymctsNode):
|
|
|
168
168
|
elif GymctsNeuralNode.score_variate == "PUCT_v1":
|
|
169
169
|
return exploitation_term + c * p_sa * math.sqrt(2 * math.log(n_s) / (n_sa))
|
|
170
170
|
elif GymctsNeuralNode.score_variate == "PUCT_v2":
|
|
171
|
+
if n_sa == 0:
|
|
172
|
+
return float("inf") # Avoid division by zero
|
|
171
173
|
return exploitation_term + c * p_sa * math.sqrt(n_s) / n_sa
|
|
172
174
|
elif GymctsNeuralNode.score_variate == "PUCT_v3":
|
|
173
175
|
return exploitation_term + c * (p_sa ** GymctsNeuralNode.PUCT_v3_mu) * math.sqrt(n_s / (1 + n_sa))
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: gymcts
|
|
3
|
-
Version: 1.4.3
|
|
3
|
+
Version: 1.4.4
|
|
4
4
|
Summary: A minimalistic implementation of the Monte Carlo Tree Search algorithm for planning problems formulated as gymnasium reinforcement learning environments.
|
|
5
5
|
Author: Alexander Nasuta
|
|
6
6
|
Author-email: Alexander Nasuta <alexander.nasuta@wzl-iqs.rwth-aachen.de>
|
|
@@ -5,12 +5,12 @@ gymcts/gymcts_agent.py,sha256=FzMPjHXyKN6enNJubmYEouvb0wBbE1-bpxuLuW4J1gU,10960
|
|
|
5
5
|
gymcts/gymcts_deepcopy_wrapper.py,sha256=lCCT5-6JVCwUCP__4uPMMkT5HnO2JWm2ebzJ69zXp9c,6792
|
|
6
6
|
gymcts/gymcts_distributed_agent.py,sha256=Ha9UBQvFjoErfMWvPyN0JcTYz-JaiJ4eWjLMikp9Yhs,11569
|
|
7
7
|
gymcts/gymcts_env_abc.py,sha256=iqrFNNSa-kZyAGk1UN2BjkdkV6NufAkYJT8d7PlQ07E,2525
|
|
8
|
-
gymcts/gymcts_neural_agent.py,sha256=
|
|
8
|
+
gymcts/gymcts_neural_agent.py,sha256=_PV_lNYVyZDjrPBRYK-DWiQRwUGnleAt3SKbwCZKCWU,16326
|
|
9
9
|
gymcts/gymcts_node.py,sha256=KAR5y1MrT8c_7ZXwTuCj77B7DiERDfHplF8avs76JHU,13410
|
|
10
10
|
gymcts/gymcts_tree_plotter.py,sha256=PR6C7q9Q4kuz1aLGyD7-aZsxk3RqlHZpOqmOiRpCyK0,3547
|
|
11
11
|
gymcts/logger.py,sha256=RI7B9cvbBGrj0_QIAI77wihzuu2tPG_-z9GM2Mw5aHE,926
|
|
12
|
-
gymcts-1.4.
|
|
13
|
-
gymcts-1.4.
|
|
14
|
-
gymcts-1.4.
|
|
15
|
-
gymcts-1.4.
|
|
16
|
-
gymcts-1.4.
|
|
12
|
+
gymcts-1.4.4.dist-info/licenses/LICENSE,sha256=UGe75WojDiw_77SEnK2aysEDlElRlkWie7U7NaAFx00,1072
|
|
13
|
+
gymcts-1.4.4.dist-info/METADATA,sha256=y_-_ktxyZpaLdB0i81ggKepZNycG-P1jiqqadBMwSzI,23864
|
|
14
|
+
gymcts-1.4.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
15
|
+
gymcts-1.4.4.dist-info/top_level.txt,sha256=E8MoLsPimUPD0H1Y6lum4TVe-lhSDAyBAXGrkYIT52w,7
|
|
16
|
+
gymcts-1.4.4.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|