@@ -655,14 +655,13 @@ <h1>Source code for lzero.mcts.buffer.game_buffer</h1><div class="highlight"><pr
655
655
< span class ="c1 "> # print(f'valid_len is {valid_len}')</ span >
656
656
657
657
< span class ="k "> if</ span > < span class ="n "> meta</ span > < span class ="p "> [</ span > < span class ="s1 "> 'priorities'</ span > < span class ="p "> ]</ span > < span class ="ow "> is</ span > < span class ="kc "> None</ span > < span class ="p "> :</ span >
658
- < span class ="n "> max_prio</ span > < span class ="o "> =</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="o "> .</ span > < span class ="n "> max</ span > < span class ="p "> ()</ span > < span class ="k "> if</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_segment_buffer</ span > < span class ="k "> else</ span > < span class ="mi "> 1</ span >
658
+ < span class ="k "> if</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_segment_buffer</ span > < span class ="p "> :</ span >
659
+ < span class ="n "> max_prio</ span > < span class ="o "> =</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="o "> .</ span > < span class ="n "> max</ span > < span class ="p "> ()</ span > < span class ="k "> if</ span > < span class ="nb "> len</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="p "> )</ span > < span class ="o "> ></ span > < span class ="mi "> 0</ span > < span class ="k "> else</ span > < span class ="mi "> 1</ span >
660
+ < span class ="k "> else</ span > < span class ="p "> :</ span >
661
+ < span class ="n "> max_prio</ span > < span class ="o "> =</ span > < span class ="mi "> 1</ span >
662
+
659
663
< span class ="c1 "> # if no 'priorities' provided, set the valid part of the new-added game history the max_prio</ span >
660
- < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="o "> =</ span > < span class ="n "> np</ span > < span class ="o "> .</ span > < span class ="n "> concatenate</ span > < span class ="p "> (</ span >
661
- < span class ="p "> (</ span >
662
- < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="p "> ,</ span > < span class ="p "> [</ span > < span class ="n "> max_prio</ span >
663
- < span class ="k "> for</ span > < span class ="n "> _</ span > < span class ="ow "> in</ span > < span class ="nb "> range</ span > < span class ="p "> (</ span > < span class ="n "> valid_len</ span > < span class ="p "> )]</ span > < span class ="o "> +</ span > < span class ="p "> [</ span > < span class ="mf "> 0.</ span > < span class ="k "> for</ span > < span class ="n "> _</ span > < span class ="ow "> in</ span > < span class ="nb "> range</ span > < span class ="p "> (</ span > < span class ="n "> valid_len</ span > < span class ="p "> ,</ span > < span class ="n "> data_length</ span > < span class ="p "> )]</ span >
664
- < span class ="p "> )</ span >
665
- < span class ="p "> )</ span >
664
+ < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="o "> =</ span > < span class ="n "> np</ span > < span class ="o "> .</ span > < span class ="n "> concatenate</ span > < span class ="p "> ((</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> game_pos_priorities</ span > < span class ="p "> ,</ span > < span class ="p "> [</ span > < span class ="n "> max_prio</ span > < span class ="k "> for</ span > < span class ="n "> _</ span > < span class ="ow "> in</ span > < span class ="nb "> range</ span > < span class ="p "> (</ span > < span class ="n "> valid_len</ span > < span class ="p "> )]</ span > < span class ="o "> +</ span > < span class ="p "> [</ span > < span class ="mf "> 0.</ span > < span class ="k "> for</ span > < span class ="n "> _</ span > < span class ="ow "> in</ span > < span class ="nb "> range</ span > < span class ="p "> (</ span > < span class ="n "> valid_len</ span > < span class ="p "> ,</ span > < span class ="n "> data_length</ span > < span class ="p "> )]))</ span >
666
665
< span class ="k "> else</ span > < span class ="p "> :</ span >
667
666
< span class ="k "> assert</ span > < span class ="n "> data_length</ span > < span class ="o "> ==</ span > < span class ="nb "> len</ span > < span class ="p "> (</ span > < span class ="n "> meta</ span > < span class ="p "> [</ span > < span class ="s1 "> 'priorities'</ span > < span class ="p "> ]),</ span > < span class ="s2 "> " priorities should be of same length as the game steps"</ span >
668
667
< span class ="n "> priorities</ span > < span class ="o "> =</ span > < span class ="n "> meta</ span > < span class ="p "> [</ span > < span class ="s1 "> 'priorities'</ span > < span class ="p "> ]</ span > < span class ="o "> .</ span > < span class ="n "> copy</ span > < span class ="p "> ()</ span > < span class ="o "> .</ span > < span class ="n "> reshape</ span > < span class ="p "> (</ span > < span class ="o "> -</ span > < span class ="mi "> 1</ span > < span class ="p "> )</ span >
0 commit comments