def forward(
    self,
    input: rlt.PreprocessedRankingInput,
    mode: str,
    greedy: Optional[bool] = None,
):
    """Mock ranking forward pass returning fixed, hard-coded outputs.

    Evaluation data pages only call this with the two modes asserted below;
    anything else is a test setup error.
    """
    # The creation of evaluation data pages only uses these specific arguments
    assert mode in (Seq2SlateMode.RANK_MODE, Seq2SlateMode.PER_SEQ_LOG_PROB_MODE)
    if mode != Seq2SlateMode.RANK_MODE:
        # Per-sequence log-prob mode: fixed log-probabilities for 3 sequences.
        return rlt.RankingOutput(
            log_probs=torch.log(torch.tensor([0.4, 0.3, 0.7]))
        )
    assert greedy
    # Rank mode: fixed slate orderings for a batch of 3.
    fixed_slates = torch.tensor([[2, 3], [3, 2], [2, 3]]).long()
    return rlt.RankingOutput(ranked_tgt_out_idx=fixed_slates)
def forward(
    self,
    input: rlt.PreprocessedRankingInput,
    mode: str,
    tgt_seq_len: Optional[int] = None,
    greedy: Optional[bool] = None,
):
    """Run the data-parallel seq2slate model and wrap its raw output.

    :param input: preprocessed ranking batch forwarded to the wrapped model
    :param mode: which head to run (ranking vs. log-prob computation)
    :param tgt_seq_len: target slate length, passed through to the model
    :param greedy: whether ranking should be greedy, passed through
    :return: rlt.RankingOutput holding either ranked indices/probs or log-probs
    :raises NotImplementedError: for any unrecognized mode
    """
    res = self.data_parallel(
        input, mode=mode, tgt_seq_len=tgt_seq_len, greedy=greedy
    )
    if mode == RANK_MODE:
        # res is a pair: (ranked_tgt_out_probs, ranked_tgt_out_idx)
        return rlt.RankingOutput(
            ranked_tgt_out_idx=res[1], ranked_tgt_out_probs=res[0]
        )
    elif mode == LOG_PROB_MODE:
        return rlt.RankingOutput(log_probs=res)
    else:
        # Fix: previously an unhandled mode fell through and returned None
        # silently; fail loudly instead, consistent with the sibling
        # data-parallel wrapper in this file.
        raise NotImplementedError()
def forward(
    self,
    input: rlt.PreprocessedRankingInput,
    mode: str,
    tgt_seq_len: Optional[int] = None,
    greedy: Optional[bool] = None,
):
    """Dispatch through the data-parallel model and wrap the per-mode result.

    Rank mode returns ranked indices and their probabilities; the two
    log-prob modes return log-probabilities; any other mode raises.
    """
    model_out = self.data_parallel(
        input, mode=mode, tgt_seq_len=tgt_seq_len, greedy=greedy
    )
    if mode == Seq2SlateMode.RANK_MODE:
        # model_out is (ranked_tgt_out_probs, ranked_tgt_out_idx)
        ranked_probs, ranked_idx = model_out[0], model_out[1]
        return rlt.RankingOutput(
            ranked_tgt_out_idx=ranked_idx, ranked_tgt_out_probs=ranked_probs
        )
    log_prob_modes = (
        Seq2SlateMode.PER_SYMBOL_LOG_PROB_DIST_MODE,
        Seq2SlateMode.PER_SEQ_LOG_PROB_MODE,
    )
    if mode not in log_prob_modes:
        raise NotImplementedError()
    return rlt.RankingOutput(log_probs=model_out)
def forward(self, input: rlt.PreprocessedRankingInput, mode: str, greedy: bool):
    """Greedily rank each state in the batch via the per-state _forward helper."""
    # The creation of evaluation data pages only uses these specific arguments
    assert greedy and mode == RANK_MODE
    states = input.state.float_features
    # One ranked slate per batch element, produced independently per state.
    slates = [self._forward(states[i]) for i in range(states.shape[0])]
    return rlt.RankingOutput(ranked_tgt_out_idx=torch.tensor(slates).long())