File size: 1,829 Bytes
9a7d9d2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
import torch
import tensorflow as tf
import numpy as np
from transformers import Text2TextGenerationPipeline

class DemoT5QAPipeline(Text2TextGenerationPipeline):
    def _forward(self, model_inputs, **generate_kwargs):
        if self.framework == "pt":
            in_b, input_length = model_inputs["input_ids"].shape
        elif self.framework == "tf":
            in_b, input_length = tf.shape(model_inputs["input_ids"]).numpy()

        self.check_inputs(
            input_length,
            generate_kwargs.get("min_length", self.model.config.min_length),
            generate_kwargs.get("max_length", self.model.config.max_length),
        )
        outputs = self.model.generate(**model_inputs, **generate_kwargs, return_dict_in_generate=True, output_scores=True, max_new_tokens=75)
        
        # Code from the parent class
        output_ids = outputs.sequences
        out_b = output_ids.shape[0]
        if self.framework == "pt":
            output_ids = output_ids.reshape(in_b, out_b // in_b, *output_ids.shape[1:])
        elif self.framework == "tf":
            output_ids = tf.reshape(output_ids, (in_b, out_b // in_b, *output_ids.shape[1:]))

        output_sequences = outputs.sequences
        output_scores = outputs.scores
        return {"output_ids": output_ids, "output_sequences": output_sequences, "output_scores": output_scores}
    
    def postprocess(self, model_outputs):
        guess_text = super().postprocess(model_outputs)[0]['generated_text']

        transition_scores = self.model.compute_transition_scores(model_outputs['output_sequences'], model_outputs['output_scores'], normalize_logits=True)
        log_probs = np.round(np.exp(transition_scores.cpu().numpy()), 3)[0]
        guess_prob = np.product(log_probs)

        return {'guess': guess_text, 'confidence': guess_prob}