impresso-project
/

nel-mgenre-multilingual

Text2Text Generation

entity-retrieval

named-entity-disambiguation

entity-disambiguation

named-entity-linking

Inference Endpoints

Model card Files Files and versions Community

Emanuela Boros committed on Oct 18, 2024

Commit

69c8f9c

·

1 Parent(s): f68e037

added confidence

Files changed (1) hide show

generic_nel.py +7 -8

generic_nel.py CHANGED Viewed

@@ -111,26 +111,25 @@ class NelPipeline(Pipeline):
             num_beams=1,
             num_return_sequences=1,
             max_new_tokens=30,
-            # return_dict_in_generate=True,
-            # output_scores=True,
         )
-        # print(outputs)
-        # token_ids, scores = outputs.sequences, outputs.scores
         # Decode the predictions into readable text
         wikipedia_predictions = self.tokenizer.batch_decode(
-            outputs, skip_special_tokens=True
         )
         # Process the scores for each token
         # print(scores)
         # print(type(scores), len(scores), type(list(scores)))
-        # scores = torch.cat(scores, dim=0)
         #
         # # scores_tensor = scores.clone().detach()
-        # probabilities = torch.exp(scores)
         # percentages = (probabilities * 100.0).cpu().numpy().tolist()
-        percentages = [0, 1, 2, 3, 3, 5]
         # # Process each score (logits for the generated tokens)
         # for i, score in enumerate(scores):
         #     # Apply softmax to convert logits into probabilities

             num_beams=1,
             num_return_sequences=1,
             max_new_tokens=30,
+            return_dict_in_generate=True,
+            output_scores=True,
         )
+        print(outputs.keys(), "!!!!")
+        token_ids, scores = outputs.sequences, outputs.scores
         # Decode the predictions into readable text
         wikipedia_predictions = self.tokenizer.batch_decode(
+            outputs.sequences, skip_special_tokens=True
         )
         # Process the scores for each token
         # print(scores)
         # print(type(scores), len(scores), type(list(scores)))
+        scores = torch.cat(scores, dim=0)
         #
         # # scores_tensor = scores.clone().detach()
+        probabilities = torch.exp(scores)
         # percentages = (probabilities * 100.0).cpu().numpy().tolist()
         # # Process each score (logits for the generated tokens)
         # for i, score in enumerate(scores):
         #     # Apply softmax to convert logits into probabilities