
Commit

Add completion options for evaluation with multi-choice problem datasets
kooyunmo committed Aug 11, 2023
1 parent 73e5689 commit 0ac46bd
Showing 3 changed files with 12 additions and 0 deletions.
4 changes: 4 additions & 0 deletions docs/docs/sdk/api/completion.mdx
@@ -75,6 +75,8 @@ following schema.
| `bad_words` | `Optional[List[str]]` | `None` |
| `bad_word_tokens` | `Optional[List[TokenSequence]]` | `None` |
| `include_output_logits` | `Optional[bool]` | `None` |
| `include_output_logprobs` | `Optional[bool]` | `None` |
| `forced_output_tokens` | `Optional[List[int]]` | `None` |
| `eos_token` | `Optional[List[int]]` | `None` |

The following are descriptions of each field.
@@ -105,6 +107,8 @@ The following are descriptions of each field.
- **bad_words**: Text phrases that should not be generated. For a bad word phrase that contains N tokens, if the first N-1 tokens appear at the end of the generated result, the logit for the last token of the phrase is set to -inf. We recommend using `bad_word_tokens` because it is clearer (see the description of the `stop` field for details). Defaults to an empty list.
- **bad_word_tokens**: Same as the `bad_words` field above, but takes token sequences instead of text phrases. This is similar to Hugging Face's <a href="https://huggingface.co/docs/transformers/v4.26.0/en/main_classes/text_generation#transformers.GenerationConfig.bad_words_ids(List[List[int]]," target="_top">`bad_words_ids`</a> argument.
- **include_output_logits**: Whether to include the output logits in the generation output.
- **include_output_logprobs**: Whether to include the output logprobs in the generation output.
- **forced_output_tokens**: A token sequence that is enforced as the generation output. This option can be used when evaluating the model on datasets with multiple-choice problems (e.g., [HellaSwag](https://huggingface.co/datasets/hellaswag), [MMLU](https://huggingface.co/datasets/cais/mmlu)). When used together with the `include_output_logits` or `include_output_logprobs` option, it lets you easily obtain the logits or logprobs of the forced tokens for evaluation.
- **eos_token**: A list of end-of-sentence (EOS) tokens.

:::note
4 changes: 4 additions & 0 deletions periflow/schema/api/v1/completion.py
@@ -50,6 +50,10 @@ class V1CompletionOptions(BaseModel):
    bad_words: Optional[List[str]] = None  # List of bad words.
    bad_word_tokens: Optional[List[TokenSequence]] = None  # List of bad word tokens.
    include_output_logits: Optional[bool] = None  # Include logits in the output.
    include_output_logprobs: Optional[bool] = None  # Include logprobs in the output.
    forced_output_tokens: Optional[
        List[int]
    ] = None  # List of tokens enforced to be generated.
    eos_token: Optional[List[int]] = None  # List of EOS tokens.


4 changes: 4 additions & 0 deletions periflow/sdk/api/completion.py
@@ -98,6 +98,8 @@ def create(
| `bad_words` | `Optional[List[str]]` | `None` |
| `bad_word_tokens` | `Optional[List[TokenSequence]]` | `None` |
| `include_output_logits` | `Optional[bool]` | `None` |
| `include_output_logprobs` | `Optional[bool]` | `None` |
| `forced_output_tokens` | `Optional[List[int]]` | `None` |
| `eos_token` | `Optional[List[int]]` | `None` |
The following are descriptions of each field.
@@ -128,6 +130,8 @@ def create(
- **bad_words**: Text phrases that should not be generated. For a bad word phrase that contains N tokens, if the first N-1 tokens appear at the end of the generated result, the logit for the last token of the phrase is set to -inf. We recommend using `bad_word_tokens` because it is clearer (see the description of the `stop` field for details). Defaults to an empty list.
- **bad_word_tokens**: Same as the `bad_words` field above, but takes token sequences instead of text phrases. This is similar to Hugging Face's <a href="https://huggingface.co/docs/transformers/v4.26.0/en/main_classes/text_generation#transformers.GenerationConfig.bad_words_ids(List[List[int]]," target="_top">`bad_words_ids`</a> argument.
- **include_output_logits**: Whether to include the output logits in the generation output.
- **include_output_logprobs**: Whether to include the output logprobs in the generation output.
- **forced_output_tokens**: A token sequence that is enforced as the generation output. This option can be used when evaluating the model on datasets with multiple-choice problems (e.g., [HellaSwag](https://huggingface.co/datasets/hellaswag), [MMLU](https://huggingface.co/datasets/cais/mmlu)). When used together with the `include_output_logits` or `include_output_logprobs` option, it lets you easily obtain the logits or logprobs of the forced tokens for evaluation.
- **eos_token**: A list of end-of-sentence (EOS) tokens.
:::note

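Taken together, the two new options support multiple-choice evaluation by forcing each answer candidate's token IDs as the output and reading back their logprobs. Below is a minimal, hypothetical sketch of that flow; the client entry point, the `prompt`/`max_tokens` fields, and the response attribute path are assumptions for illustration and may not match the SDK exactly — only `forced_output_tokens` and `include_output_logprobs` come from this commit.

```python
# Hypothetical sketch: score one multiple-choice candidate (e.g., for HellaSwag/MMLU)
# by forcing its token IDs as the output and summing the returned logprobs.
from periflow.schema.api.v1.completion import V1CompletionOptions
from periflow.sdk.api.completion import Completion  # assumed public entry point

# Token IDs of one answer candidate, produced by the deployed model's tokenizer.
candidate_tokens = [464, 3139, 286, 4881, 318, 6342]  # placeholder IDs

options = V1CompletionOptions(
    prompt="Question text plus the answer stem",  # assumed field name
    max_tokens=len(candidate_tokens),             # assumed field name
    forced_output_tokens=candidate_tokens,        # force the candidate as the output
    include_output_logprobs=True,                 # return a logprob per forced token
)

api = Completion()                    # deployment/auth configuration omitted
result = api.create(options=options)  # assumed keyword argument

# Sum (or length-normalize) the per-token logprobs; running this for every candidate
# and picking the highest score gives the model's answer. Response shape is assumed.
score = sum(result.choices[0].logprobs)
print(score)
```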