Spaces:

huggingfacejs
/

inference-widgets

Running on CPU Upgrade

App Files Files Community

machineuser committed on Feb 12, 2024

Commit

60fd1b8

1 Parent(s): a6b2d88

Sync widgets demo

Browse files

Files changed (3) hide show

packages/tasks/src/tasks/text-generation/inference.ts +110 -4
packages/tasks/src/tasks/text-generation/spec/input.json +18 -2
packages/tasks/src/tasks/text-generation/spec/output.json +107 -1

packages/tasks/src/tasks/text-generation/inference.ts CHANGED Viewed

@@ -26,11 +26,24 @@ export interface TextGenerationInput {
  */
 export interface TextGenerationParameters {
 	/**
-	 * Whether to use logit sampling (true) or greedy search (false).
 	 */
 	do_sample?: boolean;
 	/**
-	 * Maximum number of generated tokens.
 	 */
 	max_new_tokens?: number;
 	/**
@@ -42,6 +55,10 @@ export interface TextGenerationParameters {
 	 * Whether to prepend the prompt to the generated text.
 	 */
 	return_full_text?: boolean;
 	/**
 	 * Stop generating tokens if a member of `stop_sequences` is generated.
 	 */
@@ -79,10 +96,99 @@ export interface TextGenerationParameters {
  * Outputs for Text Generation inference
  */
 export interface TextGenerationOutput {
-	generatedText: unknown;
 	/**
 	 * The generated text
 	 */
-	generated_text?: string;
 	[property: string]: unknown;
 }

  */
 export interface TextGenerationParameters {
 	/**
+	 * The number of sampling queries to run. Only the best one (in terms of total logprob) will
+	 * be returned.
+	 */
+	best_of?: number;
+	/**
+	 * Whether or not to output decoder input details
+	 */
+	decoder_input_details?: boolean;
+	/**
+	 * Whether or not to output details
+	 */
+	details?: boolean;
+	/**
+	 * Whether to use logits sampling instead of greedy decoding when generating new tokens.
 	 */
 	do_sample?: boolean;
 	/**
+	 * The maximum number of tokens to generate.
 	 */
 	max_new_tokens?: number;
 	/**
 	 * Whether to prepend the prompt to the generated text.
 	 */
 	return_full_text?: boolean;
+	/**
+	 * The random sampling seed.
+	 */
+	seed?: number;
 	/**
 	 * Stop generating tokens if a member of `stop_sequences` is generated.
 	 */
  * Outputs for Text Generation inference
  */
 export interface TextGenerationOutput {
+	/**
+	 * When enabled, details about the generation
+	 */
+	details?: TextGenerationOutputDetails;
+	/**
+	 * The generated text
+	 */
+	generated_text: string;
+	[property: string]: unknown;
+}
+/**
+ * When enabled, details about the generation
+ */
+export interface TextGenerationOutputDetails {
+	/**
+	 * Details about additional sequences when best_of is provided
+	 */
+	best_of_sequences?: TextGenerationSequenceDetails[];
+	/**
+	 * The reason why the generation was stopped.
+	 */
+	finish_reason: FinishReason;
+	/**
+	 * The number of generated tokens
+	 */
+	generated_tokens: number;
+	prefill: PrefillToken[];
+	/**
+	 * The random seed used for generation
+	 */
+	seed?: number;
+	/**
+	 * The generated tokens and associated details
+	 */
+	tokens: Token[];
+	[property: string]: unknown;
+}
+export interface TextGenerationSequenceDetails {
+	/**
+	 * The reason why the generation was stopped.
+	 */
+	finish_reason: FinishReason;
 	/**
 	 * The generated text
 	 */
+	generated_text: number;
+	/**
+	 * The number of generated tokens
+	 */
+	generated_tokens: number;
+	prefill: PrefillToken[];
+	/**
+	 * The random seed used for generation
+	 */
+	seed?: number;
+	/**
+	 * The generated tokens and associated details
+	 */
+	tokens: Token[];
+	[property: string]: unknown;
+}
+/**
+ * The generated sequence reached the maximum allowed length
+ *
+ * The model generated an end-of-sentence (EOS) token
+ *
+ * One of the sequence in stop_sequences was generated
+ */
+export type FinishReason = "length" | "eos_token" | "stop_sequence";
+export interface PrefillToken {
+	id: number;
+	logprob: number;
+	/**
+	 * The text associated with that token
+	 */
+	text: string;
+	[property: string]: unknown;
+}
+export interface Token {
+	id: number;
+	logprob: number;
+	/**
+	 * Whether or not that token is a special one
+	 */
+	special: boolean;
+	/**
+	 * The text associated with that token
+	 */
+	text: string;
 	[property: string]: unknown;
 }

packages/tasks/src/tasks/text-generation/spec/input.json CHANGED Viewed

@@ -20,13 +20,25 @@
 			"description": "Additional inference parameters for Text Generation",
 			"type": "object",
 			"properties": {
 				"do_sample": {
 					"type": "boolean",
-					"description": "Whether to use logit sampling (true) or greedy search (false)."
 				},
 				"max_new_tokens": {
 					"type": "integer",
-					"description": "Maximum number of generated tokens."
 				},
 				"repetition_penalty": {
 					"type": "number",
@@ -36,6 +48,10 @@
 					"type": "boolean",
 					"description": "Whether to prepend the prompt to the generated text."
 				},
 				"stop_sequences": {
 					"type": "array",
 					"items": {

 			"description": "Additional inference parameters for Text Generation",
 			"type": "object",
 			"properties": {
+				"best_of": {
+					"type": "integer",
+					"description": "The number of sampling queries to run. Only the best one (in terms of total logprob) will be returned."
+				},
+				"decoder_input_details": {
+					"type": "boolean",
+					"description": "Whether or not to output decoder input details"
+				},
+				"details": {
+					"type": "boolean",
+					"description": "Whether or not to output details"
+				},
 				"do_sample": {
 					"type": "boolean",
+					"description": "Whether to use logits sampling instead of greedy decoding when generating new tokens."
 				},
 				"max_new_tokens": {
 					"type": "integer",
+					"description": "The maximum number of tokens to generate."
 				},
 				"repetition_penalty": {
 					"type": "number",
 					"type": "boolean",
 					"description": "Whether to prepend the prompt to the generated text."
 				},
+				"seed": {
+					"type": "integer",
+					"description": "The random sampling seed."
+				},
 				"stop_sequences": {
 					"type": "array",
 					"items": {

packages/tasks/src/tasks/text-generation/spec/output.json CHANGED Viewed

@@ -8,7 +8,113 @@
 		"generated_text": {
 			"type": "string",
 			"description": "The generated text"
 		}
 	},
-	"required": ["generatedText"]
 }

 		"generated_text": {
 			"type": "string",
 			"description": "The generated text"
+		},
+		"details": {
+			"description": "When enabled, details about the generation",
+			"title": "TextGenerationOutputDetails",
+			"allOf": [
+				{ "$ref": "#/$defs/SequenceDetails" },
+				{
+					"type": "object",
+					"properties": {
+						"best_of_sequences": {
+							"type": "array",
+							"description": "Details about additional sequences when best_of is provided",
+							"items": {
+								"allOf": [
+									{ "$ref": "#/$defs/SequenceDetails" },
+									{
+										"type": "object",
+										"properties": {
+											"generated_text": {
+												"type": "integer",
+												"description": "The generated text"
+											}
+										},
+										"required": ["generated_text"]
+									}
+								]
+							}
+						}
+					}
+				}
+			]
 		}
 	},
+	"required": ["generated_text"],
+	"$defs": {
+		"Token": {
+			"type": "object",
+			"title": "Token",
+			"properties": {
+				"id": {
+					"type": "integer"
+				},
+				"logprob": {
+					"type": "number"
+				},
+				"special": {
+					"type": "boolean",
+					"description": "Whether or not that token is a special one"
+				},
+				"text": {
+					"type": "string",
+					"description": "The text associated with that token"
+				}
+			},
+			"required": ["id", "logprob", "special", "text"]
+		},
+		"SequenceDetails": {
+			"type": "object",
+			"title": "TextGenerationSequenceDetails",
+			"properties": {
+				"finish_reason": {
+					"type": "string",
+					"description": "The reason why the generation was stopped.",
+					"oneOf": [
+						{ "const": "length", "description": "The generated sequence reached the maximum allowed length" },
+						{ "const": "eos_token", "description": "The model generated an end-of-sentence (EOS) token" },
+						{ "const": "stop_sequence", "description": "One of the sequence in stop_sequences was generated" }
+					]
+				},
+				"generated_tokens": {
+					"type": "integer",
+					"description": "The number of generated tokens"
+				},
+				"prefill": {
+					"type": "array",
+					"items": {
+						"title": "PrefillToken",
+						"type": "object",
+						"properties": {
+							"id": {
+								"type": "integer"
+							},
+							"logprob": {
+								"type": "number"
+							},
+							"text": {
+								"type": "string",
+								"description": "The text associated with that token"
+							}
+						},
+						"required": ["id", "logprob", "text"]
+					}
+				},
+				"seed": {
+					"type": "integer",
+					"description": "The random seed used for generation"
+				},
+				"tokens": {
+					"type": "array",
+					"description": "The generated tokens and associated details",
+					"items": {
+						"$ref": "#/$defs/Token"
+					}
+				}
+			},
+			"required": ["finish_reason", "generated_tokens", "prefill", "tokens"]
+		}
+	}
 }