Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
import { InferenceOutputError } from "../../lib/InferenceOutputError"; | |
import type { BaseArgs, Options } from "../../types"; | |
import { request } from "../custom/request"; | |
import type { RequestArgs } from "../../types"; | |
import { base64FromBytes } from "../../../../shared"; | |
import { toArray } from "../../utils/toArray"; | |
export type DocumentQuestionAnsweringArgs = BaseArgs & { | |
inputs: { | |
/** | |
* Raw image | |
* | |
* You can use native `File` in browsers, or `new Blob([buffer])` in node, or for a base64 image `new Blob([btoa(base64String)])`, or even `await (await fetch('...)).blob()` | |
**/ | |
image: Blob | ArrayBuffer; | |
question: string; | |
}; | |
}; | |
export interface DocumentQuestionAnsweringOutput { | |
/** | |
* A string that’s the answer within the document. | |
*/ | |
answer: string; | |
/** | |
* ? | |
*/ | |
end?: number; | |
/** | |
* A float that represents how likely that the answer is correct | |
*/ | |
score?: number; | |
/** | |
* ? | |
*/ | |
start?: number; | |
} | |
/** | |
* Answers a question on a document image. Recommended model: impira/layoutlm-document-qa. | |
*/ | |
export async function documentQuestionAnswering( | |
args: DocumentQuestionAnsweringArgs, | |
options?: Options | |
): Promise<DocumentQuestionAnsweringOutput> { | |
const reqArgs: RequestArgs = { | |
...args, | |
inputs: { | |
question: args.inputs.question, | |
// convert Blob or ArrayBuffer to base64 | |
image: base64FromBytes( | |
new Uint8Array( | |
args.inputs.image instanceof ArrayBuffer ? args.inputs.image : await args.inputs.image.arrayBuffer() | |
) | |
), | |
}, | |
} as RequestArgs; | |
const res = toArray( | |
await request<[DocumentQuestionAnsweringOutput] | DocumentQuestionAnsweringOutput>(reqArgs, { | |
...options, | |
taskHint: "document-question-answering", | |
}) | |
)?.[0]; | |
const isValidOutput = | |
typeof res?.answer === "string" && | |
(typeof res.end === "number" || typeof res.end === "undefined") && | |
(typeof res.score === "number" || typeof res.score === "undefined") && | |
(typeof res.start === "number" || typeof res.start === "undefined"); | |
if (!isValidOutput) { | |
throw new InferenceOutputError("Expected Array<{answer: string, end?: number, score?: number, start?: number}>"); | |
} | |
return res; | |
} | |