Skip to content

Commit 3349265

Browse files
committed
feat(): turn on webgpu for ocr and speech-recog
1 parent a896ab4 commit 3349265

File tree

2 files changed

+5
-2
lines changed

2 files changed

+5
-2
lines changed

src/services/ocr/ocr-worker.ts

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -42,7 +42,9 @@ async function loadOCR(model: string): Promise<void> {
42 42
if (!ocr) {
43 43
env.allowLocalModels = false;
44 44
env.useBrowserCache = false;
45-
ocr = await pipeline('image-to-text', model || 'Xenova/trocr-small-printed');
45+
ocr = await pipeline('image-to-text', model || 'Xenova/trocr-small-printed', {
46+
device: "webgpu"
47+
});
46 48
console.log("loaded ocr", ocr)
47 49
resolve();
48 50
}

src/services/speech-recognition/worker.ts

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,8 @@ export async function loadTranscriber(model: string = "Xenova/whisper-tiny", tim
37 37
transcriber = await pipeline('automatic-speech-recognition', model || 'Xenova/whisper-tiny', {
38 38
// @ts-ignore
39 39
return_timestamps: timestamps,
40-
language
40+
language,
41+
device: "webgpu"
41 42
});
42 43

43 44
resolve();

0 commit comments

Comments
 (0)