-
Notifications
You must be signed in to change notification settings - Fork 69
Expand file tree
/
Copy pathuseTokenizer.ts
More file actions
61 lines (55 loc) · 1.84 KB
/
useTokenizer.ts
File metadata and controls
61 lines (55 loc) · 1.84 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
import { useEffect, useState } from 'react';
import { TokenizerModule } from '../../modules/natural_language_processing/TokenizerModule';
import { ResourceSource } from '../../types/common';
import { ETError, getError } from '../../Error';
/**
 * React hook that loads a tokenizer through `TokenizerModule` and exposes its
 * operations together with loading / progress state.
 *
 * @param tokenizerSource - Resource handed to `TokenizerModule.load`. Changing
 *   it re-runs the load effect.
 * @param preventLoad - When `true`, the effect does not start a load.
 *   Defaults to `false`.
 * @returns An object with:
 *   - `error`: message of the last load failure, or `null`;
 *   - `isReady`: `true` once the most recent load has completed;
 *   - `isGenerating`: `true` while a wrapped call is in flight;
 *   - `downloadProgress`: last value reported via `TokenizerModule.onDownloadProgress`;
 *   - `decode`, `encode`, `getVocabSize`, `idToToken`, `tokenToId`: guarded
 *     wrappers around the matching `TokenizerModule` methods. Each one rejects
 *     with `ETError.ModuleNotLoaded` while not ready and with
 *     `ETError.ModelGenerating` while another wrapped call is running.
 */
export const useTokenizer = ({
  tokenizerSource,
  preventLoad = false,
}: {
  tokenizerSource: ResourceSource;
  preventLoad?: boolean;
}) => {
  const [error, setError] = useState<null | string>(null);
  const [isReady, setIsReady] = useState(false);
  const [isGenerating, setIsGenerating] = useState(false);
  const [downloadProgress, setDownloadProgress] = useState(0);

  useEffect(() => {
    // Flipped by the cleanup below so that a load started for a previous
    // `tokenizerSource` (or before unmount) cannot overwrite newer state.
    let cancelled = false;

    const loadModule = async () => {
      try {
        // Drop any error left over from an earlier attempt.
        setError(null);
        setIsReady(false);
        TokenizerModule.onDownloadProgress(setDownloadProgress);
        await TokenizerModule.load(tokenizerSource);
        if (!cancelled) {
          setIsReady(true);
        }
      } catch (err) {
        if (!cancelled) {
          // Thrown values are not guaranteed to be Error instances.
          setError(err instanceof Error ? err.message : String(err));
        }
      }
    };

    if (!preventLoad) {
      void loadModule();
    }

    return () => {
      cancelled = true;
    };
  }, [tokenizerSource, preventLoad]);

  /**
   * Wraps a `TokenizerModule` method so that it is only invoked when the
   * module is loaded and no other wrapped call is running, and so that
   * `isGenerating` is toggled around the call.
   *
   * The guards read the `isReady` / `isGenerating` values captured by the
   * render that created the wrapper.
   */
  const stateWrapper = <T extends (...args: any[]) => Promise<any>>(fn: T) => {
    const boundFn = fn.bind(TokenizerModule);

    return async (...args: Parameters<T>): Promise<ReturnType<T>> => {
      if (!isReady) throw new Error(getError(ETError.ModuleNotLoaded));
      if (isGenerating) throw new Error(getError(ETError.ModelGenerating));
      setIsGenerating(true);
      try {
        return await boundFn(...args);
      } finally {
        // Always release the busy flag, even when the call rejects.
        setIsGenerating(false);
      }
    };
  };

  return {
    error,
    isReady,
    isGenerating,
    downloadProgress,
    decode: stateWrapper(TokenizerModule.decode),
    encode: stateWrapper(TokenizerModule.encode),
    getVocabSize: stateWrapper(TokenizerModule.getVocabSize),
    idToToken: stateWrapper(TokenizerModule.idToToken),
    tokenToId: stateWrapper(TokenizerModule.tokenToId),
  };
};