2023-05-07 12:05:41 +01:00
|
|
|
import * as React from 'react';
|
2024-10-26 13:00:56 -07:00
|
|
|
import { useState, useEffect, useCallback, useRef, useMemo } from 'react';
|
|
|
|
import { Banner, ActivityIndicator, Text } from 'react-native-paper';
|
2023-06-13 18:06:54 +01:00
|
|
|
import { _, languageName } from '@joplin/lib/locale';
|
2023-05-07 12:05:41 +01:00
|
|
|
import useAsyncEffect, { AsyncEffectEvent } from '@joplin/lib/hooks/useAsyncEffect';
|
2023-09-19 11:59:30 +01:00
|
|
|
import { IconSource } from 'react-native-paper/lib/typescript/components/Icon';
|
2024-10-26 13:00:56 -07:00
|
|
|
import VoiceTyping, { OnTextCallback, VoiceTypingSession } from '../../services/voiceTyping/VoiceTyping';
|
|
|
|
import whisper from '../../services/voiceTyping/whisper';
|
|
|
|
import vosk from '../../services/voiceTyping/vosk';
|
|
|
|
import { AppState } from '../../utils/types';
|
|
|
|
import { connect } from 'react-redux';
|
2023-05-07 12:05:41 +01:00
|
|
|
|
|
|
|
// Props accepted by the voice typing dialog component.
interface Props {
	// Locale forwarded to the voice typing provider; also used to name the
	// language in the "Downloading ... language files" status message.
	locale: string;
	// Identifier of the preferred voice typing provider.
	provider: string;
	// Invoked when the user presses the "Done" action.
	onDismiss: ()=> void;
	// Receives text that the voice typing session has finalized.
	onText: (text: string)=> void;
}
|
|
|
|
|
|
|
|
// State of the voice typing dialog. Each member selects both the status
// message and the icon that the dialog renders.
enum RecorderState {
	// Initial state, before a session is available.
	Loading = 1,
	// A session exists and is (being) started.
	Recording = 2,
	// Shown as "Converting speech to text...".
	Processing = 3,
	// Setting up the session failed; the error message is displayed.
	Error = 4,
	// The provider's model is not downloaded yet.
	Downloading = 5,
}
|
|
|
|
|
2024-10-26 13:00:56 -07:00
|
|
|
// Options accepted by the `useWhisper` hook.
interface UseVoiceTypingProps {
	// Locale passed to the `VoiceTyping` builder.
	locale: string;
	// Provider identifier; a value starting with "whisper" selects the Whisper
	// provider, anything else selects Vosk.
	provider: string;
	// Called with the session's preview text.
	onSetPreview: OnTextCallback;
	// Called with the session's finalized text.
	onText: OnTextCallback;
}
|
|
|
|
|
|
|
|
// Creates a voice typing session for the given locale and provider,
// downloading the provider's model first when `builder.isDownloaded()` reports
// that it is missing.
//
// Returns the tuple `[error, mustDownloadModel, session]`:
// - `error`: the value caught while stopping the previous session, downloading
//   the model, or building the session. `null` until something fails.
// - `mustDownloadModel`: `null` until the download check resolves, `true` when
//   the model is not downloaded, and `false` once the setup run has finished.
// - `session`: the built session, or `null` while none is available.
//
// Results of runs that were cancelled (`event.cancelled`) are discarded so that
// a stale run cannot overwrite state belonging to a newer builder.
const useWhisper = ({ locale, provider, onSetPreview, onText }: UseVoiceTypingProps): [Error | null, boolean, VoiceTypingSession|null] => {
	const [voiceTyping, setVoiceTyping] = useState<VoiceTypingSession|null>(null);
	const [error, setError] = useState<Error|null>(null);
	const [mustDownloadModel, setMustDownloadModel] = useState<boolean | null>(null);

	// Keep the latest callbacks in refs so that the session does not need to
	// be rebuilt when the callbacks change identity.
	const onTextRef = useRef(onText);
	onTextRef.current = onText;
	const onSetPreviewRef = useRef(onSetPreview);
	onSetPreviewRef.current = onSetPreview;

	// Lets the setup effect below reach the current session without listing it
	// as a dependency.
	const voiceTypingRef = useRef(voiceTyping);
	voiceTypingRef.current = voiceTyping;

	const builder = useMemo(() => {
		return new VoiceTyping(locale, provider?.startsWith('whisper') ? [whisper] : [vosk]);
	}, [locale, provider]);

	useAsyncEffect(async (event: AsyncEffectEvent) => {
		try {
			// Stop the session created for a previous builder, if any.
			await voiceTypingRef.current?.stop();

			if (!await builder.isDownloaded()) {
				if (event.cancelled) return;
				await builder.download();
			}
			if (event.cancelled) return;

			const session = await builder.build({
				onPreview: (text) => onSetPreviewRef.current(text),
				onFinalize: (text) => onTextRef.current(text),
			});
			if (event.cancelled) return;
			setVoiceTyping(session);
		} catch (setupError) {
			// A failure in a cancelled run belongs to an outdated builder and
			// must not be reported as the current error.
			if (event.cancelled) return;
			setError(setupError);
		} finally {
			// Runs after the early returns above as well, so it needs its own
			// cancellation check.
			if (!event.cancelled) {
				setMustDownloadModel(false);
			}
		}
	}, [builder]);

	useAsyncEffect(async (event: AsyncEffectEvent) => {
		const downloaded = await builder.isDownloaded();
		if (event.cancelled) return;
		setMustDownloadModel(!downloaded);
	}, [builder]);

	return [error, mustDownloadModel, voiceTyping];
};
|
|
|
|
|
2024-10-26 13:00:56 -07:00
|
|
|
// Banner that drives a voice typing session: it shows the current status
// (loading, downloading, recording, error), a preview of the recognised text,
// and a "Done" action that stops the session and dismisses the dialog.
const VoiceTypingDialog: React.FC<Props> = props => {
	const [recorderState, setRecorderState] = useState<RecorderState>(RecorderState.Loading);
	const [preview, setPreview] = useState<string>('');
	const [modelError, mustDownloadModel, voiceTyping] = useWhisper({
		locale: props.locale,
		onSetPreview: setPreview,
		onText: props.onText,
		provider: props.provider,
	});

	// An error takes precedence over an available session.
	useEffect(() => {
		if (modelError) {
			setRecorderState(RecorderState.Error);
		} else if (voiceTyping) {
			setRecorderState(RecorderState.Recording);
		}
	}, [voiceTyping, modelError]);

	useEffect(() => {
		if (mustDownloadModel) {
			setRecorderState(RecorderState.Downloading);
		}
	}, [mustDownloadModel]);

	// Start the session once the dialog enters the Recording state, and again
	// when the session itself is replaced. `props.onText` is deliberately not a
	// dependency: the effect does not read it, and listing it would call
	// `start()` again each time the parent passes a new callback identity.
	useEffect(() => {
		if (recorderState === RecorderState.Recording) {
			void voiceTyping?.start();
		}
	}, [recorderState, voiceTyping]);

	// NOTE(review): the session is only stopped here, via the "Done" action.
	// Confirm whether unmounting without pressing it should also stop it.
	const onDismiss = useCallback(() => {
		void voiceTyping?.stop();
		props.onDismiss();
	}, [voiceTyping, props.onDismiss]);

	// Status message for the current state.
	const renderContent = () => {
		const components: Record<RecorderState, ()=> string> = {
			[RecorderState.Loading]: () => _('Loading...'),
			[RecorderState.Recording]: () => _('Please record your voice...'),
			[RecorderState.Processing]: () => _('Converting speech to text...'),
			[RecorderState.Downloading]: () => _('Downloading %s language files...', languageName(props.locale)),
			[RecorderState.Error]: () => _('Error: %s', modelError.message),
		};

		return components[recorderState]();
	};

	// Icon for the current state: a spinner while loading or downloading,
	// otherwise a named icon.
	const renderIcon = () => {
		const components: Record<RecorderState, IconSource> = {
			[RecorderState.Loading]: ({ size }: { size: number }) => <ActivityIndicator animating={true} style={{ width: size, height: size }} />,
			[RecorderState.Recording]: 'microphone',
			[RecorderState.Processing]: 'microphone',
			[RecorderState.Downloading]: ({ size }: { size: number }) => <ActivityIndicator animating={true} style={{ width: size, height: size }} />,
			[RecorderState.Error]: 'alert-circle-outline',
		};

		return components[recorderState];
	};

	const renderPreview = () => {
		return <Text variant='labelSmall'>{preview}</Text>;
	};

	const headerAndStatus = <Text variant='bodyMedium'>{`${_('Voice typing...')}\n${renderContent()}`}</Text>;

	return (
		<Banner
			visible={true}
			icon={renderIcon()}
			actions={[
				{
					label: _('Done'),
					onPress: onDismiss,
				},
			]}
		>
			{headerAndStatus}
			<Text>{'\n'}</Text>
			{renderPreview()}
		</Banner>
	);
};
|
2024-10-26 13:00:56 -07:00
|
|
|
|
|
|
|
// Connects the dialog to the Redux store so that `provider` is read from the
// 'voiceTyping.preferredProvider' setting.
export default connect((state: AppState) => ({
	provider: state.settings['voiceTyping.preferredProvider'],
}))(VoiceTypingDialog);
|