joplin/packages/app-mobile/components/voiceTyping/VoiceTypingDialog.tsx

import * as React from 'react';
import { useState, useEffect, useCallback, useRef, useMemo } from 'react';
import { Icon, ActivityIndicator, Text, Surface, Button } from 'react-native-paper';
import { _, languageName } from '@joplin/lib/locale';
import useAsyncEffect, { AsyncEffectEvent } from '@joplin/lib/hooks/useAsyncEffect';
import { IconSource } from 'react-native-paper/lib/typescript/components/Icon';
import VoiceTyping, { OnTextCallback, VoiceTypingSession } from '../../services/voiceTyping/VoiceTyping';
import whisper from '../../services/voiceTyping/whisper';
import vosk from '../../services/voiceTyping/vosk';
import { AppState } from '../../utils/types';
import { connect } from 'react-redux';
import { View, StyleSheet } from 'react-native';
import AccessibleView from '../accessibility/AccessibleView';

// Props accepted by the voice typing dialog component.
interface Props {
	// Locale handed to the voice typing builder. Also used to name the
	// language in the "Downloading ... language files" message.
	locale: string;
	// Voice typing provider identifier, injected by the redux `connect` wrapper
	// from the 'voiceTyping.preferredProvider' setting. Values starting with
	// "whisper" select Whisper; anything else selects Vosk.
	provider: string;
	// Called when the user presses the "Done" button, right after the current
	// session (if any) has been asked to stop.
	onDismiss: ()=> void;
	// Receives the text passed to the session's `onFinalize` callback.
	onText: (text: string)=> void;
}

// Display states of the voice typing dialog. Each state maps to one status
// message and one icon in the dialog. Numeric values start at 1 and increase
// by one in declaration order.
enum RecorderState {
	// Initial state: no session, error or download is known yet.
	Loading = 1,
	// A session is available; the dialog starts it when this state is reached.
	Recording,
	// Has a message and an icon, but nothing in this file switches to it.
	Processing,
	// Preparing the session failed; the error message is shown.
	Error,
	// Model files for the current locale are being downloaded.
	Downloading,
}

// Options accepted by the `useWhisper` hook.
interface UseVoiceTypingProps {
	// Locale used to construct the VoiceTyping builder.
	locale: string;
	// Provider identifier: a value starting with "whisper" selects Whisper,
	// any other value (including an unset one) selects Vosk.
	provider: string;
	// Invoked with the text passed to the session's `onPreview` callback.
	onSetPreview: OnTextCallback;
	// Invoked with the text passed to the session's `onFinalize` callback.
	onText: OnTextCallback;
}

// Prepares a voice typing session for the given locale and provider.
//
// Despite its name, this hook handles both providers: Whisper is used when
// `provider` starts with "whisper", Vosk otherwise. Whenever the locale or
// provider changes, the previous session is stopped, the model is downloaded
// if necessary, and a new session is built.
//
// Returns a tuple of:
// - the error raised while preparing the session (null if none),
// - whether the model has to be downloaded (null until this has been checked,
//   false once preparation has finished),
// - the built session (null until the first build has completed).
//
// The returned session is NOT started by this hook; the caller is expected to
// call `start()` on it.
const useWhisper = ({ locale, provider, onSetPreview, onText }: UseVoiceTypingProps): [Error | null, boolean, VoiceTypingSession|null] => {
	const [voiceTyping, setVoiceTyping] = useState<VoiceTypingSession>(null);
	const [error, setError] = useState<Error>(null);
	const [mustDownloadModel, setMustDownloadModel] = useState<boolean | null>(null);

	// The callbacks are read through refs so that a new callback identity does
	// not force the session to be rebuilt.
	const onTextRef = useRef(onText);
	onTextRef.current = onText;
	const onSetPreviewRef = useRef(onSetPreview);
	onSetPreviewRef.current = onSetPreview;

	// Gives the effects below access to the latest session without listing it
	// as a dependency.
	const voiceTypingRef = useRef(voiceTyping);
	voiceTypingRef.current = voiceTyping;

	const builder = useMemo(() => {
		return new VoiceTyping(locale, provider?.startsWith('whisper') ? [whisper] : [vosk]);
	}, [locale, provider]);

	useAsyncEffect(async (event: AsyncEffectEvent) => {
		try {
			// Stop the session built for the previous locale/provider, if any.
			await voiceTypingRef.current?.stop();

			const isDownloaded = await builder.isDownloaded();
			if (event.cancelled) return;

			// Publish the download state before the (potentially long) download
			// starts so that the UI can reflect it.
			setMustDownloadModel(!isDownloaded);
			if (!isDownloaded) {
				await builder.download();
				if (event.cancelled) return;
			}

			const session = await builder.build({
				onPreview: (text) => onSetPreviewRef.current(text),
				onFinalize: (text) => onTextRef.current(text),
			});
			if (event.cancelled) {
				// Nothing else holds a reference to this session: stop it here,
				// otherwise it would never be released.
				void session.stop();
				return;
			}
			setVoiceTyping(session);
		} catch (error) {
			// A cancelled run must not report errors on behalf of the run that
			// replaced it (or after the component has been unmounted).
			if (!event.cancelled) {
				// Normalize non-Error throwables so that `.message` is always available.
				setError(error instanceof Error ? error : new Error(String(error)));
			}
		} finally {
			// Only the current run may clear the flag: a cancelled run could
			// otherwise hide a download started by the run that replaced it.
			if (!event.cancelled) {
				setMustDownloadModel(false);
			}
		}
	}, [builder]);

	// Stop the latest session when the component using this hook is unmounted.
	useEffect(() => () => {
		void voiceTypingRef.current?.stop();
	}, []);

	return [error, mustDownloadModel, voiceTyping];
};

// Static layout styles for the voice typing dialog.
const styles = StyleSheet.create({
	// Outer wrapper: full width up to 680, horizontally centered.
	container: {
		alignSelf: 'center',
		width: '100%',
		maxWidth: 680,
		marginHorizontal: 1,
	},
	// Lays out the icon and the text column side by side.
	contentWrapper: { flexDirection: 'row' },
	// Status icon on the left of the text.
	iconWrapper: {
		margin: 8,
		marginTop: 16,
	},
	// Column holding the heading, status message and preview text.
	content: {
		marginHorizontal: 8,
		marginTop: 16,
	},
	// Button row, aligned to the end of the dialog.
	actionContainer: {
		justifyContent: 'flex-end',
		flexDirection: 'row',
	},
});

// Dialog shown while voice typing is active.
//
// It prepares a voice typing session through `useWhisper`, starts it once it is
// available, and displays the current status (loading, downloading, recording
// or error) along with a preview of the text being recognised. Finalized text
// is delivered through `props.onText`; pressing "Done" stops the session and
// calls `props.onDismiss`.
const VoiceTypingDialog: React.FC<Props> = props => {
	const [recorderState, setRecorderState] = useState<RecorderState>(RecorderState.Loading);
	const [preview, setPreview] = useState<string>('');
	const [modelError, mustDownloadModel, voiceTyping] = useWhisper({
		locale: props.locale,
		onSetPreview: setPreview,
		onText: props.onText,
		provider: props.provider,
	});

	// An error takes precedence over an available session.
	useEffect(() => {
		if (modelError) {
			setRecorderState(RecorderState.Error);
		} else if (voiceTyping) {
			setRecorderState(RecorderState.Recording);
		}
	}, [voiceTyping, modelError]);

	useEffect(() => {
		if (mustDownloadModel) {
			setRecorderState(RecorderState.Downloading);
		}
	}, [mustDownloadModel]);

	// Start the session when the recording state is reached or the session
	// changes. `props.onText` is intentionally not a dependency: the hook reads
	// the callbacks through refs, so a new callback identity must not trigger
	// another `start()` on a session that is already running.
	useEffect(() => {
		if (recorderState === RecorderState.Recording) {
			void voiceTyping?.start();
		}
	}, [recorderState, voiceTyping]);

	const onDismiss = useCallback(() => {
		void voiceTyping?.stop();
		props.onDismiss();
	}, [voiceTyping, props.onDismiss]);

	// Returns the status message for the current state.
	const renderContent = () => {
		const components: Record<RecorderState, ()=> string> = {
			[RecorderState.Loading]: () => _('Loading...'),
			[RecorderState.Recording]: () => _('Please record your voice...'),
			[RecorderState.Processing]: () => _('Converting speech to text...'),
			[RecorderState.Downloading]: () => _('Downloading %s language files...', languageName(props.locale)),
			// Fall back to the stringified value in case the error carries no message.
			[RecorderState.Error]: () => _('Error: %s', modelError?.message ?? `${modelError}`),
		};

		return components[recorderState]();
	};

	// Returns the icon source for the current state.
	const renderIcon = () => {
		// Shared by the states in which the dialog is waiting for something.
		const spinner = ({ size }: { size: number }) => <ActivityIndicator animating={true} style={{ width: size, height: size }} />;

		const components: Record<RecorderState, IconSource> = {
			[RecorderState.Loading]: spinner,
			[RecorderState.Recording]: 'microphone',
			[RecorderState.Processing]: 'microphone',
			[RecorderState.Downloading]: spinner,
			[RecorderState.Error]: 'alert-circle-outline',
		};

		return components[recorderState];
	};

	// Renders the preview text received through the session's preview callback.
	const renderPreview = () => {
		return <Text variant='labelSmall'>{preview}</Text>;
	};

	return (
		<Surface>
			<View style={styles.container}>
				<View style={styles.contentWrapper}>
					<View style={styles.iconWrapper}>
						<Icon source={renderIcon()} size={40}/>
					</View>
					<View style={styles.content}>
						<AccessibleView
							// Auto-focus
							refocusCounter={1}
							aria-live='polite'
							role='heading'
						>
							<Text variant='bodyMedium'>
								{_('Voice typing...')}
							</Text>
						</AccessibleView>
						<Text
							variant='bodyMedium'
							// role="status" might fit better here. However, react-native
							// doesn't seem to support it.
							role='alert'
							// Although on web, role=alert should imply aria-live=polite,
							// this does not seem to be the case for React Native:
							accessibilityLiveRegion='polite'
						>{renderContent()}</Text>
						{renderPreview()}
					</View>
				</View>
				<View style={styles.actionContainer}>
					<Button
						onPress={onDismiss}
						accessibilityHint={_('Ends voice typing')}
					>{_('Done')}</Button>
				</View>
			</View>
		</Surface>
	);
};

// Maps the preferred voice typing provider from the application settings to
// the dialog's `provider` prop.
const mapStateToProps = (state: AppState) => {
	return { provider: state.settings['voiceTyping.preferredProvider'] };
};

export default connect(mapStateToProps)(VoiceTypingDialog);
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`import * as React from 'react';`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`import { useState, useEffect, useCallback, useRef, useMemo } from 'react';`
Android: Accessibility: Improve voice typing dialog screen reader accessibility (#11428) 2024-11-22 12:47:46 +02:00			`import { Icon, ActivityIndicator, Text, Surface, Button } from 'react-native-paper';`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`import { _, languageName } from '@joplin/lib/locale';`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`import useAsyncEffect, { AsyncEffectEvent } from '@joplin/lib/hooks/useAsyncEffect';`
Update dependency react-native-paper to v5.10.1 (#8908) Co-authored-by: renovate[bot] <29139614+renovate[bot]@users.noreply.github.com> Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2023-09-19 12:59:30 +02:00			`import { IconSource } from 'react-native-paper/lib/typescript/components/Icon';`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`import VoiceTyping, { OnTextCallback, VoiceTypingSession } from '../../services/voiceTyping/VoiceTyping';`
			`import whisper from '../../services/voiceTyping/whisper';`
			`import vosk from '../../services/voiceTyping/vosk';`
			`import { AppState } from '../../utils/types';`
			`import { connect } from 'react-redux';`
Android: Accessibility: Improve voice typing dialog screen reader accessibility (#11428) 2024-11-22 12:47:46 +02:00			`import { View, StyleSheet } from 'react-native';`
			`import AccessibleView from '../accessibility/AccessibleView';`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
			`interface Props {`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`locale: string;`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`provider: string;`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`onDismiss: ()=> void;`
			`onText: (text: string)=> void;`
			`}`

			`enum RecorderState {`
			`Loading = 1,`
			`Recording = 2,`
			`Processing = 3,`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`Error = 4,`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`Downloading = 5,`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`}`

Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`interface UseVoiceTypingProps {`
			`locale: string;`
			`provider: string;`
			`onSetPreview: OnTextCallback;`
			`onText: OnTextCallback;`
			`}`

			`const useWhisper = ({ locale, provider, onSetPreview, onText }: UseVoiceTypingProps): [Error \| null, boolean, VoiceTypingSession\|null] => {`
			`const [voiceTyping, setVoiceTyping] = useState<VoiceTypingSession>(null);`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`const [error, setError] = useState<Error>(null);`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`const [mustDownloadModel, setMustDownloadModel] = useState<boolean \| null>(null);`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`const onTextRef = useRef(onText);`
			`onTextRef.current = onText;`
			`const onSetPreviewRef = useRef(onSetPreview);`
			`onSetPreviewRef.current = onSetPreview;`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`const voiceTypingRef = useRef(voiceTyping);`
			`voiceTypingRef.current = voiceTyping;`

			`const builder = useMemo(() => {`
			`return new VoiceTyping(locale, provider?.startsWith('whisper') ? [whisper] : [vosk]);`
			`}, [locale, provider]);`

			`useAsyncEffect(async (event: AsyncEffectEvent) => {`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`try {`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`await voiceTypingRef.current?.stop();`

			`if (!await builder.isDownloaded()) {`
			`if (event.cancelled) return;`
			`await builder.download();`
			`}`
			`if (event.cancelled) return;`

			`const voiceTyping = await builder.build({`
			`onPreview: (text) => onSetPreviewRef.current(text),`
			`onFinalize: (text) => onTextRef.current(text),`
			`});`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`if (event.cancelled) return;`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`setVoiceTyping(voiceTyping);`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`} catch (error) {`
			`setError(error);`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`} finally {`
			`setMustDownloadModel(false);`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`}`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`}, [builder]);`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00
			`useAsyncEffect(async (_event: AsyncEffectEvent) => {`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`setMustDownloadModel(!(await builder.isDownloaded()));`
			`}, [builder]);`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
Android: Close voice typing session when closing the editor (#11466) 2024-12-09 17:56:25 +02:00			`useEffect(() => () => {`
			`void voiceTypingRef.current?.stop();`
			`}, []);`

Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`return [error, mustDownloadModel, voiceTyping];`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`};`

Android: Accessibility: Improve voice typing dialog screen reader accessibility (#11428) 2024-11-22 12:47:46 +02:00			`const styles = StyleSheet.create({`
			`container: {`
			`marginHorizontal: 1,`
			`width: '100%',`
			`maxWidth: 680,`
			`alignSelf: 'center',`
			`},`
			`contentWrapper: {`
			`flexDirection: 'row',`
			`},`
			`iconWrapper: {`
			`margin: 8,`
			`marginTop: 16,`
			`},`
			`content: {`
			`marginTop: 16,`
			`marginHorizontal: 8,`
			`},`
			`actionContainer: {`
			`flexDirection: 'row',`
			`justifyContent: 'flex-end',`
			`},`
			`});`

Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`const VoiceTypingDialog: React.FC<Props> = props => {`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`const [recorderState, setRecorderState] = useState<RecorderState>(RecorderState.Loading);`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`const [preview, setPreview] = useState<string>('');`
			`const [modelError, mustDownloadModel, voiceTyping] = useWhisper({`
			`locale: props.locale,`
			`onSetPreview: setPreview,`
			`onText: props.onText,`
			`provider: props.provider,`
			`});`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
			`useEffect(() => {`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`if (modelError) {`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`setRecorderState(RecorderState.Error);`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`} else if (voiceTyping) {`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`setRecorderState(RecorderState.Recording);`
			`}`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`}, [voiceTyping, modelError]);`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`useEffect(() => {`
			`if (mustDownloadModel) {`
			`setRecorderState(RecorderState.Downloading);`
			`}`
			`}, [mustDownloadModel]);`

Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`useEffect(() => {`
			`if (recorderState === RecorderState.Recording) {`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`void voiceTyping.start();`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`}`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`}, [recorderState, voiceTyping, props.onText]);`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
			`const onDismiss = useCallback(() => {`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`void voiceTyping?.stop();`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`props.onDismiss();`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`}, [voiceTyping, props.onDismiss]);`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00
			`const renderContent = () => {`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`const components: Record<RecorderState, ()=> string> = {`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`[RecorderState.Loading]: () => _('Loading...'),`
			`[RecorderState.Recording]: () => _('Please record your voice...'),`
			`[RecorderState.Processing]: () => _('Converting speech to text...'),`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`[RecorderState.Downloading]: () => _('Downloading %s language files...', languageName(props.locale)),`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`[RecorderState.Error]: () => _('Error: %s', modelError.message),`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`};`

Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`return components[recorderState]();`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`};`

Mobile: Write to note in realtime using voice typing 2023-06-02 16:44:00 +02:00			`const renderIcon = () => {`
			`const components: Record<RecorderState, IconSource> = {`
			`[RecorderState.Loading]: ({ size }: { size: number }) => <ActivityIndicator animating={true} style={{ width: size, height: size }} />,`
			`[RecorderState.Recording]: 'microphone',`
			`[RecorderState.Processing]: 'microphone',`
Android: Add support for Voice Typing for most languages (#8309) 2023-06-13 19:06:54 +02:00			`[RecorderState.Downloading]: ({ size }: { size: number }) => <ActivityIndicator animating={true} style={{ width: size, height: size }} />,`
Mobile: Improved Vosk error handling 2023-06-11 17:13:36 +02:00			`[RecorderState.Error]: 'alert-circle-outline',`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`};`

			`return components[recorderState];`
			`};`

Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00			`const renderPreview = () => {`
			`return <Text variant='labelSmall'>{preview}</Text>;`
			`};`

Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`return (`
Android: Accessibility: Improve voice typing dialog screen reader accessibility (#11428) 2024-11-22 12:47:46 +02:00			`<Surface>`
			`<View style={styles.container}>`
			`<View style={styles.contentWrapper}>`
			`<View style={styles.iconWrapper}>`
			`<Icon source={renderIcon()} size={40}/>`
			`</View>`
			`<View style={styles.content}>`
			`<AccessibleView`
			`// Auto-focus`
			`refocusCounter={1}`
			`aria-live='polite'`
			`role='heading'`
			`>`
			`<Text variant='bodyMedium'>`
			`{_('Voice typing...')}`
			`</Text>`
			`</AccessibleView>`
			`<Text`
			`variant='bodyMedium'`
			`// role="status" might fit better here. However, react-native`
			`// doesn't seem to support it.`
			`role='alert'`
			`// Although on web, role=alert should imply aria-live=polite,`
			`// this does not seem to be the case for React Native:`
			`accessibilityLiveRegion='polite'`
			`>{renderContent()}</Text>`
			`{renderPreview()}`
			`</View>`
			`</View>`
			`<View style={styles.actionContainer}>`
			`<Button`
			`onPress={onDismiss}`
			`accessibilityHint={_('Ends voice typing')}`
			`>{_('Done')}</Button>`
			`</View>`
			`</View>`
			`</Surface>`
Mobile: Improved Vosk support (beta, fr only) (#8131) 2023-05-07 13:05:41 +02:00			`);`
			`};`
Android: Allow switching the voice typing library to Whisper (#11158) Co-authored-by: Laurent Cozic <laurent22@users.noreply.github.com> 2024-10-26 22:00:56 +02:00
			`export default connect((state: AppState) => ({`
			`provider: state.settings['voiceTyping.preferredProvider'],`
			`}))(VoiceTypingDialog);`