whisper added
This commit is contained in:
		| @@ -11,8 +11,8 @@ import { selectTemperature } from '../store/parameters'; | |||||||
| import { openSystemPromptPanel, openTemperaturePanel } from '../store/settings-ui'; | import { openSystemPromptPanel, openTemperaturePanel } from '../store/settings-ui'; | ||||||
| import { speechRecognition } from '../speech-recognition-types.d' | import { speechRecognition } from '../speech-recognition-types.d' | ||||||
| import MicRecorder from 'mic-recorder-to-mp3'; | import MicRecorder from 'mic-recorder-to-mp3'; | ||||||
| import { selectUseOpenAIWhisper } from '../store/api-keys'; | import { selectUseOpenAIWhisper, selectOpenAIApiKey } from '../store/api-keys'; | ||||||
|  | import { Mp3Encoder } from 'lamejs'; | ||||||
|  |  | ||||||
| const Container = styled.div` | const Container = styled.div` | ||||||
|     background: #292933; |     background: #292933; | ||||||
| @@ -38,13 +38,53 @@ export interface MessageInputProps { | |||||||
|     disabled?: boolean; |     disabled?: boolean; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
|  |  | ||||||
|  | async function chunkAndEncodeMP3File(file: Blob): Promise<Array<File>> { | ||||||
|  |     const MAX_CHUNK_SIZE = 25 * 1024 * 1024; // 25 MB | ||||||
|  |     const audioContext = new AudioContext(); | ||||||
|  |     const audioBuffer = await audioContext.decodeAudioData(await file.arrayBuffer()); | ||||||
|  |     const duration = audioBuffer.duration; | ||||||
|  |     const sampleRate = audioBuffer.sampleRate; | ||||||
|  |     const numChannels = audioBuffer.numberOfChannels; | ||||||
|  |     const bytesPerSample = 2; // 16-bit audio | ||||||
|  |     const samplesPerChunk = Math.floor((MAX_CHUNK_SIZE / bytesPerSample) / numChannels); | ||||||
|  |     const totalSamples = Math.floor(duration * sampleRate); | ||||||
|  |     const numChunks = Math.ceil(totalSamples / samplesPerChunk); | ||||||
|  |  | ||||||
|  |     const chunks: Array<File> = []; | ||||||
|  |     for (let i = 0; i < numChunks; i++) { | ||||||
|  |         const startSample = i * samplesPerChunk; | ||||||
|  |         const endSample = Math.min(startSample + samplesPerChunk, totalSamples); | ||||||
|  |         const chunkDuration = (endSample - startSample) / sampleRate; | ||||||
|  |         const chunkBuffer = audioContext.createBuffer(numChannels, endSample - startSample, sampleRate); | ||||||
|  |         for (let c = 0; c < numChannels; c++) { | ||||||
|  |             const channelData = audioBuffer.getChannelData(c).subarray(startSample, endSample); | ||||||
|  |             chunkBuffer.copyToChannel(channelData, c); | ||||||
|  |         } | ||||||
|  |         const chunkBlob = await new Promise<Blob>((resolve) => { | ||||||
|  |             const encoder = new Mp3Encoder(numChannels, sampleRate, 128); | ||||||
|  |             const leftData = chunkBuffer.getChannelData(0); | ||||||
|  |             const rightData = numChannels === 1 ? leftData : chunkBuffer.getChannelData(1); | ||||||
|  |             const mp3Data = encoder.encodeBuffer(leftData, rightData); | ||||||
|  |             const blob = new Blob([mp3Data], { type: 'audio/mp3' }); | ||||||
|  |             resolve(blob); | ||||||
|  |         }); | ||||||
|  |         chunks.push(new File([chunkBlob], `text-${i}.mp3`, { type: 'audio/mp3' })); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     return chunks; | ||||||
|  | } | ||||||
|  |  | ||||||
|  |  | ||||||
| export default function MessageInput(props: MessageInputProps) { | export default function MessageInput(props: MessageInputProps) { | ||||||
|     const temperature = useAppSelector(selectTemperature); |     const temperature = useAppSelector(selectTemperature); | ||||||
|     const message = useAppSelector(selectMessage); |     const message = useAppSelector(selectMessage); | ||||||
|     const [recording, setRecording] = useState(false); |     const [recording, setRecording] = useState(false); | ||||||
|     const hasVerticalSpace = useMediaQuery('(min-height: 1000px)'); |     const hasVerticalSpace = useMediaQuery('(min-height: 1000px)'); | ||||||
|     const recorder = new MicRecorder({ bitRate: 128 }) |     const recorder = useMemo(() => new MicRecorder({ bitRate: 128 }), []); | ||||||
|     const useOpenAIWhisper = useAppSelector(selectUseOpenAIWhisper); |     const useOpenAIWhisper = useAppSelector(selectUseOpenAIWhisper); | ||||||
|  |     const openAIApiKey = useAppSelector(selectOpenAIApiKey); | ||||||
|  |  | ||||||
|     const context = useAppContext(); |     const context = useAppContext(); | ||||||
|     const dispatch = useAppDispatch(); |     const dispatch = useAppDispatch(); | ||||||
| @@ -65,14 +105,14 @@ export default function MessageInput(props: MessageInputProps) { | |||||||
|     }, [context, message, dispatch]); |     }, [context, message, dispatch]); | ||||||
|  |  | ||||||
|     const onSpeechStart = () => { |     const onSpeechStart = () => { | ||||||
|  |  | ||||||
|         if (!recording) { |         if (!recording) { | ||||||
|             setRecording(true); |             setRecording(true); | ||||||
|  |  | ||||||
|             // if we are using whisper, the we will just record with the browser and send the api when done  |             // if we are using whisper, the we will just record with the browser and send the api when done  | ||||||
|             if (useOpenAIWhisper) { |             if (useOpenAIWhisper) { | ||||||
|  |                 recorder.start().catch((e: any) => console.error(e)); | ||||||
|             } else { |             } else { | ||||||
|  |  | ||||||
|                 speechRecognition.continuous = true; |                 speechRecognition.continuous = true; | ||||||
|                 speechRecognition.interimResults = true; |                 speechRecognition.interimResults = true; | ||||||
|  |  | ||||||
| @@ -86,7 +126,36 @@ export default function MessageInput(props: MessageInputProps) { | |||||||
|         } else { |         } else { | ||||||
|             setRecording(false); |             setRecording(false); | ||||||
|             if (useOpenAIWhisper) { |             if (useOpenAIWhisper) { | ||||||
|  |                 const mp3 = recorder.stop().getMp3(); | ||||||
|  |  | ||||||
|  |                 mp3.then(async ([buffer, blob]) => { | ||||||
|  |  | ||||||
|  |                     const file = new File(buffer, 'chat.mp3', { | ||||||
|  |                         type: blob.type, | ||||||
|  |                         lastModified: Date.now() | ||||||
|  |                     }); | ||||||
|  |  | ||||||
|  |                     // TODO: cut in chunks | ||||||
|  |  | ||||||
|  |                     var data = new FormData() | ||||||
|  |                     data.append('file', file); | ||||||
|  |                     data.append('model', 'whisper-1') | ||||||
|  |  | ||||||
|  |                     const response = await fetch("https://api.openai.com/v1/audio/transcriptions", { | ||||||
|  |                         method: "POST", | ||||||
|  |                         headers: { | ||||||
|  |                             'Authorization': `Bearer ${openAIApiKey}`, | ||||||
|  |                         }, | ||||||
|  |                         body: data, | ||||||
|  |                     }); | ||||||
|  |  | ||||||
|  |                     const json = await response.json() | ||||||
|  |  | ||||||
|  |                     if (json.text) { | ||||||
|  |                         dispatch(setMessage(json.text)); | ||||||
|  |                     } | ||||||
|  |  | ||||||
|  |                 }).catch((e: any) => console.error(e)); | ||||||
|             } else { |             } else { | ||||||
|                 speechRecognition.stop(); |                 speechRecognition.stop(); | ||||||
|  |  | ||||||
|   | |||||||
| @@ -244,7 +244,7 @@ export default function MessageComponent(props: { message: Message, last: boolea | |||||||
|                                 <Button variant="subtle" size="sm" compact onClick={copy} style={{ marginLeft: '1rem' }}> |                                 <Button variant="subtle" size="sm" compact onClick={copy} style={{ marginLeft: '1rem' }}> | ||||||
|                                     <i className="fa fa-clipboard" /> |                                     <i className="fa fa-clipboard" /> | ||||||
|                                     {copied ? <FormattedMessage defaultMessage="Copied" description="Label for copy-to-clipboard button after a successful copy" /> |                                     {copied ? <FormattedMessage defaultMessage="Copied" description="Label for copy-to-clipboard button after a successful copy" /> | ||||||
|                                             : <FormattedMessage defaultMessage="Copy" description="Label for copy-to-clipboard button" />} |                                         : <FormattedMessage defaultMessage="Copy" description="Label for copy-to-clipboard button" />} | ||||||
|                                 </Button> |                                 </Button> | ||||||
|                             )} |                             )} | ||||||
|                         </CopyButton> |                         </CopyButton> | ||||||
| @@ -263,7 +263,7 @@ export default function MessageComponent(props: { message: Message, last: boolea | |||||||
|                             }}> |                             }}> | ||||||
|                                 <i className="fa fa-edit" /> |                                 <i className="fa fa-edit" /> | ||||||
|                                 <span> |                                 <span> | ||||||
|                                     {editing ? <FormattedMessage defaultMessage="Cancel" description="Label for a button that appears when the user is editing the text of one of their messages, to cancel without saving changes" />  |                                     {editing ? <FormattedMessage defaultMessage="Cancel" description="Label for a button that appears when the user is editing the text of one of their messages, to cancel without saving changes" /> | ||||||
|                                         : <FormattedMessage defaultMessage="Edit" description="Label for the button the user can click to edit the text of one of their messages" />} |                                         : <FormattedMessage defaultMessage="Edit" description="Label for the button the user can click to edit the text of one of their messages" />} | ||||||
|                                 </span> |                                 </span> | ||||||
|                             </Button> |                             </Button> | ||||||
|   | |||||||
| @@ -26,7 +26,7 @@ export interface OpenAIResponseChunk { | |||||||
|  |  | ||||||
| function parseResponseChunk(buffer: any): OpenAIResponseChunk { | function parseResponseChunk(buffer: any): OpenAIResponseChunk { | ||||||
|     const chunk = buffer.toString().replace('data: ', '').trim(); |     const chunk = buffer.toString().replace('data: ', '').trim(); | ||||||
|      |  | ||||||
|     if (chunk === '[DONE]') { |     if (chunk === '[DONE]') { | ||||||
|         return { |         return { | ||||||
|             done: true, |             done: true, | ||||||
| @@ -51,7 +51,7 @@ export async function createChatCompletion(messages: OpenAIMessage[], parameters | |||||||
|     const configuration = new Configuration({ |     const configuration = new Configuration({ | ||||||
|         apiKey: parameters.apiKey, |         apiKey: parameters.apiKey, | ||||||
|     }); |     }); | ||||||
|      |  | ||||||
|     const openai = new OpenAIApi(configuration); |     const openai = new OpenAIApi(configuration); | ||||||
|  |  | ||||||
|     const response = await openai.createChatCompletion({ |     const response = await openai.createChatCompletion({ | ||||||
| @@ -129,6 +129,7 @@ export async function createStreamingChatCompletion(messages: OpenAIMessage[], p | |||||||
|     }); |     }); | ||||||
|  |  | ||||||
|     eventSource.addEventListener('message', async (event: any) => { |     eventSource.addEventListener('message', async (event: any) => { | ||||||
|  |  | ||||||
|         if (event.data === '[DONE]') { |         if (event.data === '[DONE]') { | ||||||
|             emitter.emit('done'); |             emitter.emit('done'); | ||||||
|             return; |             return; | ||||||
| @@ -147,7 +148,7 @@ export async function createStreamingChatCompletion(messages: OpenAIMessage[], p | |||||||
|  |  | ||||||
|     eventSource.stream(); |     eventSource.stream(); | ||||||
|  |  | ||||||
|     return {  |     return { | ||||||
|         emitter, |         emitter, | ||||||
|         cancel: () => eventSource.close(), |         cancel: () => eventSource.close(), | ||||||
|     }; |     }; | ||||||
|   | |||||||
							
								
								
									
										8
									
								
								server/src/endpoints/whisper.ts
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										8
									
								
								server/src/endpoints/whisper.ts
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,8 @@ | |||||||
|  | import express from 'express'; | ||||||
|  | import RequestHandler from "./base"; | ||||||
|  |  | ||||||
|  | export default class WhisperRequestHandler extends RequestHandler { | ||||||
|  |     handler(req: express.Request, res: express.Response): any { | ||||||
|  |         res.json({ status: 'ok' }); | ||||||
|  |     } | ||||||
|  | } | ||||||
| @@ -18,6 +18,7 @@ import BasicCompletionRequestHandler from './endpoints/completion/basic'; | |||||||
| import StreamingCompletionRequestHandler from './endpoints/completion/streaming'; | import StreamingCompletionRequestHandler from './endpoints/completion/streaming'; | ||||||
| import SessionRequestHandler from './endpoints/session'; | import SessionRequestHandler from './endpoints/session'; | ||||||
| import GetShareRequestHandler from './endpoints/get-share'; | import GetShareRequestHandler from './endpoints/get-share'; | ||||||
|  | import WhisperRequestHandler from './endpoints/whisper'; | ||||||
| import { configurePassport } from './passport'; | import { configurePassport } from './passport'; | ||||||
| import { configureAuth0 } from './auth0'; | import { configureAuth0 } from './auth0'; | ||||||
| import DeleteChatRequestHandler from './endpoints/delete-chat'; | import DeleteChatRequestHandler from './endpoints/delete-chat'; | ||||||
| @@ -82,6 +83,7 @@ export default class ChatServer { | |||||||
|         this.app.post('/chatapi/sync', (req, res) => new SyncRequestHandler(this, req, res)); |         this.app.post('/chatapi/sync', (req, res) => new SyncRequestHandler(this, req, res)); | ||||||
|         this.app.get('/chatapi/share/:id', (req, res) => new GetShareRequestHandler(this, req, res)); |         this.app.get('/chatapi/share/:id', (req, res) => new GetShareRequestHandler(this, req, res)); | ||||||
|         this.app.post('/chatapi/share', (req, res) => new ShareRequestHandler(this, req, res)); |         this.app.post('/chatapi/share', (req, res) => new ShareRequestHandler(this, req, res)); | ||||||
|  |         this.app.post('/chatapi/whisper', (req, res) => new WhisperRequestHandler(this, req, res)); | ||||||
|  |  | ||||||
|         if (process.env.ENABLE_SERVER_COMPLETION) { |         if (process.env.ENABLE_SERVER_COMPLETION) { | ||||||
|             this.app.post('/chatapi/completion', (req, res) => new BasicCompletionRequestHandler(this, req, res)); |             this.app.post('/chatapi/completion', (req, res) => new BasicCompletionRequestHandler(this, req, res)); | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user