feat(socket): allow full customization of socket servers

timmywil · timmywil · commit d50a95998b71 · 2021-03-15T15:52:44.000-04:00
BREAKING CHANGE: this changes the API for asrSocketServer, googleASRSocketServer,
  and startStream() so that more WebSocket options can be passed as arguments.

To migrate, change asrSocketServer(server) to asrSocketServer({ server }).
Change googleASRSocketServer(server) to googleASRSocketServer({ server }).
Change startStream(() => isPlaying) to startStream({ isPlaying: () => isPlaying }).
diff --git a/README.md b/README.md
@@ -52,7 +52,7 @@ If you'd prefer to use Google ASR, follow these [instructions for setting up Goo
 
 ▸ **spokestackMiddleware**(): function
 
-_Defined in [server/expressMiddleware.ts:37](https://github.com/spokestack/node-spokestack/blob/7555411/src/server/expressMiddleware.ts#L37)_
+_Defined in [server/expressMiddleware.ts:37](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/server/expressMiddleware.ts#L37)_
 
 Express middleware for adding a proxy to the Spokestack GraphQL API.
 A proxy is necessary to avoid exposing your Spokestack token secret on the client.
@@ -87,9 +87,9 @@ const graphQLFetcher = (graphQLParams) =>
 
 ### asrSocketServer
 
-▸ **asrSocketServer**(`server`: Server, `asrConfig?`: Omit<SpokestackASRConfig, \"sampleRate\"\>): void
+▸ **asrSocketServer**(`serverConfig`: ServerOptions, `asrConfig?`: Omit<SpokestackASRConfig, \"sampleRate\"\>): void
 
-_Defined in [server/socketServer.ts:25](https://github.com/spokestack/node-spokestack/blob/7555411/src/server/socketServer.ts#L25)_
+_Defined in [server/socketServer.ts:25](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/server/socketServer.ts#L25)_
 
 Adds a web socket server to the given HTTP server
 to stream ASR using Spokestack ASR.
@@ -100,28 +100,28 @@ import { createServer } from 'http'
 const port = parseInt(process.env.PORT || '3000', 10)
 const server = createServer() // or express()
 // Attach the websocket server to the HTTP server
-asrSocketServer(server)
+asrSocketServer({ server })
 server.listen(port, () => {
   console.log(`Listening at http://localhost:${port}`)
 })
 ```
 
 #### Parameters:
 
-| Name        | Type                                       | Default value |
-| ----------- | ------------------------------------------ | ------------- |
-| `server`    | Server                                     | -             |
-| `asrConfig` | Omit<SpokestackASRConfig, \"sampleRate\"\> | {}            |
+| Name           | Type                                       | Default value |
+| -------------- | ------------------------------------------ | ------------- |
+| `serverConfig` | ServerOptions                              | -             |
+| `asrConfig`    | Omit<SpokestackASRConfig, \"sampleRate\"\> | {}            |
 
 **Returns:** void
 
 ---
 
 ### googleASRSocketServer
 
-▸ **googleASRSocketServer**(`server`: Server): void
+▸ **googleASRSocketServer**(`serverConfig`: ServerOptions): void
 
-_Defined in [server/socketServer.ts:110](https://github.com/spokestack/node-spokestack/blob/7555411/src/server/socketServer.ts#L110)_
+_Defined in [server/socketServer.ts:110](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/server/socketServer.ts#L110)_
 
 Adds a web socket server to the given HTTP server
 to stream ASR using Google Speech.
@@ -132,25 +132,25 @@ import { createServer } from 'http'
 const port = parseInt(process.env.PORT || '3000', 10)
 const server = createServer() // or express()
 // Attach the websocket server to the HTTP server
-googleASRSocketServer(server)
+googleASRSocketServer({ server })
 server.listen(port, () => {
   console.log(`Listening at http://localhost:${port}`)
 })
 ```
 
 #### Parameters:
 
-| Name     | Type   |
-| -------- | ------ |
-| `server` | Server |
+| Name           | Type          |
+| -------------- | ------------- |
+| `serverConfig` | ServerOptions |
 
 **Returns:** void
 
 ### asr
 
 ▸ **asr**(`content`: string \| Uint8Array, `sampleRate`: number): Promise<string \| null\>
 
-_Defined in [server/asr.ts:43](https://github.com/spokestack/node-spokestack/blob/7555411/src/server/asr.ts#L43)_
+_Defined in [server/asr.ts:43](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/server/asr.ts#L43)_
 
 A one-off method for processing speech to text
 using Spokestack ASR.
@@ -203,7 +203,7 @@ expressApp.post('/asr', fileUpload(), (req, res) => {
 
 ▸ **googleASR**(`content`: string \| Uint8Array, `sampleRate`: number): Promise<string \| null\>
 
-_Defined in [server/asr.ts:97](https://github.com/spokestack/node-spokestack/blob/7555411/src/server/asr.ts#L97)_
+_Defined in [server/asr.ts:97](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/server/asr.ts#L97)_
 
 A one-off method for processing speech to text
 using Google Speech.
@@ -254,7 +254,7 @@ expressApp.post('/asr', fileUpload(), (req, res) => {
 
 ▸ **encryptSecret**(`body`: string): string
 
-_Defined in [server/encryptSecret.ts:13](https://github.com/spokestack/node-spokestack/blob/7555411/src/server/encryptSecret.ts#L13)_
+_Defined in [server/encryptSecret.ts:13](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/server/encryptSecret.ts#L13)_
 
 This is a convenience method for properly authorizing
 requests to the Spokestack graphql API.
@@ -283,7 +283,7 @@ These functions are available exports from `spokestack/client`.
 
 ▸ **record**(`config?`: RecordConfig): Promise<AudioBuffer\>
 
-_Defined in [client/record.ts:84](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/record.ts#L84)_
+_Defined in [client/record.ts:84](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/record.ts#L84)_
 
 A method to record audio for a given number of seconds
 
@@ -363,31 +363,31 @@ fetch('/asr', {
 
 • `Optional` **onProgress**: undefined \| (remaining: number) => void
 
-_Defined in [client/record.ts:16](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/record.ts#L16)_
+_Defined in [client/record.ts:16](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/record.ts#L16)_
 
 A callback function to be called each second of recording.
 
 ##### onStart
 
 • `Optional` **onStart**: undefined \| () => void
 
-_Defined in [client/record.ts:14](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/record.ts#L14)_
+_Defined in [client/record.ts:14](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/record.ts#L14)_
 
 A callback function to be called when recording starts
 
 ##### time
 
 • `Optional` **time**: undefined \| number
 
-_Defined in [client/record.ts:12](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/record.ts#L12)_
+_Defined in [client/record.ts:12](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/record.ts#L12)_
 
 The total time to record. Default: 3
 
 ### startStream
 
-▸ **startStream**(`isPlaying`: () => boolean): Promise<WebSocket, [ProcessorReturnValue]\>
+▸ **startStream**(`__namedParameters`: { address: undefined \| string ; isPlaying: () => boolean }): Promise<WebSocket, [ProcessorReturnValue]\>
 
-_Defined in [client/recordStream.ts:29](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/recordStream.ts#L29)_
+_Defined in [client/recordStream.ts:44](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/recordStream.ts#L44)_
 
 Starts recording using a native WebSocket and resolves with the socket and processor.
 Unless an `address` is given, this assumes the socket is hosted on the current server.
@@ -397,7 +397,10 @@ import { startStream } from 'spokestack/client'
 
 // ...
 try {
-  const [ws] = await startStream(() => this.isPlaying)
+  const [ws] = await startStream({
+    address: 'wss://localhost:3000',
+    isPlaying: () => this.isPlaying
+  })
   ws.addEventListener('open', () => console.log('Recording started'))
   ws.addEventListener('close', () => console.log('Recording stopped'))
   ws.addEventListener('message', (e) => console.log('Speech processed: ', e.data))
@@ -408,9 +411,9 @@ try {
 
 #### Parameters:
 
-| Name        | Type          | Description                                                                                                   |
-| ----------- | ------------- | ------------------------------------------------------------------------------------------------------------- |
-| `isPlaying` | () => boolean | A function returning whether audio is currently playing. This is necessary to prevent recording played audio. |
+| Name                | Type                                                        |
+| ------------------- | ----------------------------------------------------------- |
+| `__namedParameters` | { address: undefined \| string ; isPlaying: () => boolean } |
 
 **Returns:** Promise<WebSocket, [ProcessorReturnValue]\>
 
@@ -420,7 +423,7 @@ try {
 
 ▸ **stopStream**(): void
 
-_Defined in [client/recordStream.ts:80](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/recordStream.ts#L80)_
+_Defined in [client/recordStream.ts:97](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/recordStream.ts#L97)_
 
 Stop the current recording stream if one exists.
 
@@ -435,7 +438,7 @@ stopStream()
 
 ▸ **convertFloat32ToInt16**(`fp32Samples`: Float32Array): Int16Array
 
-_Defined in [client/convertFloat32ToInt16.ts:16](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/convertFloat32ToInt16.ts#L16)_
+_Defined in [client/convertFloat32ToInt16.ts:16](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/convertFloat32ToInt16.ts#L16)_
 
 A utility method to convert Float32Array audio
 to an Int16Array to be passed directly to Speech APIs
@@ -466,7 +469,7 @@ These are low-level functions for working with your own processors, available fr
 
 ▸ **startProcessor**(): Promise<Error] \| [null, [ProcessorReturnValue]\>
 
-_Defined in [client/processor.ts:32](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/processor.ts#L32)_
+_Defined in [client/processor.ts:32](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/processor.ts#L32)_
 
 Underlying utility method for recording audio,
 used by the `record` and `recordStream` methods.
@@ -485,7 +488,7 @@ We'll switch to AudioWorklet when it does.
 
 ▸ **stopProcessor**(): void
 
-_Defined in [client/processor.ts:60](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/processor.ts#L60)_
+_Defined in [client/processor.ts:60](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/processor.ts#L60)_
 
 Underlying utility method to stop the current processor
 if it exists and disconnect the microphone.
@@ -498,19 +501,19 @@ if it exists and disconnect the microphone.
 
 • **context**: AudioContext
 
-_Defined in [client/processor.ts:18](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/processor.ts#L18)_
+_Defined in [client/processor.ts:18](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/processor.ts#L18)_
 
 ##### processor
 
 • **processor**: ScriptProcessorNode
 
-_Defined in [client/processor.ts:19](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/processor.ts#L19)_
+_Defined in [client/processor.ts:19](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/processor.ts#L19)_
 
 ### concatenateAudioBuffers
 
 ▸ **concatenateAudioBuffers**(`buffer1`: AudioBuffer \| null, `buffer2`: AudioBuffer \| null, `context`: AudioContext): null \| AudioBuffer
 
-_Defined in [client/concatenateAudioBuffers.ts:4](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/concatenateAudioBuffers.ts#L4)_
+_Defined in [client/concatenateAudioBuffers.ts:4](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/concatenateAudioBuffers.ts#L4)_
 
 A utility method to concatenate two AudioBuffers
 
@@ -528,7 +531,7 @@ A utility method to concatenate two AudioBuffers
 
 ▸ **countdown**(`time`: number, `progress`: (remaining: number) => void, `complete`: () => void): void
 
-_Defined in [client/countdown.ts:7](https://github.com/spokestack/node-spokestack/blob/7555411/src/client/countdown.ts#L7)_
+_Defined in [client/countdown.ts:7](https://github.com/spokestack/node-spokestack/blob/47dbb86/src/client/countdown.ts#L7)_
 
 Countdown a number of seconds
 
diff --git a/examples/with-next/pages/index.tsx b/examples/with-next/pages/index.tsx
@@ -177,7 +177,7 @@ export default class Index extends PureComponent {
     } else {
       this.initialize()
       try {
-        const [ws] = await startStream(() => this.playing)
+        const [ws] = await startStream({ isPlaying: () => this.playing })
         ws.addEventListener('open', () =>
           this.setState({ status: 'Recording...', streaming: true })
         )
diff --git a/examples/with-next/server/index.ts b/examples/with-next/server/index.ts
@@ -107,9 +107,9 @@ app.prepare().then(() => {
 
   const server = createServer(expressApp)
   if (useGoogleAsr) {
-    googleASRSocketServer(server)
+    googleASRSocketServer({ server })
   } else {
-    asrSocketServer(server)
+    asrSocketServer({ server })
   }
   server.listen(port, () => {
     console.log(`Listening at http://localhost:${port}`)
diff --git a/src/client/recordStream.ts b/src/client/recordStream.ts
@@ -5,6 +5,21 @@ import { setCookie } from '../cookies'
 
 let stop: (() => void) | undefined
 
+interface StartStreamOptions {
+  /**
+   * The address (with protocol and port) of the Spokestack ASR websocket.
+   * Defaults to the same domain and port as the current window location,
+   * but with ws(s) as the protocol (depending on https).
+   * See asrSocketServer for help creating a socket server.
+   */
+  address?: string
+  /**
+   * A function returning whether audio is currently playing.
+   * This is necessary to prevent recording played audio.
+   */
+  isPlaying: () => boolean
+}
+
 /**
  * Starts recording using a native WebSocket and resolves with the socket and processor.
  * Unless an `address` is given, this assumes the socket is hosted on the current server.
@@ -14,30 +29,32 @@ let stop: (() => void) | undefined
  *
  * // ...
  * try {
- *   const [ws] = await startStream(() => this.isPlaying)
+ *   const [ws] = await startStream({
+ *    address: 'wss://localhost:3000',
+ *    isPlaying: () => this.isPlaying
+ *   })
  *   ws.addEventListener('open', () => console.log('Recording started'))
  *   ws.addEventListener('close', () => console.log('Recording stopped'))
  *   ws.addEventListener('message', (e) => console.log('Speech processed: ', e.data))
  * } catch (e) {
  *   console.error(e)
  * }
  * ```
- *
- * @param isPlaying A function returning whether audio is currently playing.
- *   This is necessary to prevent recording played audio.
  */
-export async function startStream(
-  isPlaying: () => boolean
-): Promise<[WebSocket, ProcessorReturnValue]> {
+export async function startStream({
+  address,
+  isPlaying
+}: StartStreamOptions): Promise<[WebSocket, ProcessorReturnValue]> {
+  if (!address) {
+    address = `${location.protocol === 'https:' ? 'wss:' : 'ws:'}//${location.hostname}${
+      location.port ? `:${location.port}` : ''
+    }`
+  }
   const [error, result] = await startProcessor()
   if (error) {
     throw error
   }
   const { context, processor } = result as ProcessorReturnValue
-  const address = `${location.protocol === 'https:' ? 'wss:' : 'ws:'}//${location.hostname}${
-    location.port ? `:${location.port}` : ''
-  }`
-
   const ws = new WebSocket(address)
   setCookie('sampleRate', context.sampleRate + '')
 
diff --git a/src/server/socketServer.ts b/src/server/socketServer.ts
@@ -1,6 +1,4 @@
 import spokestackService, { SpokestackASRConfig } from './spokestackASRService'
-
-import { Server } from 'http'
 import { SpeechClient } from '@google-cloud/speech'
 import WebSocket from 'ws'
 import { getCookie } from '../cookies'
@@ -16,17 +14,17 @@ import { google } from '@google-cloud/speech/build/protos/protos'
  * const port = parseInt(process.env.PORT || '3000', 10)
  * const server = createServer() // or express()
  * // Attach the websocket server to the HTTP server
- * asrSocketServer(server)
+ * asrSocketServer({ server })
  * server.listen(port, () => {
  *   console.log(`Listening at http://localhost:${port}`)
  * })
  * ```
  */
 export function asrSocketServer(
-  server: Server,
+  serverConfig: WebSocket.ServerOptions,
   asrConfig: Omit<SpokestackASRConfig, 'sampleRate'> = {}
 ): void {
-  const wss = new WebSocket.Server({ server })
+  const wss = new WebSocket.Server(serverConfig)
   console.log('Websocket started')
 
   wss.on('connection', async (ws, request) => {
@@ -101,14 +99,14 @@ export function asrSocketServer(
  * const port = parseInt(process.env.PORT || '3000', 10)
  * const server = createServer() // or express()
  * // Attach the websocket server to the HTTP server
- * googleASRSocketServer(server)
+ * googleASRSocketServer({ server })
  * server.listen(port, () => {
  *   console.log(`Listening at http://localhost:${port}`)
  * })
  * ```
  */
-export function googleASRSocketServer(server: Server): void {
-  const wss = new WebSocket.Server({ server })
+export function googleASRSocketServer(serverConfig: WebSocket.ServerOptions): void {
+  const wss = new WebSocket.Server(serverConfig)
   console.log('Websocket started')
 
   wss.on('connection', (ws, request) => {

Original file line number	Diff line number	Diff line change
`@@ -177,7 +177,7 @@ export default class Index extends PureComponent {`
`177`	`177`	`} else {`
`178`	`178`	`this.initialize()`
`179`	`179`	`try {`
`180`		`- const [ws] = await startStream(() => this.playing)`
	`180`	`+ const [ws] = await startStream({ isPlaying: () => this.playing })`
`181`	`181`	`ws.addEventListener('open', () =>`
`182`	`182`	`this.setState({ status: 'Recording...', streaming: true })`
`183`	`183`	`)`