├── .eslintrc.json ├── .gitignore ├── .prettierrc ├── README.md ├── package-lock.json ├── public ├── index.html ├── openai-logomark.svg └── robots.txt ├── readme ├── readme.png └── realtime-console-demo.png ├── relay-server ├── index.js └── lib │ └── relay.js ├── src ├── App.scss ├── App.tsx ├── components │ ├── Map.scss │ ├── Map.tsx │ ├── button │ │ ├── Button.scss │ │ └── Button.tsx │ └── toggle │ │ ├── Toggle.scss │ │ └── Toggle.tsx ├── index.css ├── index.tsx ├── lib │ └── wavtools │ │ ├── index.js │ │ └── lib │ │ ├── analysis │ │ ├── audio_analysis.js │ │ └── constants.js │ │ ├── wav_packer.js │ │ ├── wav_recorder.js │ │ ├── wav_stream_player.js │ │ └── worklets │ │ ├── audio_processor.js │ │ └── stream_processor.js ├── logo.svg ├── pages │ ├── ConsolePage.scss │ ├── ConsolePage.tsx │ └── globals.d.ts ├── react-app-env.d.ts ├── reportWebVitals.ts ├── setupTests.ts └── utils │ ├── conversation_config.js │ └── wav_renderer.ts └── tsconfig.json /.eslintrc.json: -------------------------------------------------------------------------------- 1 | { 2 | "parserOptions": { 3 | "sourceType": "module" 4 | }, 5 | "env": { 6 | "es2022": true 7 | } 8 | } 9 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | # Logs 2 | logs 3 | *.log 4 | npm-debug.log* 5 | yarn-debug.log* 6 | yarn-error.log* 7 | lerna-debug.log* 8 | .pnpm-debug.log* 9 | 10 | # Diagnostic reports (https://nodejs.org/api/report.html) 11 | report.[0-9]*.[0-9]*.[0-9]*.[0-9]*.json 12 | 13 | # Runtime data 14 | pids 15 | *.pid 16 | *.seed 17 | *.pid.lock 18 | 19 | # Directory for instrumented libs generated by jscoverage/JSCover 20 | lib-cov 21 | 22 | # Coverage directory used by tools like istanbul 23 | coverage 24 | *.lcov 25 | 26 | # nyc test coverage 27 | .nyc_output 28 | 29 | # Grunt intermediate storage (https://gruntjs.com/creating-plugins#storing-task-files) 30 | .grunt 31 | 32 | # Bower dependency directory (https://bower.io/) 33 | bower_components 34 | 35 | # node-waf configuration 36 | .lock-wscript 37 | 38 | # Compiled binary addons (https://nodejs.org/api/addons.html) 39 | build/Release 40 | 41 | # Dependency directories 42 | node_modules/ 43 | jspm_packages/ 44 | 45 | # Snowpack dependency directory (https://snowpack.dev/) 46 | web_modules/ 47 | 48 | # TypeScript cache 49 | *.tsbuildinfo 50 | 51 | # Optional npm cache directory 52 | .npm 53 | 54 | # Optional eslint cache 55 | .eslintcache 56 | 57 | # Optional stylelint cache 58 | .stylelintcache 59 | 60 | # Microbundle cache 61 | .rpt2_cache/ 62 | .rts2_cache_cjs/ 63 | .rts2_cache_es/ 64 | .rts2_cache_umd/ 65 | 66 | # Optional REPL history 67 | .node_repl_history 68 | 69 | # Output of 'npm pack' 70 | *.tgz 71 | 72 | # Yarn Integrity file 73 | .yarn-integrity 74 | 75 | # dotenv environment variable files 76 | .env 77 | .env.development.local 78 | .env.test.local 79 | .env.production.local 80 | .env.local 81 | 82 | # parcel-bundler cache (https://parceljs.org/) 83 | .cache 84 | .parcel-cache 85 | 86 | # Next.js build output 87 | .next 88 | out 89 | 90 | # Nuxt.js build / generate output 91 | .nuxt 92 | dist 93 | 94 | # Gatsby files 95 | .cache/ 96 | # Comment in the public line in if your project uses Gatsby and not Next.js 97 | # https://nextjs.org/blog/next-9-1#public-directory-support 98 | # public 99 | 100 | # vuepress build output 101 | .vuepress/dist 102 | 103 | # vuepress v2.x temp and cache directory 104 | .temp 105 | .cache 106 | 107 | # 
Docusaurus cache and generated files 108 | .docusaurus 109 | 110 | # Serverless directories 111 | .serverless/ 112 | 113 | # FuseBox cache 114 | .fusebox/ 115 | 116 | # DynamoDB Local files 117 | .dynamodb/ 118 | 119 | # TernJS port file 120 | .tern-port 121 | 122 | # Stores VSCode versions used for testing VSCode extensions 123 | .vscode-test 124 | 125 | # yarn v2 126 | .yarn/cache 127 | .yarn/unplugged 128 | .yarn/build-state.yml 129 | .yarn/install-state.gz 130 | .pnp.* 131 | -------------------------------------------------------------------------------- /.prettierrc: -------------------------------------------------------------------------------- 1 | { 2 | "tabWidth": 2, 3 | "useTabs": false, 4 | "singleQuote": true 5 | } 6 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # OpenAI Realtime Console 2 | 3 | The OpenAI Realtime Console is intended as an inspector and interactive API reference 4 | for the OpenAI Realtime API. It comes packaged with two utility libraries, 5 | [openai/openai-realtime-api-beta](https://github.com/openai/openai-realtime-api-beta) 6 | that acts as a **Reference Client** (for browser and Node.js) and 7 | [`/src/lib/wavtools`](./src/lib/wavtools) which allows for simple audio 8 | management in the browser. 9 | 10 | 11 | -------------------------------------------------------------------------------- /public/index.html: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | realtime console 8 | 9 | 13 | 14 | 20 | 25 | 26 | 27 | 28 |
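<!-- src/index.tsx mounts the React app into the element with id="root" -->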
29 | 39 | 40 | 41 | -------------------------------------------------------------------------------- /public/openai-logomark.svg: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /public/robots.txt: -------------------------------------------------------------------------------- 1 | # https://www.robotstxt.org/robotstxt.html 2 | User-agent: * 3 | Disallow: 4 | -------------------------------------------------------------------------------- /readme/readme.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CharmingMonkeyDev/AI-call-agent-in-real-time/07ff3b62aaa906063fcec66612f3065f5bc8f5c0/readme/readme.png -------------------------------------------------------------------------------- /readme/realtime-console-demo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CharmingMonkeyDev/AI-call-agent-in-real-time/07ff3b62aaa906063fcec66612f3065f5bc8f5c0/readme/realtime-console-demo.png -------------------------------------------------------------------------------- /relay-server/index.js: -------------------------------------------------------------------------------- 1 | import { RealtimeRelay } from './lib/relay.js'; 2 | import dotenv from 'dotenv'; 3 | dotenv.config({ override: true }); 4 | 5 | const OPENAI_API_KEY = process.env.OPENAI_API_KEY; 6 | 7 | if (!OPENAI_API_KEY) { 8 | console.error( 9 | `Environment variable "OPENAI_API_KEY" is required.\n` + 10 | `Please set it in your .env file.` 11 | ); 12 | process.exit(1); 13 | } 14 | 15 | const PORT = parseInt(process.env.PORT) || 8081; 16 | 17 | const relay = new RealtimeRelay(OPENAI_API_KEY); 18 | relay.listen(PORT); 19 | -------------------------------------------------------------------------------- /relay-server/lib/relay.js: -------------------------------------------------------------------------------- 1 | import { WebSocketServer } from 'ws'; 2 | import { RealtimeClient } from '@openai/realtime-api-beta'; 3 | 4 | export class RealtimeRelay { 5 | constructor(apiKey) { 6 | this.apiKey = apiKey; 7 | this.sockets = new WeakMap(); 8 | this.wss = null; 9 | } 10 | 11 | listen(port) { 12 | this.wss = new WebSocketServer({ port }); 13 | this.wss.on('connection', this.connectionHandler.bind(this)); 14 | this.log(`Listening on ws://localhost:${port}`); 15 | } 16 | 17 | async connectionHandler(ws, req) { 18 | if (!req.url) { 19 | this.log('No URL provided, closing connection.'); 20 | ws.close(); 21 | return; 22 | } 23 | 24 | const url = new URL(req.url, `http://${req.headers.host}`); 25 | const pathname = url.pathname; 26 | 27 | if (pathname !== '/') { 28 | this.log(`Invalid pathname: "${pathname}"`); 29 | ws.close(); 30 | return; 31 | } 32 | 33 | // Instantiate new client 34 | this.log(`Connecting with key "${this.apiKey.slice(0, 3)}..."`); 35 | const client = new RealtimeClient({ apiKey: this.apiKey }); 36 | 37 | // Relay: OpenAI Realtime API Event -> Browser Event 38 | client.realtime.on('server.*', (event) => { 39 | this.log(`Relaying "${event.type}" to Client`); 40 | ws.send(JSON.stringify(event)); 41 | }); 42 | client.realtime.on('close', () => ws.close()); 43 | 44 | // Relay: Browser Event -> OpenAI Realtime API Event 45 | // We need to queue data waiting for the OpenAI connection 46 | const messageQueue = []; 47 | const messageHandler = (data) => { 48 | try { 49 | const event = 
JSON.parse(data); 50 | this.log(`Relaying "${event.type}" to OpenAI`); 51 | client.realtime.send(event.type, event); 52 | } catch (e) { 53 | console.error(e.message); 54 | this.log(`Error parsing event from client: ${data}`); 55 | } 56 | }; 57 | ws.on('message', (data) => { 58 | if (!client.isConnected()) { 59 | messageQueue.push(data); 60 | } else { 61 | messageHandler(data); 62 | } 63 | }); 64 | ws.on('close', () => client.disconnect()); 65 | 66 | // Connect to OpenAI Realtime API 67 | try { 68 | this.log(`Connecting to OpenAI...`); 69 | await client.connect(); 70 | } catch (e) { 71 | this.log(`Error connecting to OpenAI: ${e.message}`); 72 | ws.close(); 73 | return; 74 | } 75 | this.log(`Connected to OpenAI successfully!`); 76 | while (messageQueue.length) { 77 | messageHandler(messageQueue.shift()); 78 | } 79 | } 80 | 81 | log(...args) { 82 | console.log(`[RealtimeRelay]`, ...args); 83 | } 84 | } 85 | -------------------------------------------------------------------------------- /src/App.scss: -------------------------------------------------------------------------------- 1 | [data-component='App'] { 2 | height: 100%; 3 | width: 100%; 4 | position: relative; 5 | } 6 | -------------------------------------------------------------------------------- /src/App.tsx: -------------------------------------------------------------------------------- 1 | import { ConsolePage } from './pages/ConsolePage'; 2 | import './App.scss'; 3 | 4 | function App() { 5 | return ( 6 |
<div data-component="App"> 7 | <ConsolePage /> 8 | </div>
9 | ); 10 | } 11 | 12 | export default App; 13 | -------------------------------------------------------------------------------- /src/components/Map.scss: -------------------------------------------------------------------------------- 1 | [data-component='Map'] { 2 | position: absolute; 3 | width: 100%; 4 | height: 100%; 5 | .leaflet-container { 6 | height: 100%; 7 | width: 100%; 8 | } 9 | } 10 | -------------------------------------------------------------------------------- /src/components/Map.tsx: -------------------------------------------------------------------------------- 1 | import { MapContainer, TileLayer, Marker, Popup, useMap } from 'react-leaflet'; 2 | import { LatLngTuple } from 'leaflet'; 3 | import './Map.scss'; 4 | 5 | function ChangeView({ center, zoom }: { center: LatLngTuple; zoom: number }) { 6 | const map = useMap(); 7 | map.setView(center, zoom); 8 | return null; 9 | } 10 | 11 | export function Map({ 12 | center, 13 | location = 'My Location', 14 | }: { 15 | center: LatLngTuple; 16 | location?: string; 17 | }) { 18 | return ( 19 |
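{/* Wrapper styled via Map.scss; the children render a react-leaflet MapContainer, with the ChangeView helper syncing the view to "center", a TileLayer basemap, and a Marker whose Popup shows "location". */}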
20 | 27 | 28 | 29 | 30 | {location} 31 | 32 | 33 |
34 | ); 35 | } 36 | -------------------------------------------------------------------------------- /src/components/button/Button.scss: -------------------------------------------------------------------------------- 1 | [data-component='Button'] { 2 | display: flex; 3 | align-items: center; 4 | gap: 8px; 5 | font-family: 'Roboto Mono', monospace; 6 | font-size: 12px; 7 | font-optical-sizing: auto; 8 | font-weight: 400; 9 | font-style: normal; 10 | border: none; 11 | background-color: #ececf1; 12 | color: #101010; 13 | border-radius: 1000px; 14 | padding: 8px 24px; 15 | min-height: 42px; 16 | transition: transform 0.1s ease-in-out, background-color 0.1s ease-in-out; 17 | outline: none; 18 | 19 | &.button-style-action { 20 | background-color: #101010; 21 | color: #ececf1; 22 | &:hover:not([disabled]) { 23 | background-color: #404040; 24 | } 25 | } 26 | 27 | &.button-style-alert { 28 | background-color: #f00; 29 | color: #ececf1; 30 | &:hover:not([disabled]) { 31 | background-color: #f00; 32 | } 33 | } 34 | 35 | &.button-style-flush { 36 | background-color: rgba(255, 255, 255, 0); 37 | } 38 | 39 | &[disabled] { 40 | color: #999; 41 | } 42 | 43 | &:not([disabled]) { 44 | cursor: pointer; 45 | } 46 | 47 | &:hover:not([disabled]) { 48 | background-color: #d8d8d8; 49 | } 50 | 51 | &:active:not([disabled]) { 52 | transform: translateY(1px); 53 | } 54 | 55 | .icon { 56 | display: flex; 57 | &.icon-start { 58 | margin-left: -8px; 59 | } 60 | &.icon-end { 61 | margin-right: -8px; 62 | } 63 | svg { 64 | width: 16px; 65 | height: 16px; 66 | } 67 | } 68 | 69 | &.icon-red .icon { 70 | color: #cc0000; 71 | } 72 | &.icon-green .icon { 73 | color: #009900; 74 | } 75 | &.icon-grey .icon { 76 | color: #909090; 77 | } 78 | &.icon-fill { 79 | svg { 80 | fill: currentColor; 81 | } 82 | } 83 | } 84 | -------------------------------------------------------------------------------- /src/components/button/Button.tsx: -------------------------------------------------------------------------------- 1 | import React from 'react'; 2 | import './Button.scss'; 3 | 4 | import { Icon } from 'react-feather'; 5 | 6 | interface ButtonProps extends React.ButtonHTMLAttributes { 7 | label?: string; 8 | icon?: Icon; 9 | iconPosition?: 'start' | 'end'; 10 | iconColor?: 'red' | 'green' | 'grey'; 11 | iconFill?: boolean; 12 | buttonStyle?: 'regular' | 'action' | 'alert' | 'flush'; 13 | } 14 | 15 | export function Button({ 16 | label = 'Okay', 17 | icon = void 0, 18 | iconPosition = 'start', 19 | iconColor = void 0, 20 | iconFill = false, 21 | buttonStyle = 'regular', 22 | ...rest 23 | }: ButtonProps) { 24 | const StartIcon = iconPosition === 'start' ? icon : null; 25 | const EndIcon = iconPosition === 'end' ? 
icon : null; 26 | const classList = []; 27 | if (iconColor) { 28 | classList.push(`icon-${iconColor}`); 29 | } 30 | if (iconFill) { 31 | classList.push(`icon-fill`); 32 | } 33 | classList.push(`button-style-${buttonStyle}`); 34 | 35 | return ( 36 | 49 | ); 50 | } 51 | -------------------------------------------------------------------------------- /src/components/toggle/Toggle.scss: -------------------------------------------------------------------------------- 1 | [data-component='Toggle'] { 2 | position: relative; 3 | display: flex; 4 | align-items: center; 5 | gap: 8px; 6 | cursor: pointer; 7 | overflow: hidden; 8 | 9 | background-color: #ececf1; 10 | color: #101010; 11 | height: 40px; 12 | border-radius: 1000px; 13 | 14 | &:hover { 15 | background-color: #d8d8d8; 16 | } 17 | 18 | div.label { 19 | position: relative; 20 | color: #666; 21 | transition: color 0.1s ease-in-out; 22 | padding: 0px 16px; 23 | z-index: 2; 24 | user-select: none; 25 | } 26 | 27 | div.label.right { 28 | margin-left: -8px; 29 | } 30 | 31 | .toggle-background { 32 | background-color: #101010; 33 | position: absolute; 34 | top: 0px; 35 | left: 0px; 36 | width: auto; 37 | bottom: 0px; 38 | z-index: 1; 39 | border-radius: 1000px; 40 | transition: left 0.1s ease-in-out, width 0.1s ease-in-out; 41 | } 42 | 43 | &[data-enabled='true'] { 44 | div.label.right { 45 | color: #fff; 46 | } 47 | } 48 | 49 | &[data-enabled='false'] { 50 | div.label.left { 51 | color: #fff; 52 | } 53 | } 54 | } 55 | -------------------------------------------------------------------------------- /src/components/toggle/Toggle.tsx: -------------------------------------------------------------------------------- 1 | import { useState, useEffect, useRef } from 'react'; 2 | 3 | import './Toggle.scss'; 4 | 5 | export function Toggle({ 6 | defaultValue = false, 7 | values, 8 | labels, 9 | onChange = () => {}, 10 | }: { 11 | defaultValue?: string | boolean; 12 | values?: string[]; 13 | labels?: string[]; 14 | onChange?: (isEnabled: boolean, value: string) => void; 15 | }) { 16 | if (typeof defaultValue === 'string') { 17 | defaultValue = !!Math.max(0, (values || []).indexOf(defaultValue)); 18 | } 19 | 20 | const leftRef = useRef(null); 21 | const rightRef = useRef(null); 22 | const bgRef = useRef(null); 23 | const [value, setValue] = useState(defaultValue); 24 | 25 | const toggleValue = () => { 26 | const v = !value; 27 | const index = +v; 28 | setValue(v); 29 | onChange(v, (values || [])[index]); 30 | }; 31 | 32 | useEffect(() => { 33 | const leftEl = leftRef.current; 34 | const rightEl = rightRef.current; 35 | const bgEl = bgRef.current; 36 | if (leftEl && rightEl && bgEl) { 37 | if (value) { 38 | bgEl.style.left = rightEl.offsetLeft + 'px'; 39 | bgEl.style.width = rightEl.offsetWidth + 'px'; 40 | } else { 41 | bgEl.style.left = ''; 42 | bgEl.style.width = leftEl.offsetWidth + 'px'; 43 | } 44 | } 45 | }, [value]); 46 | 47 | return ( 48 |
<div data-component="Toggle" onClick={toggleValue} data-enabled={value.toString()}> 53 | {labels && ( 54 | <div className="label left" ref={leftRef}>
55 | {labels[0]} 56 | </div>
57 | )} 58 | {labels && ( 59 | <div className="label right" ref={rightRef}>
60 | {labels[1]} 61 | </div>
62 | )} 63 | <div className="toggle-background" ref={bgRef}></div>
64 | </div>
65 | ); 66 | } 67 | -------------------------------------------------------------------------------- /src/index.css: -------------------------------------------------------------------------------- 1 | html, 2 | body { 3 | padding: 0px; 4 | margin: 0px; 5 | position: relative; 6 | width: 100%; 7 | height: 100%; 8 | font-family: 'Assistant', sans-serif; 9 | font-optical-sizing: auto; 10 | font-weight: 400; 11 | font-style: normal; 12 | color: #18181b; 13 | -webkit-font-smoothing: antialiased; 14 | -moz-osx-font-smoothing: grayscale; 15 | } 16 | 17 | #root { 18 | position: relative; 19 | width: 100%; 20 | height: 100%; 21 | } 22 | -------------------------------------------------------------------------------- /src/index.tsx: -------------------------------------------------------------------------------- 1 | import React from 'react'; 2 | import ReactDOM from 'react-dom/client'; 3 | import './index.css'; 4 | import App from './App'; 5 | import reportWebVitals from './reportWebVitals'; 6 | 7 | const root = ReactDOM.createRoot( 8 | document.getElementById('root') as HTMLElement 9 | ); 10 | root.render( 11 | 12 | 13 | 14 | ); 15 | 16 | // If you want to start measuring performance in your app, pass a function 17 | // to log results (for example: reportWebVitals(console.log)) 18 | // or send to an analytics endpoint. Learn more: https://bit.ly/CRA-vitals 19 | reportWebVitals(); 20 | -------------------------------------------------------------------------------- /src/lib/wavtools/index.js: -------------------------------------------------------------------------------- 1 | import { WavPacker } from './lib/wav_packer.js'; 2 | import { AudioAnalysis } from './lib/analysis/audio_analysis.js'; 3 | import { WavStreamPlayer } from './lib/wav_stream_player.js'; 4 | import { WavRecorder } from './lib/wav_recorder.js'; 5 | 6 | export { AudioAnalysis, WavPacker, WavStreamPlayer, WavRecorder }; 7 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/analysis/audio_analysis.js: -------------------------------------------------------------------------------- 1 | import { 2 | noteFrequencies, 3 | noteFrequencyLabels, 4 | voiceFrequencies, 5 | voiceFrequencyLabels, 6 | } from './constants.js'; 7 | 8 | /** 9 | * Output of AudioAnalysis for the frequency domain of the audio 10 | * @typedef {Object} AudioAnalysisOutputType 11 | * @property {Float32Array} values Amplitude of this frequency between {0, 1} inclusive 12 | * @property {number[]} frequencies Raw frequency bucket values 13 | * @property {string[]} labels Labels for the frequency bucket values 14 | */ 15 | 16 | /** 17 | * Analyzes audio for visual output 18 | * @class 19 | */ 20 | export class AudioAnalysis { 21 | /** 22 | * Retrieves frequency domain data from an AnalyserNode adjusted to a decibel range 23 | * returns human-readable formatting and labels 24 | * @param {AnalyserNode} analyser 25 | * @param {number} sampleRate 26 | * @param {Float32Array} [fftResult] 27 | * @param {"frequency"|"music"|"voice"} [analysisType] 28 | * @param {number} [minDecibels] default -100 29 | * @param {number} [maxDecibels] default -30 30 | * @returns {AudioAnalysisOutputType} 31 | */ 32 | static getFrequencies( 33 | analyser, 34 | sampleRate, 35 | fftResult, 36 | analysisType = 'frequency', 37 | minDecibels = -100, 38 | maxDecibels = -30, 39 | ) { 40 | if (!fftResult) { 41 | fftResult = new Float32Array(analyser.frequencyBinCount); 42 | analyser.getFloatFrequencyData(fftResult); 43 | } 44 | const nyquistFrequency = 
sampleRate / 2; 45 | const frequencyStep = (1 / fftResult.length) * nyquistFrequency; 46 | let outputValues; 47 | let frequencies; 48 | let labels; 49 | if (analysisType === 'music' || analysisType === 'voice') { 50 | const useFrequencies = 51 | analysisType === 'voice' ? voiceFrequencies : noteFrequencies; 52 | const aggregateOutput = Array(useFrequencies.length).fill(minDecibels); 53 | for (let i = 0; i < fftResult.length; i++) { 54 | const frequency = i * frequencyStep; 55 | const amplitude = fftResult[i]; 56 | for (let n = useFrequencies.length - 1; n >= 0; n--) { 57 | if (frequency > useFrequencies[n]) { 58 | aggregateOutput[n] = Math.max(aggregateOutput[n], amplitude); 59 | break; 60 | } 61 | } 62 | } 63 | outputValues = aggregateOutput; 64 | frequencies = 65 | analysisType === 'voice' ? voiceFrequencies : noteFrequencies; 66 | labels = 67 | analysisType === 'voice' ? voiceFrequencyLabels : noteFrequencyLabels; 68 | } else { 69 | outputValues = Array.from(fftResult); 70 | frequencies = outputValues.map((_, i) => frequencyStep * i); 71 | labels = frequencies.map((f) => `${f.toFixed(2)} Hz`); 72 | } 73 | // We normalize to {0, 1} 74 | const normalizedOutput = outputValues.map((v) => { 75 | return Math.max( 76 | 0, 77 | Math.min((v - minDecibels) / (maxDecibels - minDecibels), 1), 78 | ); 79 | }); 80 | const values = new Float32Array(normalizedOutput); 81 | return { 82 | values, 83 | frequencies, 84 | labels, 85 | }; 86 | } 87 | 88 | /** 89 | * Creates a new AudioAnalysis instance for an HTMLAudioElement 90 | * @param {HTMLAudioElement} audioElement 91 | * @param {AudioBuffer|null} [audioBuffer] If provided, will cache all frequency domain data from the buffer 92 | * @returns {AudioAnalysis} 93 | */ 94 | constructor(audioElement, audioBuffer = null) { 95 | this.fftResults = []; 96 | if (audioBuffer) { 97 | /** 98 | * Modified from 99 | * https://stackoverflow.com/questions/75063715/using-the-web-audio-api-to-analyze-a-song-without-playing 100 | * 101 | * We do this to populate FFT values for the audio if provided an `audioBuffer` 102 | * The reason to do this is that Safari fails when using `createMediaElementSource` 103 | * This has a non-zero RAM cost so we only opt-in to run it on Safari, Chrome is better 104 | */ 105 | const { length, sampleRate } = audioBuffer; 106 | const offlineAudioContext = new OfflineAudioContext({ 107 | length, 108 | sampleRate, 109 | }); 110 | const source = offlineAudioContext.createBufferSource(); 111 | source.buffer = audioBuffer; 112 | const analyser = offlineAudioContext.createAnalyser(); 113 | analyser.fftSize = 8192; 114 | analyser.smoothingTimeConstant = 0.1; 115 | source.connect(analyser); 116 | // limit is :: 128 / sampleRate; 117 | // but we just want 60fps - cuts ~1s from 6MB to 1MB of RAM 118 | const renderQuantumInSeconds = 1 / 60; 119 | const durationInSeconds = length / sampleRate; 120 | const analyze = (index) => { 121 | const suspendTime = renderQuantumInSeconds * index; 122 | if (suspendTime < durationInSeconds) { 123 | offlineAudioContext.suspend(suspendTime).then(() => { 124 | const fftResult = new Float32Array(analyser.frequencyBinCount); 125 | analyser.getFloatFrequencyData(fftResult); 126 | this.fftResults.push(fftResult); 127 | analyze(index + 1); 128 | }); 129 | } 130 | if (index === 1) { 131 | offlineAudioContext.startRendering(); 132 | } else { 133 | offlineAudioContext.resume(); 134 | } 135 | }; 136 | source.start(0); 137 | analyze(1); 138 | this.audio = audioElement; 139 | this.context = offlineAudioContext; 140 | this.analyser 
= analyser; 141 | this.sampleRate = sampleRate; 142 | this.audioBuffer = audioBuffer; 143 | } else { 144 | const audioContext = new AudioContext(); 145 | const track = audioContext.createMediaElementSource(audioElement); 146 | const analyser = audioContext.createAnalyser(); 147 | analyser.fftSize = 8192; 148 | analyser.smoothingTimeConstant = 0.1; 149 | track.connect(analyser); 150 | analyser.connect(audioContext.destination); 151 | this.audio = audioElement; 152 | this.context = audioContext; 153 | this.analyser = analyser; 154 | this.sampleRate = this.context.sampleRate; 155 | this.audioBuffer = null; 156 | } 157 | } 158 | 159 | /** 160 | * Gets the current frequency domain data from the playing audio track 161 | * @param {"frequency"|"music"|"voice"} [analysisType] 162 | * @param {number} [minDecibels] default -100 163 | * @param {number} [maxDecibels] default -30 164 | * @returns {AudioAnalysisOutputType} 165 | */ 166 | getFrequencies( 167 | analysisType = 'frequency', 168 | minDecibels = -100, 169 | maxDecibels = -30, 170 | ) { 171 | let fftResult = null; 172 | if (this.audioBuffer && this.fftResults.length) { 173 | const pct = this.audio.currentTime / this.audio.duration; 174 | const index = Math.min( 175 | (pct * this.fftResults.length) | 0, 176 | this.fftResults.length - 1, 177 | ); 178 | fftResult = this.fftResults[index]; 179 | } 180 | return AudioAnalysis.getFrequencies( 181 | this.analyser, 182 | this.sampleRate, 183 | fftResult, 184 | analysisType, 185 | minDecibels, 186 | maxDecibels, 187 | ); 188 | } 189 | 190 | /** 191 | * Resume the internal AudioContext if it was suspended due to the lack of 192 | * user interaction when the AudioAnalysis was instantiated. 193 | * @returns {Promise} 194 | */ 195 | async resumeIfSuspended() { 196 | if (this.context.state === 'suspended') { 197 | await this.context.resume(); 198 | } 199 | return true; 200 | } 201 | } 202 | 203 | globalThis.AudioAnalysis = AudioAnalysis; 204 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/analysis/constants.js: -------------------------------------------------------------------------------- 1 | /** 2 | * Constants for help with visualization 3 | * Helps map frequency ranges from Fast Fourier Transform 4 | * to human-interpretable ranges, notably music ranges and 5 | * human vocal ranges. 
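 * The exported "voice" subset below covers roughly 32 Hz to 2 kHz (C1 to B6).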
6 | */ 7 | 8 | // Eighth octave frequencies 9 | const octave8Frequencies = [ 10 | 4186.01, 4434.92, 4698.63, 4978.03, 5274.04, 5587.65, 5919.91, 6271.93, 11 | 6644.88, 7040.0, 7458.62, 7902.13, 12 | ]; 13 | 14 | // Labels for each of the above frequencies 15 | const octave8FrequencyLabels = [ 16 | 'C', 17 | 'C#', 18 | 'D', 19 | 'D#', 20 | 'E', 21 | 'F', 22 | 'F#', 23 | 'G', 24 | 'G#', 25 | 'A', 26 | 'A#', 27 | 'B', 28 | ]; 29 | 30 | /** 31 | * All note frequencies from 1st to 8th octave 32 | * in format "A#8" (A#, 8th octave) 33 | */ 34 | export const noteFrequencies = []; 35 | export const noteFrequencyLabels = []; 36 | for (let i = 1; i <= 8; i++) { 37 | for (let f = 0; f < octave8Frequencies.length; f++) { 38 | const freq = octave8Frequencies[f]; 39 | noteFrequencies.push(freq / Math.pow(2, 8 - i)); 40 | noteFrequencyLabels.push(octave8FrequencyLabels[f] + i); 41 | } 42 | } 43 | 44 | /** 45 | * Subset of the note frequencies between 32 and 2000 Hz 46 | * 6 octave range: C1 to B6 47 | */ 48 | const voiceFrequencyRange = [32.0, 2000.0]; 49 | export const voiceFrequencies = noteFrequencies.filter((_, i) => { 50 | return ( 51 | noteFrequencies[i] > voiceFrequencyRange[0] && 52 | noteFrequencies[i] < voiceFrequencyRange[1] 53 | ); 54 | }); 55 | export const voiceFrequencyLabels = noteFrequencyLabels.filter((_, i) => { 56 | return ( 57 | noteFrequencies[i] > voiceFrequencyRange[0] && 58 | noteFrequencies[i] < voiceFrequencyRange[1] 59 | ); 60 | }); 61 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/wav_packer.js: -------------------------------------------------------------------------------- 1 | /** 2 | * Raw wav audio file contents 3 | * @typedef {Object} WavPackerAudioType 4 | * @property {Blob} blob 5 | * @property {string} url 6 | * @property {number} channelCount 7 | * @property {number} sampleRate 8 | * @property {number} duration 9 | */ 10 | 11 | /** 12 | * Utility class for assembling PCM16 "audio/wav" data 13 | * @class 14 | */ 15 | export class WavPacker { 16 | /** 17 | * Converts Float32Array of amplitude data to ArrayBuffer in Int16Array format 18 | * @param {Float32Array} float32Array 19 | * @returns {ArrayBuffer} 20 | */ 21 | static floatTo16BitPCM(float32Array) { 22 | const buffer = new ArrayBuffer(float32Array.length * 2); 23 | const view = new DataView(buffer); 24 | let offset = 0; 25 | for (let i = 0; i < float32Array.length; i++, offset += 2) { 26 | let s = Math.max(-1, Math.min(1, float32Array[i])); 27 | view.setInt16(offset, s < 0 ? 
s * 0x8000 : s * 0x7fff, true); 28 | } 29 | return buffer; 30 | } 31 | 32 | /** 33 | * Concatenates two ArrayBuffers 34 | * @param {ArrayBuffer} leftBuffer 35 | * @param {ArrayBuffer} rightBuffer 36 | * @returns {ArrayBuffer} 37 | */ 38 | static mergeBuffers(leftBuffer, rightBuffer) { 39 | const tmpArray = new Uint8Array( 40 | leftBuffer.byteLength + rightBuffer.byteLength 41 | ); 42 | tmpArray.set(new Uint8Array(leftBuffer), 0); 43 | tmpArray.set(new Uint8Array(rightBuffer), leftBuffer.byteLength); 44 | return tmpArray.buffer; 45 | } 46 | 47 | /** 48 | * Packs data into an Int16 format 49 | * @private 50 | * @param {number} size 0 = 1x Int16, 1 = 2x Int16 51 | * @param {number} arg value to pack 52 | * @returns 53 | */ 54 | _packData(size, arg) { 55 | return [ 56 | new Uint8Array([arg, arg >> 8]), 57 | new Uint8Array([arg, arg >> 8, arg >> 16, arg >> 24]), 58 | ][size]; 59 | } 60 | 61 | /** 62 | * Packs audio into "audio/wav" Blob 63 | * @param {number} sampleRate 64 | * @param {{bitsPerSample: number, channels: Array, data: Int16Array}} audio 65 | * @returns {WavPackerAudioType} 66 | */ 67 | pack(sampleRate, audio) { 68 | if (!audio?.bitsPerSample) { 69 | throw new Error(`Missing "bitsPerSample"`); 70 | } else if (!audio?.channels) { 71 | throw new Error(`Missing "channels"`); 72 | } else if (!audio?.data) { 73 | throw new Error(`Missing "data"`); 74 | } 75 | const { bitsPerSample, channels, data } = audio; 76 | const output = [ 77 | // Header 78 | 'RIFF', 79 | this._packData( 80 | 1, 81 | 4 + (8 + 24) /* chunk 1 length */ + (8 + 8) /* chunk 2 length */ 82 | ), // Length 83 | 'WAVE', 84 | // chunk 1 85 | 'fmt ', // Sub-chunk identifier 86 | this._packData(1, 16), // Chunk length 87 | this._packData(0, 1), // Audio format (1 is linear quantization) 88 | this._packData(0, channels.length), 89 | this._packData(1, sampleRate), 90 | this._packData(1, (sampleRate * channels.length * bitsPerSample) / 8), // Byte rate 91 | this._packData(0, (channels.length * bitsPerSample) / 8), 92 | this._packData(0, bitsPerSample), 93 | // chunk 2 94 | 'data', // Sub-chunk identifier 95 | this._packData( 96 | 1, 97 | (channels[0].length * channels.length * bitsPerSample) / 8 98 | ), // Chunk length 99 | data, 100 | ]; 101 | const blob = new Blob(output, { type: 'audio/mpeg' }); 102 | const url = URL.createObjectURL(blob); 103 | return { 104 | blob, 105 | url, 106 | channelCount: channels.length, 107 | sampleRate, 108 | duration: data.byteLength / (channels.length * sampleRate * 2), 109 | }; 110 | } 111 | } 112 | 113 | globalThis.WavPacker = WavPacker; 114 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/wav_recorder.js: -------------------------------------------------------------------------------- 1 | import { AudioProcessorSrc } from './worklets/audio_processor.js'; 2 | import { AudioAnalysis } from './analysis/audio_analysis.js'; 3 | import { WavPacker } from './wav_packer.js'; 4 | 5 | /** 6 | * Decodes audio into a wav file 7 | * @typedef {Object} DecodedAudioType 8 | * @property {Blob} blob 9 | * @property {string} url 10 | * @property {Float32Array} values 11 | * @property {AudioBuffer} audioBuffer 12 | */ 13 | 14 | /** 15 | * Records live stream of user audio as PCM16 "audio/wav" data 16 | * @class 17 | */ 18 | export class WavRecorder { 19 | /** 20 | * Create a new WavRecorder instance 21 | * @param {{sampleRate?: number, outputToSpeakers?: boolean, debug?: boolean}} [options] 22 | * @returns {WavRecorder} 23 | */ 24 | constructor({ 25 | 
sampleRate = 44100, 26 | outputToSpeakers = false, 27 | debug = false, 28 | } = {}) { 29 | // Script source 30 | this.scriptSrc = AudioProcessorSrc; 31 | // Config 32 | this.sampleRate = sampleRate; 33 | this.outputToSpeakers = outputToSpeakers; 34 | this.debug = !!debug; 35 | this._deviceChangeCallback = null; 36 | this._devices = []; 37 | // State variables 38 | this.stream = null; 39 | this.processor = null; 40 | this.source = null; 41 | this.node = null; 42 | this.recording = false; 43 | // Event handling with AudioWorklet 44 | this._lastEventId = 0; 45 | this.eventReceipts = {}; 46 | this.eventTimeout = 5000; 47 | // Process chunks of audio 48 | this._chunkProcessor = () => {}; 49 | this._chunkProcessorSize = void 0; 50 | this._chunkProcessorBuffer = { 51 | raw: new ArrayBuffer(0), 52 | mono: new ArrayBuffer(0), 53 | }; 54 | } 55 | 56 | /** 57 | * Decodes audio data from multiple formats to a Blob, url, Float32Array and AudioBuffer 58 | * @param {Blob|Float32Array|Int16Array|ArrayBuffer|number[]} audioData 59 | * @param {number} sampleRate 60 | * @param {number} fromSampleRate 61 | * @returns {Promise} 62 | */ 63 | static async decode(audioData, sampleRate = 44100, fromSampleRate = -1) { 64 | const context = new AudioContext({ sampleRate }); 65 | let arrayBuffer; 66 | let blob; 67 | if (audioData instanceof Blob) { 68 | if (fromSampleRate !== -1) { 69 | throw new Error( 70 | `Can not specify "fromSampleRate" when reading from Blob`, 71 | ); 72 | } 73 | blob = audioData; 74 | arrayBuffer = await blob.arrayBuffer(); 75 | } else if (audioData instanceof ArrayBuffer) { 76 | if (fromSampleRate !== -1) { 77 | throw new Error( 78 | `Can not specify "fromSampleRate" when reading from ArrayBuffer`, 79 | ); 80 | } 81 | arrayBuffer = audioData; 82 | blob = new Blob([arrayBuffer], { type: 'audio/wav' }); 83 | } else { 84 | let float32Array; 85 | let data; 86 | if (audioData instanceof Int16Array) { 87 | data = audioData; 88 | float32Array = new Float32Array(audioData.length); 89 | for (let i = 0; i < audioData.length; i++) { 90 | float32Array[i] = audioData[i] / 0x8000; 91 | } 92 | } else if (audioData instanceof Float32Array) { 93 | float32Array = audioData; 94 | } else if (audioData instanceof Array) { 95 | float32Array = new Float32Array(audioData); 96 | } else { 97 | throw new Error( 98 | `"audioData" must be one of: Blob, Float32Arrray, Int16Array, ArrayBuffer, Array`, 99 | ); 100 | } 101 | if (fromSampleRate === -1) { 102 | throw new Error( 103 | `Must specify "fromSampleRate" when reading from Float32Array, In16Array or Array`, 104 | ); 105 | } else if (fromSampleRate < 3000) { 106 | throw new Error(`Minimum "fromSampleRate" is 3000 (3kHz)`); 107 | } 108 | if (!data) { 109 | data = WavPacker.floatTo16BitPCM(float32Array); 110 | } 111 | const audio = { 112 | bitsPerSample: 16, 113 | channels: [float32Array], 114 | data, 115 | }; 116 | const packer = new WavPacker(); 117 | const result = packer.pack(fromSampleRate, audio); 118 | blob = result.blob; 119 | arrayBuffer = await blob.arrayBuffer(); 120 | } 121 | const audioBuffer = await context.decodeAudioData(arrayBuffer); 122 | const values = audioBuffer.getChannelData(0); 123 | const url = URL.createObjectURL(blob); 124 | return { 125 | blob, 126 | url, 127 | values, 128 | audioBuffer, 129 | }; 130 | } 131 | 132 | /** 133 | * Logs data in debug mode 134 | * @param {...any} arguments 135 | * @returns {true} 136 | */ 137 | log() { 138 | if (this.debug) { 139 | this.log(...arguments); 140 | } 141 | return true; 142 | } 143 | 144 | /** 145 | * 
Retrieves the current sampleRate for the recorder 146 | * @returns {number} 147 | */ 148 | getSampleRate() { 149 | return this.sampleRate; 150 | } 151 | 152 | /** 153 | * Retrieves the current status of the recording 154 | * @returns {"ended"|"paused"|"recording"} 155 | */ 156 | getStatus() { 157 | if (!this.processor) { 158 | return 'ended'; 159 | } else if (!this.recording) { 160 | return 'paused'; 161 | } else { 162 | return 'recording'; 163 | } 164 | } 165 | 166 | /** 167 | * Sends an event to the AudioWorklet 168 | * @private 169 | * @param {string} name 170 | * @param {{[key: string]: any}} data 171 | * @param {AudioWorkletNode} [_processor] 172 | * @returns {Promise<{[key: string]: any}>} 173 | */ 174 | async _event(name, data = {}, _processor = null) { 175 | _processor = _processor || this.processor; 176 | if (!_processor) { 177 | throw new Error('Can not send events without recording first'); 178 | } 179 | const message = { 180 | event: name, 181 | id: this._lastEventId++, 182 | data, 183 | }; 184 | _processor.port.postMessage(message); 185 | const t0 = new Date().valueOf(); 186 | while (!this.eventReceipts[message.id]) { 187 | if (new Date().valueOf() - t0 > this.eventTimeout) { 188 | throw new Error(`Timeout waiting for "${name}" event`); 189 | } 190 | await new Promise((res) => setTimeout(() => res(true), 1)); 191 | } 192 | const payload = this.eventReceipts[message.id]; 193 | delete this.eventReceipts[message.id]; 194 | return payload; 195 | } 196 | 197 | /** 198 | * Sets device change callback, remove if callback provided is `null` 199 | * @param {(Array): void|null} callback 200 | * @returns {true} 201 | */ 202 | listenForDeviceChange(callback) { 203 | if (callback === null && this._deviceChangeCallback) { 204 | navigator.mediaDevices.removeEventListener( 205 | 'devicechange', 206 | this._deviceChangeCallback, 207 | ); 208 | this._deviceChangeCallback = null; 209 | } else if (callback !== null) { 210 | // Basically a debounce; we only want this called once when devices change 211 | // And we only want the most recent callback() to be executed 212 | // if a few are operating at the same time 213 | let lastId = 0; 214 | let lastDevices = []; 215 | const serializeDevices = (devices) => 216 | devices 217 | .map((d) => d.deviceId) 218 | .sort() 219 | .join(','); 220 | const cb = async () => { 221 | let id = ++lastId; 222 | const devices = await this.listDevices(); 223 | if (id === lastId) { 224 | if (serializeDevices(lastDevices) !== serializeDevices(devices)) { 225 | lastDevices = devices; 226 | callback(devices.slice()); 227 | } 228 | } 229 | }; 230 | navigator.mediaDevices.addEventListener('devicechange', cb); 231 | cb(); 232 | this._deviceChangeCallback = cb; 233 | } 234 | return true; 235 | } 236 | 237 | /** 238 | * Manually request permission to use the microphone 239 | * @returns {Promise} 240 | */ 241 | async requestPermission() { 242 | const permissionStatus = await navigator.permissions.query({ 243 | name: 'microphone', 244 | }); 245 | if (permissionStatus.state === 'denied') { 246 | window.alert('You must grant microphone access to use this feature.'); 247 | } else if (permissionStatus.state === 'prompt') { 248 | try { 249 | const stream = await navigator.mediaDevices.getUserMedia({ 250 | audio: true, 251 | }); 252 | const tracks = stream.getTracks(); 253 | tracks.forEach((track) => track.stop()); 254 | } catch (e) { 255 | window.alert('You must grant microphone access to use this feature.'); 256 | } 257 | } 258 | return true; 259 | } 260 | 261 | /** 262 | * List all 
eligible devices for recording, will request permission to use microphone 263 | * @returns {Promise>} 264 | */ 265 | async listDevices() { 266 | if ( 267 | !navigator.mediaDevices || 268 | !('enumerateDevices' in navigator.mediaDevices) 269 | ) { 270 | throw new Error('Could not request user devices'); 271 | } 272 | await this.requestPermission(); 273 | const devices = await navigator.mediaDevices.enumerateDevices(); 274 | const audioDevices = devices.filter( 275 | (device) => device.kind === 'audioinput', 276 | ); 277 | const defaultDeviceIndex = audioDevices.findIndex( 278 | (device) => device.deviceId === 'default', 279 | ); 280 | const deviceList = []; 281 | if (defaultDeviceIndex !== -1) { 282 | let defaultDevice = audioDevices.splice(defaultDeviceIndex, 1)[0]; 283 | let existingIndex = audioDevices.findIndex( 284 | (device) => device.groupId === defaultDevice.groupId, 285 | ); 286 | if (existingIndex !== -1) { 287 | defaultDevice = audioDevices.splice(existingIndex, 1)[0]; 288 | } 289 | defaultDevice.default = true; 290 | deviceList.push(defaultDevice); 291 | } 292 | return deviceList.concat(audioDevices); 293 | } 294 | 295 | /** 296 | * Begins a recording session and requests microphone permissions if not already granted 297 | * Microphone recording indicator will appear on browser tab but status will be "paused" 298 | * @param {string} [deviceId] if no device provided, default device will be used 299 | * @returns {Promise} 300 | */ 301 | async begin(deviceId) { 302 | if (this.processor) { 303 | throw new Error( 304 | `Already connected: please call .end() to start a new session`, 305 | ); 306 | } 307 | 308 | if ( 309 | !navigator.mediaDevices || 310 | !('getUserMedia' in navigator.mediaDevices) 311 | ) { 312 | throw new Error('Could not request user media'); 313 | } 314 | try { 315 | const config = { audio: true }; 316 | if (deviceId) { 317 | config.audio = { deviceId: { exact: deviceId } }; 318 | } 319 | this.stream = await navigator.mediaDevices.getUserMedia(config); 320 | } catch (err) { 321 | throw new Error('Could not start media stream'); 322 | } 323 | 324 | const context = new AudioContext({ sampleRate: this.sampleRate }); 325 | const source = context.createMediaStreamSource(this.stream); 326 | // Load and execute the module script. 
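// scriptSrc (AudioProcessorSrc) is a Blob object URL holding the inlined worklet
// source from worklets/audio_processor.js; addModule() must resolve before the
// 'audio_processor' AudioWorkletNode below can be constructed.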
327 | try { 328 | await context.audioWorklet.addModule(this.scriptSrc); 329 | } catch (e) { 330 | console.error(e); 331 | throw new Error(`Could not add audioWorklet module: ${this.scriptSrc}`); 332 | } 333 | const processor = new AudioWorkletNode(context, 'audio_processor'); 334 | processor.port.onmessage = (e) => { 335 | const { event, id, data } = e.data; 336 | if (event === 'receipt') { 337 | this.eventReceipts[id] = data; 338 | } else if (event === 'chunk') { 339 | if (this._chunkProcessorSize) { 340 | const buffer = this._chunkProcessorBuffer; 341 | this._chunkProcessorBuffer = { 342 | raw: WavPacker.mergeBuffers(buffer.raw, data.raw), 343 | mono: WavPacker.mergeBuffers(buffer.mono, data.mono), 344 | }; 345 | if ( 346 | this._chunkProcessorBuffer.mono.byteLength >= 347 | this._chunkProcessorSize 348 | ) { 349 | this._chunkProcessor(this._chunkProcessorBuffer); 350 | this._chunkProcessorBuffer = { 351 | raw: new ArrayBuffer(0), 352 | mono: new ArrayBuffer(0), 353 | }; 354 | } 355 | } else { 356 | this._chunkProcessor(data); 357 | } 358 | } 359 | }; 360 | 361 | const node = source.connect(processor); 362 | const analyser = context.createAnalyser(); 363 | analyser.fftSize = 8192; 364 | analyser.smoothingTimeConstant = 0.1; 365 | node.connect(analyser); 366 | if (this.outputToSpeakers) { 367 | // eslint-disable-next-line no-console 368 | console.warn( 369 | 'Warning: Output to speakers may affect sound quality,\n' + 370 | 'especially due to system audio feedback preventative measures.\n' + 371 | 'use only for debugging', 372 | ); 373 | analyser.connect(context.destination); 374 | } 375 | 376 | this.source = source; 377 | this.node = node; 378 | this.analyser = analyser; 379 | this.processor = processor; 380 | return true; 381 | } 382 | 383 | /** 384 | * Gets the current frequency domain data from the recording track 385 | * @param {"frequency"|"music"|"voice"} [analysisType] 386 | * @param {number} [minDecibels] default -100 387 | * @param {number} [maxDecibels] default -30 388 | * @returns {import('./analysis/audio_analysis.js').AudioAnalysisOutputType} 389 | */ 390 | getFrequencies( 391 | analysisType = 'frequency', 392 | minDecibels = -100, 393 | maxDecibels = -30, 394 | ) { 395 | if (!this.processor) { 396 | throw new Error('Session ended: please call .begin() first'); 397 | } 398 | return AudioAnalysis.getFrequencies( 399 | this.analyser, 400 | this.sampleRate, 401 | null, 402 | analysisType, 403 | minDecibels, 404 | maxDecibels, 405 | ); 406 | } 407 | 408 | /** 409 | * Pauses the recording 410 | * Keeps microphone stream open but halts storage of audio 411 | * @returns {Promise} 412 | */ 413 | async pause() { 414 | if (!this.processor) { 415 | throw new Error('Session ended: please call .begin() first'); 416 | } else if (!this.recording) { 417 | throw new Error('Already paused: please call .record() first'); 418 | } 419 | if (this._chunkProcessorBuffer.raw.byteLength) { 420 | this._chunkProcessor(this._chunkProcessorBuffer); 421 | } 422 | this.log('Pausing ...'); 423 | await this._event('stop'); 424 | this.recording = false; 425 | return true; 426 | } 427 | 428 | /** 429 | * Start recording stream and storing to memory from the connected audio source 430 | * @param {(data: { mono: Int16Array; raw: Int16Array }) => any} [chunkProcessor] 431 | * @param {number} [chunkSize] chunkProcessor will not be triggered until this size threshold met in mono audio 432 | * @returns {Promise} 433 | */ 434 | async record(chunkProcessor = () => {}, chunkSize = 8192) { 435 | if (!this.processor) { 
436 | throw new Error('Session ended: please call .begin() first'); 437 | } else if (this.recording) { 438 | throw new Error('Already recording: please call .pause() first'); 439 | } else if (typeof chunkProcessor !== 'function') { 440 | throw new Error(`chunkProcessor must be a function`); 441 | } 442 | this._chunkProcessor = chunkProcessor; 443 | this._chunkProcessorSize = chunkSize; 444 | this._chunkProcessorBuffer = { 445 | raw: new ArrayBuffer(0), 446 | mono: new ArrayBuffer(0), 447 | }; 448 | this.log('Recording ...'); 449 | await this._event('start'); 450 | this.recording = true; 451 | return true; 452 | } 453 | 454 | /** 455 | * Clears the audio buffer, empties stored recording 456 | * @returns {Promise} 457 | */ 458 | async clear() { 459 | if (!this.processor) { 460 | throw new Error('Session ended: please call .begin() first'); 461 | } 462 | await this._event('clear'); 463 | return true; 464 | } 465 | 466 | /** 467 | * Reads the current audio stream data 468 | * @returns {Promise<{meanValues: Float32Array, channels: Array}>} 469 | */ 470 | async read() { 471 | if (!this.processor) { 472 | throw new Error('Session ended: please call .begin() first'); 473 | } 474 | this.log('Reading ...'); 475 | const result = await this._event('read'); 476 | return result; 477 | } 478 | 479 | /** 480 | * Saves the current audio stream to a file 481 | * @param {boolean} [force] Force saving while still recording 482 | * @returns {Promise} 483 | */ 484 | async save(force = false) { 485 | if (!this.processor) { 486 | throw new Error('Session ended: please call .begin() first'); 487 | } 488 | if (!force && this.recording) { 489 | throw new Error( 490 | 'Currently recording: please call .pause() first, or call .save(true) to force', 491 | ); 492 | } 493 | this.log('Exporting ...'); 494 | const exportData = await this._event('export'); 495 | const packer = new WavPacker(); 496 | const result = packer.pack(this.sampleRate, exportData.audio); 497 | return result; 498 | } 499 | 500 | /** 501 | * Ends the current recording session and saves the result 502 | * @returns {Promise} 503 | */ 504 | async end() { 505 | if (!this.processor) { 506 | throw new Error('Session ended: please call .begin() first'); 507 | } 508 | 509 | const _processor = this.processor; 510 | 511 | this.log('Stopping ...'); 512 | await this._event('stop'); 513 | this.recording = false; 514 | const tracks = this.stream.getTracks(); 515 | tracks.forEach((track) => track.stop()); 516 | 517 | this.log('Exporting ...'); 518 | const exportData = await this._event('export', {}, _processor); 519 | 520 | this.processor.disconnect(); 521 | this.source.disconnect(); 522 | this.node.disconnect(); 523 | this.analyser.disconnect(); 524 | this.stream = null; 525 | this.processor = null; 526 | this.source = null; 527 | this.node = null; 528 | 529 | const packer = new WavPacker(); 530 | const result = packer.pack(this.sampleRate, exportData.audio); 531 | return result; 532 | } 533 | 534 | /** 535 | * Performs a full cleanup of WavRecorder instance 536 | * Stops actively listening via microphone and removes existing listeners 537 | * @returns {Promise} 538 | */ 539 | async quit() { 540 | this.listenForDeviceChange(null); 541 | if (this.processor) { 542 | await this.end(); 543 | } 544 | return true; 545 | } 546 | } 547 | 548 | globalThis.WavRecorder = WavRecorder; 549 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/wav_stream_player.js: 
-------------------------------------------------------------------------------- 1 | import { StreamProcessorSrc } from './worklets/stream_processor.js'; 2 | import { AudioAnalysis } from './analysis/audio_analysis.js'; 3 | 4 | /** 5 | * Plays audio streams received in raw PCM16 chunks from the browser 6 | * @class 7 | */ 8 | export class WavStreamPlayer { 9 | /** 10 | * Creates a new WavStreamPlayer instance 11 | * @param {{sampleRate?: number}} options 12 | * @returns {WavStreamPlayer} 13 | */ 14 | constructor({ sampleRate = 44100 } = {}) { 15 | this.scriptSrc = StreamProcessorSrc; 16 | this.sampleRate = sampleRate; 17 | this.context = null; 18 | this.stream = null; 19 | this.analyser = null; 20 | this.trackSampleOffsets = {}; 21 | this.interruptedTrackIds = {}; 22 | } 23 | 24 | /** 25 | * Connects the audio context and enables output to speakers 26 | * @returns {Promise} 27 | */ 28 | async connect() { 29 | this.context = new AudioContext({ sampleRate: this.sampleRate }); 30 | if (this.context.state === 'suspended') { 31 | await this.context.resume(); 32 | } 33 | try { 34 | await this.context.audioWorklet.addModule(this.scriptSrc); 35 | } catch (e) { 36 | console.error(e); 37 | throw new Error(`Could not add audioWorklet module: ${this.scriptSrc}`); 38 | } 39 | const analyser = this.context.createAnalyser(); 40 | analyser.fftSize = 8192; 41 | analyser.smoothingTimeConstant = 0.1; 42 | this.analyser = analyser; 43 | return true; 44 | } 45 | 46 | /** 47 | * Gets the current frequency domain data from the playing track 48 | * @param {"frequency"|"music"|"voice"} [analysisType] 49 | * @param {number} [minDecibels] default -100 50 | * @param {number} [maxDecibels] default -30 51 | * @returns {import('./analysis/audio_analysis.js').AudioAnalysisOutputType} 52 | */ 53 | getFrequencies( 54 | analysisType = 'frequency', 55 | minDecibels = -100, 56 | maxDecibels = -30 57 | ) { 58 | if (!this.analyser) { 59 | throw new Error('Not connected, please call .connect() first'); 60 | } 61 | return AudioAnalysis.getFrequencies( 62 | this.analyser, 63 | this.sampleRate, 64 | null, 65 | analysisType, 66 | minDecibels, 67 | maxDecibels 68 | ); 69 | } 70 | 71 | /** 72 | * Starts audio streaming 73 | * @private 74 | * @returns {Promise} 75 | */ 76 | _start() { 77 | const streamNode = new AudioWorkletNode(this.context, 'stream_processor'); 78 | streamNode.connect(this.context.destination); 79 | streamNode.port.onmessage = (e) => { 80 | const { event } = e.data; 81 | if (event === 'stop') { 82 | streamNode.disconnect(); 83 | this.stream = null; 84 | } else if (event === 'offset') { 85 | const { requestId, trackId, offset } = e.data; 86 | const currentTime = offset / this.sampleRate; 87 | this.trackSampleOffsets[requestId] = { trackId, offset, currentTime }; 88 | } 89 | }; 90 | this.analyser.disconnect(); 91 | streamNode.connect(this.analyser); 92 | this.stream = streamNode; 93 | return true; 94 | } 95 | 96 | /** 97 | * Adds 16BitPCM data to the currently playing audio stream 98 | * You can add chunks beyond the current play point and they will be queued for play 99 | * @param {ArrayBuffer|Int16Array} arrayBuffer 100 | * @param {string} [trackId] 101 | * @returns {Int16Array} 102 | */ 103 | add16BitPCM(arrayBuffer, trackId = 'default') { 104 | if (typeof trackId !== 'string') { 105 | throw new Error(`trackId must be a string`); 106 | } else if (this.interruptedTrackIds[trackId]) { 107 | return; 108 | } 109 | if (!this.stream) { 110 | this._start(); 111 | } 112 | let buffer; 113 | if (arrayBuffer instanceof 
Int16Array) { 114 | buffer = arrayBuffer; 115 | } else if (arrayBuffer instanceof ArrayBuffer) { 116 | buffer = new Int16Array(arrayBuffer); 117 | } else { 118 | throw new Error(`argument must be Int16Array or ArrayBuffer`); 119 | } 120 | this.stream.port.postMessage({ event: 'write', buffer, trackId }); 121 | return buffer; 122 | } 123 | 124 | /** 125 | * Gets the offset (sample count) of the currently playing stream 126 | * @param {boolean} [interrupt] 127 | * @returns {{trackId: string|null, offset: number, currentTime: number}} 128 | */ 129 | async getTrackSampleOffset(interrupt = false) { 130 | if (!this.stream) { 131 | return null; 132 | } 133 | const requestId = crypto.randomUUID(); 134 | this.stream.port.postMessage({ 135 | event: interrupt ? 'interrupt' : 'offset', 136 | requestId, 137 | }); 138 | let trackSampleOffset; 139 | while (!trackSampleOffset) { 140 | trackSampleOffset = this.trackSampleOffsets[requestId]; 141 | await new Promise((r) => setTimeout(() => r(), 1)); 142 | } 143 | const { trackId } = trackSampleOffset; 144 | if (interrupt && trackId) { 145 | this.interruptedTrackIds[trackId] = true; 146 | } 147 | return trackSampleOffset; 148 | } 149 | 150 | /** 151 | * Strips the current stream and returns the sample offset of the audio 152 | * @param {boolean} [interrupt] 153 | * @returns {{trackId: string|null, offset: number, currentTime: number}} 154 | */ 155 | async interrupt() { 156 | return this.getTrackSampleOffset(true); 157 | } 158 | } 159 | 160 | globalThis.WavStreamPlayer = WavStreamPlayer; 161 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/worklets/audio_processor.js: -------------------------------------------------------------------------------- 1 | const AudioProcessorWorklet = ` 2 | class AudioProcessor extends AudioWorkletProcessor { 3 | 4 | constructor() { 5 | super(); 6 | this.port.onmessage = this.receive.bind(this); 7 | this.initialize(); 8 | } 9 | 10 | initialize() { 11 | this.foundAudio = false; 12 | this.recording = false; 13 | this.chunks = []; 14 | } 15 | 16 | /** 17 | * Concatenates sampled chunks into channels 18 | * Format is chunk[Left[], Right[]] 19 | */ 20 | readChannelData(chunks, channel = -1, maxChannels = 9) { 21 | let channelLimit; 22 | if (channel !== -1) { 23 | if (chunks[0] && chunks[0].length - 1 < channel) { 24 | throw new Error( 25 | \`Channel \${channel} out of range: max \${chunks[0].length}\` 26 | ); 27 | } 28 | channelLimit = channel + 1; 29 | } else { 30 | channel = 0; 31 | channelLimit = Math.min(chunks[0] ? chunks[0].length : 1, maxChannels); 32 | } 33 | const channels = []; 34 | for (let n = channel; n < channelLimit; n++) { 35 | const length = chunks.reduce((sum, chunk) => { 36 | return sum + chunk[n].length; 37 | }, 0); 38 | const buffers = chunks.map((chunk) => chunk[n]); 39 | const result = new Float32Array(length); 40 | let offset = 0; 41 | for (let i = 0; i < buffers.length; i++) { 42 | result.set(buffers[i], offset); 43 | offset += buffers[i].length; 44 | } 45 | channels[n] = result; 46 | } 47 | return channels; 48 | } 49 | 50 | /** 51 | * Combines parallel audio data into correct format, 52 | * channels[Left[], Right[]] to float32Array[LRLRLRLR...] 
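 * Also returns per-sample mean values across channels, which become the mono data for 'chunk' messages.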
53 | */ 54 | formatAudioData(channels) { 55 | if (channels.length === 1) { 56 | // Simple case is only one channel 57 | const float32Array = channels[0].slice(); 58 | const meanValues = channels[0].slice(); 59 | return { float32Array, meanValues }; 60 | } else { 61 | const float32Array = new Float32Array( 62 | channels[0].length * channels.length 63 | ); 64 | const meanValues = new Float32Array(channels[0].length); 65 | for (let i = 0; i < channels[0].length; i++) { 66 | const offset = i * channels.length; 67 | let meanValue = 0; 68 | for (let n = 0; n < channels.length; n++) { 69 | float32Array[offset + n] = channels[n][i]; 70 | meanValue += channels[n][i]; 71 | } 72 | meanValues[i] = meanValue / channels.length; 73 | } 74 | return { float32Array, meanValues }; 75 | } 76 | } 77 | 78 | /** 79 | * Converts 32-bit float data to 16-bit integers 80 | */ 81 | floatTo16BitPCM(float32Array) { 82 | const buffer = new ArrayBuffer(float32Array.length * 2); 83 | const view = new DataView(buffer); 84 | let offset = 0; 85 | for (let i = 0; i < float32Array.length; i++, offset += 2) { 86 | let s = Math.max(-1, Math.min(1, float32Array[i])); 87 | view.setInt16(offset, s < 0 ? s * 0x8000 : s * 0x7fff, true); 88 | } 89 | return buffer; 90 | } 91 | 92 | /** 93 | * Retrieves the most recent amplitude values from the audio stream 94 | * @param {number} channel 95 | */ 96 | getValues(channel = -1) { 97 | const channels = this.readChannelData(this.chunks, channel); 98 | const { meanValues } = this.formatAudioData(channels); 99 | return { meanValues, channels }; 100 | } 101 | 102 | /** 103 | * Exports chunks as an audio/wav file 104 | */ 105 | export() { 106 | const channels = this.readChannelData(this.chunks); 107 | const { float32Array, meanValues } = this.formatAudioData(channels); 108 | const audioData = this.floatTo16BitPCM(float32Array); 109 | return { 110 | meanValues: meanValues, 111 | audio: { 112 | bitsPerSample: 16, 113 | channels: channels, 114 | data: audioData, 115 | }, 116 | }; 117 | } 118 | 119 | receive(e) { 120 | const { event, id } = e.data; 121 | let receiptData = {}; 122 | switch (event) { 123 | case 'start': 124 | this.recording = true; 125 | break; 126 | case 'stop': 127 | this.recording = false; 128 | break; 129 | case 'clear': 130 | this.initialize(); 131 | break; 132 | case 'export': 133 | receiptData = this.export(); 134 | break; 135 | case 'read': 136 | receiptData = this.getValues(); 137 | break; 138 | default: 139 | break; 140 | } 141 | // Always send back receipt 142 | this.port.postMessage({ event: 'receipt', id, data: receiptData }); 143 | } 144 | 145 | sendChunk(chunk) { 146 | const channels = this.readChannelData([chunk]); 147 | const { float32Array, meanValues } = this.formatAudioData(channels); 148 | const rawAudioData = this.floatTo16BitPCM(float32Array); 149 | const monoAudioData = this.floatTo16BitPCM(meanValues); 150 | this.port.postMessage({ 151 | event: 'chunk', 152 | data: { 153 | mono: monoAudioData, 154 | raw: rawAudioData, 155 | }, 156 | }); 157 | } 158 | 159 | process(inputList, outputList, parameters) { 160 | // Copy input to output (e.g. 
speakers) 161 | // Note that this creates choppy sounds with Mac products 162 | const sourceLimit = Math.min(inputList.length, outputList.length); 163 | for (let inputNum = 0; inputNum < sourceLimit; inputNum++) { 164 | const input = inputList[inputNum]; 165 | const output = outputList[inputNum]; 166 | const channelCount = Math.min(input.length, output.length); 167 | for (let channelNum = 0; channelNum < channelCount; channelNum++) { 168 | input[channelNum].forEach((sample, i) => { 169 | output[channelNum][i] = sample; 170 | }); 171 | } 172 | } 173 | const inputs = inputList[0]; 174 | // There's latency at the beginning of a stream before recording starts 175 | // Make sure we actually receive audio data before we start storing chunks 176 | let sliceIndex = 0; 177 | if (!this.foundAudio) { 178 | for (const channel of inputs) { 179 | sliceIndex = 0; // reset for each channel 180 | if (this.foundAudio) { 181 | break; 182 | } 183 | if (channel) { 184 | for (const value of channel) { 185 | if (value !== 0) { 186 | // find only one non-zero entry in any channel 187 | this.foundAudio = true; 188 | break; 189 | } else { 190 | sliceIndex++; 191 | } 192 | } 193 | } 194 | } 195 | } 196 | if (inputs && inputs[0] && this.foundAudio && this.recording) { 197 | // We need to copy the TypedArray, because the \`process\` 198 | // internals will reuse the same buffer to hold each input 199 | const chunk = inputs.map((input) => input.slice(sliceIndex)); 200 | this.chunks.push(chunk); 201 | this.sendChunk(chunk); 202 | } 203 | return true; 204 | } 205 | } 206 | 207 | registerProcessor('audio_processor', AudioProcessor); 208 | `; 209 | 210 | const script = new Blob([AudioProcessorWorklet], { 211 | type: 'application/javascript', 212 | }); 213 | const src = URL.createObjectURL(script); 214 | export const AudioProcessorSrc = src; 215 | -------------------------------------------------------------------------------- /src/lib/wavtools/lib/worklets/stream_processor.js: -------------------------------------------------------------------------------- 1 | export const StreamProcessorWorklet = ` 2 | class StreamProcessor extends AudioWorkletProcessor { 3 | constructor() { 4 | super(); 5 | this.hasStarted = false; 6 | this.hasInterrupted = false; 7 | this.outputBuffers = []; 8 | this.bufferLength = 128; 9 | this.write = { buffer: new Float32Array(this.bufferLength), trackId: null }; 10 | this.writeOffset = 0; 11 | this.trackSampleOffsets = {}; 12 | this.port.onmessage = (event) => { 13 | if (event.data) { 14 | const payload = event.data; 15 | if (payload.event === 'write') { 16 | const int16Array = payload.buffer; 17 | const float32Array = new Float32Array(int16Array.length); 18 | for (let i = 0; i < int16Array.length; i++) { 19 | float32Array[i] = int16Array[i] / 0x8000; // Convert Int16 to Float32 20 | } 21 | this.writeData(float32Array, payload.trackId); 22 | } else if ( 23 | payload.event === 'offset' || 24 | payload.event === 'interrupt' 25 | ) { 26 | const requestId = payload.requestId; 27 | const trackId = this.write.trackId; 28 | const offset = this.trackSampleOffsets[trackId] || 0; 29 | this.port.postMessage({ 30 | event: 'offset', 31 | requestId, 32 | trackId, 33 | offset, 34 | }); 35 | if (payload.event === 'interrupt') { 36 | this.hasInterrupted = true; 37 | } 38 | } else { 39 | throw new Error(\`Unhandled event "\${payload.event}"\`); 40 | } 41 | } 42 | }; 43 | } 44 | 45 | writeData(float32Array, trackId = null) { 46 | let { buffer } = this.write; 47 | let offset = this.writeOffset; 48 | for (let i = 0; i < 
float32Array.length; i++) { 49 | buffer[offset++] = float32Array[i]; 50 | if (offset >= buffer.length) { 51 | this.outputBuffers.push(this.write); 52 | this.write = { buffer: new Float32Array(this.bufferLength), trackId }; 53 | buffer = this.write.buffer; 54 | offset = 0; 55 | } 56 | } 57 | this.writeOffset = offset; 58 | return true; 59 | } 60 | 61 | process(inputs, outputs, parameters) { 62 | const output = outputs[0]; 63 | const outputChannelData = output[0]; 64 | const outputBuffers = this.outputBuffers; 65 | if (this.hasInterrupted) { 66 | this.port.postMessage({ event: 'stop' }); 67 | return false; 68 | } else if (outputBuffers.length) { 69 | this.hasStarted = true; 70 | const { buffer, trackId } = outputBuffers.shift(); 71 | for (let i = 0; i < outputChannelData.length; i++) { 72 | outputChannelData[i] = buffer[i] || 0; 73 | } 74 | if (trackId) { 75 | this.trackSampleOffsets[trackId] = 76 | this.trackSampleOffsets[trackId] || 0; 77 | this.trackSampleOffsets[trackId] += buffer.length; 78 | } 79 | return true; 80 | } else if (this.hasStarted) { 81 | this.port.postMessage({ event: 'stop' }); 82 | return false; 83 | } else { 84 | return true; 85 | } 86 | } 87 | } 88 | 89 | registerProcessor('stream_processor', StreamProcessor); 90 | `; 91 | 92 | const script = new Blob([StreamProcessorWorklet], { 93 | type: 'application/javascript', 94 | }); 95 | const src = URL.createObjectURL(script); 96 | export const StreamProcessorSrc = src; 97 | -------------------------------------------------------------------------------- /src/logo.svg: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/pages/ConsolePage.scss: -------------------------------------------------------------------------------- 1 | [data-component='ConsolePage'] { 2 | font-family: 'Roboto Mono', monospace; 3 | font-weight: 400; 4 | font-style: normal; 5 | font-size: 12px; 6 | height: 100%; 7 | display: flex; 8 | flex-direction: column; 9 | overflow: hidden; 10 | margin: 0px 8px; 11 | & > div { 12 | flex-shrink: 0; 13 | } 14 | 15 | .spacer { 16 | flex-grow: 1; 17 | } 18 | 19 | .content-top { 20 | display: flex; 21 | align-items: center; 22 | padding: 8px 16px; 23 | min-height: 40px; 24 | .content-title { 25 | flex-grow: 1; 26 | display: flex; 27 | align-items: center; 28 | gap: 12px; 29 | img { 30 | width: 24px; 31 | height: 24px; 32 | } 33 | } 34 | } 35 | 36 | .content-main { 37 | flex-grow: 1; 38 | flex-shrink: 1 !important; 39 | margin: 0px 16px; 40 | display: flex; 41 | overflow: hidden; 42 | margin-bottom: 24px; 43 | .content-block { 44 | position: relative; 45 | display: flex; 46 | flex-direction: column; 47 | max-height: 100%; 48 | width: 100%; 49 | .content-block-title { 50 | flex-shrink: 0; 51 | padding-top: 16px; 52 | padding-bottom: 4px; 53 | position: relative; 54 | } 55 | .content-block-body { 56 | color: #6e6e7f; 57 | position: relative; 58 | flex-grow: 1; 59 | padding: 8px 0px; 60 | padding-top: 4px; 61 | line-height: 1.2em; 62 | overflow: auto; 63 | &.full { 64 | padding: 0px; 65 | } 66 | } 67 | } 68 | .content-right { 69 | width: 300px; 70 | flex-shrink: 0; 71 | display: flex; 72 | flex-direction: column; 73 | margin-left: 24px; 74 | gap: 24px; 75 | & > div { 76 | border-radius: 16px; 77 | flex-grow: 1; 78 | flex-shrink: 0; 79 | overflow: hidden; 80 | position: relative; 81 | .content-block-title { 82 | position: absolute; 83 | display: flex; 84 | align-items: center; 85 | justify-content: center; 
86 | line-height: 2em; 87 | top: 16px; 88 | left: 16px; 89 | padding: 4px 16px; 90 | background-color: #fff; 91 | border-radius: 1000px; 92 | min-height: 32px; 93 | z-index: 9999; 94 | text-align: center; 95 | white-space: pre; 96 | &.bottom { 97 | top: auto; 98 | bottom: 16px; 99 | right: 16px; 100 | } 101 | } 102 | } 103 | & > div.kv { 104 | height: 250px; 105 | max-height: 250px; 106 | white-space: pre; 107 | background-color: #ececf1; 108 | .content-block-body { 109 | padding: 16px; 110 | margin-top: 56px; 111 | } 112 | } 113 | } 114 | .content-logs { 115 | flex-grow: 1; 116 | display: flex; 117 | flex-direction: column; 118 | overflow: hidden; 119 | & > div { 120 | flex-grow: 1; 121 | } 122 | & > .content-actions { 123 | flex-grow: 0; 124 | flex-shrink: 0; 125 | display: flex; 126 | align-items: center; 127 | justify-content: center; 128 | gap: 16px; 129 | } 130 | & > div.events { 131 | overflow: hidden; 132 | } 133 | .events { 134 | border-top: 1px solid #e7e7e7; 135 | } 136 | .conversation { 137 | display: flex; 138 | flex-shrink: 0; 139 | width: 100%; 140 | overflow: hidden; 141 | height: 200px; 142 | min-height: 0; 143 | max-height: 200px; 144 | border-top: 1px solid #e7e7e7; 145 | } 146 | } 147 | } 148 | 149 | .conversation-item { 150 | position: relative; 151 | display: flex; 152 | gap: 16px; 153 | margin-bottom: 16px; 154 | &:not(:hover) .close { 155 | display: none; 156 | } 157 | .close { 158 | position: absolute; 159 | top: 0px; 160 | right: -20px; 161 | background: #aaa; 162 | color: #fff; 163 | display: flex; 164 | border-radius: 16px; 165 | padding: 2px; 166 | cursor: pointer; 167 | &:hover { 168 | background: #696969; 169 | } 170 | svg { 171 | stroke-width: 3; 172 | width: 12px; 173 | height: 12px; 174 | } 175 | } 176 | .speaker { 177 | position: relative; 178 | text-align: left; 179 | gap: 16px; 180 | width: 80px; 181 | flex-shrink: 0; 182 | margin-right: 16px; 183 | &.user { 184 | color: #0099ff; 185 | } 186 | &.assistant { 187 | color: #009900; 188 | } 189 | } 190 | .speaker-content { 191 | color: #18181b; 192 | overflow: hidden; 193 | word-wrap: break-word; 194 | } 195 | } 196 | 197 | .event { 198 | border-radius: 3px; 199 | white-space: pre; 200 | display: flex; 201 | padding: 0px; 202 | gap: 16px; 203 | .event-timestamp { 204 | text-align: left; 205 | gap: 8px; 206 | padding: 4px 0px; 207 | width: 80px; 208 | flex-shrink: 0; 209 | margin-right: 16px; 210 | } 211 | .event-details { 212 | display: flex; 213 | flex-direction: column; 214 | color: #18181b; 215 | gap: 8px; 216 | .event-summary { 217 | padding: 4px 8px; 218 | margin: 0px -8px; 219 | &:hover { 220 | border-radius: 8px; 221 | background-color: #f0f0f0; 222 | } 223 | cursor: pointer; 224 | display: flex; 225 | gap: 8px; 226 | align-items: center; 227 | .event-source { 228 | flex-shrink: 0; 229 | display: flex; 230 | align-items: center; 231 | gap: 8px; 232 | &.client { 233 | color: #0099ff; 234 | } 235 | &.server { 236 | color: #009900; 237 | } 238 | &.error { 239 | color: #990000; 240 | } 241 | svg { 242 | stroke-width: 3; 243 | width: 12px; 244 | height: 12px; 245 | } 246 | } 247 | } 248 | } 249 | } 250 | 251 | .visualization { 252 | position: absolute; 253 | display: flex; 254 | bottom: 4px; 255 | right: 8px; 256 | padding: 4px; 257 | border-radius: 16px; 258 | z-index: 10; 259 | gap: 2px; 260 | .visualization-entry { 261 | position: relative; 262 | display: flex; 263 | align-items: center; 264 | height: 40px; 265 | width: 100px; 266 | gap: 4px; 267 | &.client { 268 | color: #0099ff; 269 | } 270 | 
&.server { 271 | color: #009900; 272 | } 273 | canvas { 274 | width: 100%; 275 | height: 100%; 276 | color: currentColor; 277 | } 278 | } 279 | } 280 | } 281 | -------------------------------------------------------------------------------- /src/pages/ConsolePage.tsx: -------------------------------------------------------------------------------- 1 | /** 2 | * Running a local relay server will allow you to hide your API key 3 | * and run custom logic on the server 4 | * 5 | * Set the local relay server address to: 6 | * REACT_APP_LOCAL_RELAY_SERVER_URL=http://localhost:8081 7 | * 8 | * This will also require you to set OPENAI_API_KEY= in a `.env` file 9 | * You can run it with `npm run relay`, in parallel with `npm start` 10 | */ 11 | const LOCAL_RELAY_SERVER_URL: string = 12 | process.env.REACT_APP_LOCAL_RELAY_SERVER_URL || ''; 13 | 14 | import { useEffect, useRef, useCallback, useState } from 'react'; 15 | 16 | import { RealtimeClient } from '@openai/realtime-api-beta'; 17 | import { ItemType } from '@openai/realtime-api-beta/dist/lib/client.js'; 18 | import { WavRecorder, WavStreamPlayer } from '../lib/wavtools/index.js'; 19 | import { instructions } from '../utils/conversation_config.js'; 20 | import { WavRenderer } from '../utils/wav_renderer'; 21 | 22 | import { X, Edit, Zap, ArrowUp, ArrowDown } from 'react-feather'; 23 | import { Button } from '../components/button/Button'; 24 | import { Toggle } from '../components/toggle/Toggle'; 25 | import { Map } from '../components/Map'; 26 | 27 | import './ConsolePage.scss'; 28 | import { isJsxOpeningLikeElement } from 'typescript'; 29 | 30 | /** 31 | * Type for result from get_weather() function call 32 | */ 33 | interface Coordinates { 34 | lat: number; 35 | lng: number; 36 | location?: string; 37 | temperature?: { 38 | value: number; 39 | units: string; 40 | }; 41 | wind_speed?: { 42 | value: number; 43 | units: string; 44 | }; 45 | } 46 | 47 | /** 48 | * Type for all event logs 49 | */ 50 | interface RealtimeEvent { 51 | time: string; 52 | source: 'client' | 'server'; 53 | count?: number; 54 | event: { [key: string]: any }; 55 | } 56 | 57 | export function ConsolePage() { 58 | /** 59 | * Ask user for API Key 60 | * If we're using the local relay server, we don't need this 61 | */ 62 | const apiKey = LOCAL_RELAY_SERVER_URL 63 | ? '' 64 | : localStorage.getItem('tmp::voice_api_key') || 65 | prompt('OpenAI API Key') || 66 | ''; 67 | if (apiKey !== '') { 68 | localStorage.setItem('tmp::voice_api_key', apiKey); 69 | } 70 | 71 | /** 72 | * Instantiate: 73 | * - WavRecorder (speech input) 74 | * - WavStreamPlayer (speech output) 75 | * - RealtimeClient (API client) 76 | */ 77 | const wavRecorderRef = useRef( 78 | new WavRecorder({ sampleRate: 24000 }) 79 | ); 80 | const wavStreamPlayerRef = useRef( 81 | new WavStreamPlayer({ sampleRate: 24000 }) 82 | ); 83 | const clientRef = useRef( 84 | new RealtimeClient( 85 | LOCAL_RELAY_SERVER_URL 86 | ? 
{ url: LOCAL_RELAY_SERVER_URL } 87 | : { 88 | apiKey: apiKey, 89 | dangerouslyAllowAPIKeyInBrowser: true, 90 | } 91 | ) 92 | ); 93 | 94 | /** 95 | * References for 96 | * - Rendering audio visualization (canvas) 97 | * - Autoscrolling event logs 98 | * - Timing delta for event log displays 99 | */ 100 | const clientCanvasRef = useRef(null); 101 | const serverCanvasRef = useRef(null); 102 | const eventsScrollHeightRef = useRef(0); 103 | const eventsScrollRef = useRef(null); 104 | const startTimeRef = useRef(new Date().toISOString()); 105 | 106 | /** 107 | * All of our variables for displaying application state 108 | * - items are all conversation items (dialog) 109 | * - realtimeEvents are event logs, which can be expanded 110 | * - memoryKv is for set_memory() function 111 | * - coords, marker are for get_weather() function 112 | */ 113 | const [items, setItems] = useState([]); 114 | const [realtimeEvents, setRealtimeEvents] = useState([]); 115 | const [expandedEvents, setExpandedEvents] = useState<{ 116 | [key: string]: boolean; 117 | }>({}); 118 | const [isConnected, setIsConnected] = useState(false); 119 | const [canPushToTalk, setCanPushToTalk] = useState(true); 120 | const [isRecording, setIsRecording] = useState(false); 121 | const [memoryKv, setMemoryKv] = useState<{ [key: string]: any }>({}); 122 | const [coords, setCoords] = useState({ 123 | lat: 37.775593, 124 | lng: -122.418137, 125 | }); 126 | const [marker, setMarker] = useState(null); 127 | 128 | /** 129 | * Utility for formatting the timing of logs 130 | */ 131 | const formatTime = useCallback((timestamp: string) => { 132 | const startTime = startTimeRef.current; 133 | const t0 = new Date(startTime).valueOf(); 134 | const t1 = new Date(timestamp).valueOf(); 135 | const delta = t1 - t0; 136 | const hs = Math.floor(delta / 10) % 100; 137 | const s = Math.floor(delta / 1000) % 60; 138 | const m = Math.floor(delta / 60_000) % 60; 139 | const pad = (n: number) => { 140 | let s = n + ''; 141 | while (s.length < 2) { 142 | s = '0' + s; 143 | } 144 | return s; 145 | }; 146 | return `${pad(m)}:${pad(s)}.${pad(hs)}`; 147 | }, []); 148 | 149 | /** 150 | * When you click the API key 151 | */ 152 | const resetAPIKey = useCallback(() => { 153 | const apiKey = prompt('OpenAI API Key'); 154 | if (apiKey !== null) { 155 | localStorage.clear(); 156 | localStorage.setItem('tmp::voice_api_key', apiKey); 157 | window.location.reload(); 158 | } 159 | }, []); 160 | 161 | /** 162 | * Connect to conversation: 163 | * WavRecorder taks speech input, WavStreamPlayer output, client is API client 164 | */ 165 | const connectConversation = useCallback(async () => { 166 | const client = clientRef.current; 167 | const wavRecorder = wavRecorderRef.current; 168 | const wavStreamPlayer = wavStreamPlayerRef.current; 169 | 170 | // Set state variables 171 | startTimeRef.current = new Date().toISOString(); 172 | setIsConnected(true); 173 | setRealtimeEvents([]); 174 | setItems(client.conversation.getItems()); 175 | 176 | // Connect to microphone 177 | await wavRecorder.begin(); 178 | 179 | // Connect to audio output 180 | await wavStreamPlayer.connect(); 181 | 182 | // Connect to realtime API 183 | await client.connect(); 184 | client.sendUserMessageContent([ 185 | { 186 | type: `input_text`, 187 | text: `Hello!`, 188 | // text: `For testing purposes, I want you to list ten car brands. Number each item, e.g. 
"one (or whatever number you are one): the item name".` 189 | }, 190 | ]); 191 | 192 | if (client.getTurnDetectionType() === 'server_vad') { 193 | await wavRecorder.record((data) => client.appendInputAudio(data.mono)); 194 | } 195 | }, []); 196 | 197 | /** 198 | * Disconnect and reset conversation state 199 | */ 200 | const disconnectConversation = useCallback(async () => { 201 | setIsConnected(false); 202 | setRealtimeEvents([]); 203 | setItems([]); 204 | setMemoryKv({}); 205 | setCoords({ 206 | lat: 37.775593, 207 | lng: -122.418137, 208 | }); 209 | setMarker(null); 210 | 211 | const client = clientRef.current; 212 | client.disconnect(); 213 | 214 | const wavRecorder = wavRecorderRef.current; 215 | await wavRecorder.end(); 216 | 217 | const wavStreamPlayer = wavStreamPlayerRef.current; 218 | await wavStreamPlayer.interrupt(); 219 | }, []); 220 | 221 | const deleteConversationItem = useCallback(async (id: string) => { 222 | const client = clientRef.current; 223 | client.deleteItem(id); 224 | }, []); 225 | 226 | /** 227 | * In push-to-talk mode, start recording 228 | * .appendInputAudio() for each sample 229 | */ 230 | const startRecording = async () => { 231 | setIsRecording(true); 232 | const client = clientRef.current; 233 | const wavRecorder = wavRecorderRef.current; 234 | const wavStreamPlayer = wavStreamPlayerRef.current; 235 | const trackSampleOffset = await wavStreamPlayer.interrupt(); 236 | if (trackSampleOffset?.trackId) { 237 | const { trackId, offset } = trackSampleOffset; 238 | await client.cancelResponse(trackId, offset); 239 | } 240 | await wavRecorder.record((data) => client.appendInputAudio(data.mono)); 241 | }; 242 | 243 | /** 244 | * In push-to-talk mode, stop recording 245 | */ 246 | const stopRecording = async () => { 247 | setIsRecording(false); 248 | const client = clientRef.current; 249 | const wavRecorder = wavRecorderRef.current; 250 | await wavRecorder.pause(); 251 | client.createResponse(); 252 | }; 253 | 254 | /** 255 | * Switch between Manual <> VAD mode for communication 256 | */ 257 | const changeTurnEndType = async (value: string) => { 258 | const client = clientRef.current; 259 | const wavRecorder = wavRecorderRef.current; 260 | if (value === 'none' && wavRecorder.getStatus() === 'recording') { 261 | await wavRecorder.pause(); 262 | } 263 | client.updateSession({ 264 | turn_detection: value === 'none' ? 
null : { type: 'server_vad' }, 265 | }); 266 | if (value === 'server_vad' && client.isConnected()) { 267 | await wavRecorder.record((data) => client.appendInputAudio(data.mono)); 268 | } 269 | setCanPushToTalk(value === 'none'); 270 | }; 271 | 272 | /** 273 | * Auto-scroll the event logs 274 | */ 275 | useEffect(() => { 276 | if (eventsScrollRef.current) { 277 | const eventsEl = eventsScrollRef.current; 278 | const scrollHeight = eventsEl.scrollHeight; 279 | // Only scroll if height has just changed 280 | if (scrollHeight !== eventsScrollHeightRef.current) { 281 | eventsEl.scrollTop = scrollHeight; 282 | eventsScrollHeightRef.current = scrollHeight; 283 | } 284 | } 285 | }, [realtimeEvents]); 286 | 287 | /** 288 | * Auto-scroll the conversation logs 289 | */ 290 | useEffect(() => { 291 | const conversationEls = [].slice.call( 292 | document.body.querySelectorAll('[data-conversation-content]') 293 | ); 294 | for (const el of conversationEls) { 295 | const conversationEl = el as HTMLDivElement; 296 | conversationEl.scrollTop = conversationEl.scrollHeight; 297 | } 298 | }, [items]); 299 | 300 | /** 301 | * Set up render loops for the visualization canvas 302 | */ 303 | useEffect(() => { 304 | let isLoaded = true; 305 | 306 | const wavRecorder = wavRecorderRef.current; 307 | const clientCanvas = clientCanvasRef.current; 308 | let clientCtx: CanvasRenderingContext2D | null = null; 309 | 310 | const wavStreamPlayer = wavStreamPlayerRef.current; 311 | const serverCanvas = serverCanvasRef.current; 312 | let serverCtx: CanvasRenderingContext2D | null = null; 313 | 314 | const render = () => { 315 | if (isLoaded) { 316 | if (clientCanvas) { 317 | if (!clientCanvas.width || !clientCanvas.height) { 318 | clientCanvas.width = clientCanvas.offsetWidth; 319 | clientCanvas.height = clientCanvas.offsetHeight; 320 | } 321 | clientCtx = clientCtx || clientCanvas.getContext('2d'); 322 | if (clientCtx) { 323 | clientCtx.clearRect(0, 0, clientCanvas.width, clientCanvas.height); 324 | const result = wavRecorder.recording 325 | ? wavRecorder.getFrequencies('voice') 326 | : { values: new Float32Array([0]) }; 327 | WavRenderer.drawBars( 328 | clientCanvas, 329 | clientCtx, 330 | result.values, 331 | '#0099ff', 332 | 10, 333 | 0, 334 | 8 335 | ); 336 | } 337 | } 338 | if (serverCanvas) { 339 | if (!serverCanvas.width || !serverCanvas.height) { 340 | serverCanvas.width = serverCanvas.offsetWidth; 341 | serverCanvas.height = serverCanvas.offsetHeight; 342 | } 343 | serverCtx = serverCtx || serverCanvas.getContext('2d'); 344 | if (serverCtx) { 345 | serverCtx.clearRect(0, 0, serverCanvas.width, serverCanvas.height); 346 | const result = wavStreamPlayer.analyser 347 | ? 
wavStreamPlayer.getFrequencies('voice') 348 | : { values: new Float32Array([0]) }; 349 | WavRenderer.drawBars( 350 | serverCanvas, 351 | serverCtx, 352 | result.values, 353 | '#009900', 354 | 10, 355 | 0, 356 | 8 357 | ); 358 | } 359 | } 360 | window.requestAnimationFrame(render); 361 | } 362 | }; 363 | render(); 364 | 365 | return () => { 366 | isLoaded = false; 367 | }; 368 | }, []); 369 | 370 | /** 371 | * Core RealtimeClient and audio capture setup 372 | * Set all of our instructions, tools, events and more 373 | */ 374 | useEffect(() => { 375 | // Get refs 376 | const wavStreamPlayer = wavStreamPlayerRef.current; 377 | const client = clientRef.current; 378 | 379 | // Set instructions 380 | client.updateSession({ instructions: instructions }); 381 | // Set transcription, otherwise we don't get user transcriptions back 382 | client.updateSession({ input_audio_transcription: { model: 'whisper-1' } }); 383 | 384 | // Add tools 385 | client.addTool( 386 | { 387 | name: 'set_memory', 388 | description: 'Saves important data about the user into memory.', 389 | parameters: { 390 | type: 'object', 391 | properties: { 392 | key: { 393 | type: 'string', 394 | description: 395 | 'The key of the memory value. Always use lowercase and underscores, no other characters.', 396 | }, 397 | value: { 398 | type: 'string', 399 | description: 'Value can be anything represented as a string', 400 | }, 401 | }, 402 | required: ['key', 'value'], 403 | }, 404 | }, 405 | async ({ key, value }: { [key: string]: any }) => { 406 | setMemoryKv((memoryKv) => { 407 | const newKv = { ...memoryKv }; 408 | newKv[key] = value; 409 | return newKv; 410 | }); 411 | return { ok: true }; 412 | } 413 | ); 414 | client.addTool( 415 | { 416 | name: 'get_weather', 417 | description: 418 | 'Retrieves the weather for a given lat, lng coordinate pair. 
Specify a label for the location.', 419 | parameters: { 420 | type: 'object', 421 | properties: { 422 | lat: { 423 | type: 'number', 424 | description: 'Latitude', 425 | }, 426 | lng: { 427 | type: 'number', 428 | description: 'Longitude', 429 | }, 430 | location: { 431 | type: 'string', 432 | description: 'Name of the location', 433 | }, 434 | }, 435 | required: ['lat', 'lng', 'location'], 436 | }, 437 | }, 438 | async ({ lat, lng, location }: { [key: string]: any }) => { 439 | setMarker({ lat, lng, location }); 440 | setCoords({ lat, lng, location }); 441 | const result = await fetch( 442 | `https://api.open-meteo.com/v1/forecast?latitude=${lat}&longitude=${lng}&current=temperature_2m,wind_speed_10m` 443 | ); 444 | const json = await result.json(); 445 | const temperature = { 446 | value: json.current.temperature_2m as number, 447 | units: json.current_units.temperature_2m as string, 448 | }; 449 | const wind_speed = { 450 | value: json.current.wind_speed_10m as number, 451 | units: json.current_units.wind_speed_10m as string, 452 | }; 453 | setMarker({ lat, lng, location, temperature, wind_speed }); 454 | return json; 455 | } 456 | ); 457 | 458 | // handle realtime events from client + server for event logging 459 | client.on('realtime.event', (realtimeEvent: RealtimeEvent) => { 460 | setRealtimeEvents((realtimeEvents) => { 461 | const lastEvent = realtimeEvents[realtimeEvents.length - 1]; 462 | if (lastEvent?.event.type === realtimeEvent.event.type) { 463 | // if we receive multiple events in a row, aggregate them for display purposes 464 | lastEvent.count = (lastEvent.count || 0) + 1; 465 | return realtimeEvents.slice(0, -1).concat(lastEvent); 466 | } else { 467 | return realtimeEvents.concat(realtimeEvent); 468 | } 469 | }); 470 | }); 471 | client.on('error', (event: any) => console.error(event)); 472 | client.on('conversation.interrupted', async () => { 473 | const trackSampleOffset = await wavStreamPlayer.interrupt(); 474 | if (trackSampleOffset?.trackId) { 475 | const { trackId, offset } = trackSampleOffset; 476 | await client.cancelResponse(trackId, offset); 477 | } 478 | }); 479 | client.on('conversation.updated', async ({ item, delta }: any) => { 480 | const items = client.conversation.getItems(); 481 | if (delta?.audio) { 482 | wavStreamPlayer.add16BitPCM(delta.audio, item.id); 483 | } 484 | if (item.status === 'completed' && item.formatted.audio?.length) { 485 | const wavFile = await WavRecorder.decode( 486 | item.formatted.audio, 487 | 24000, 488 | 24000 489 | ); 490 | item.formatted.file = wavFile; 491 | } 492 | setItems(items); 493 | }); 494 | 495 | setItems(client.conversation.getItems()); 496 | 497 | return () => { 498 | // cleanup; resets to defaults 499 | client.reset(); 500 | }; 501 | }, []); 502 | 503 | /** 504 | * Render the application 505 | */ 506 | return ( 507 |
508 |
509 |
510 | 511 | realtime console 512 |
513 |
514 | {!LOCAL_RELAY_SERVER_URL && ( 515 |
524 |
525 |
526 |
527 |
528 |
529 |
530 | 531 |
532 |
533 | 534 |
535 |
536 |
events
537 |
538 | {!realtimeEvents.length && `awaiting connection...`} 539 | {realtimeEvents.map((realtimeEvent, i) => { 540 | const count = realtimeEvent.count; 541 | const event = { ...realtimeEvent.event }; 542 | if (event.type === 'input_audio_buffer.append') { 543 | event.audio = `[trimmed: ${event.audio.length} bytes]`; 544 | } else if (event.type === 'response.audio.delta') { 545 | event.delta = `[trimmed: ${event.delta.length} bytes]`; 546 | } 547 | return ( 548 |
549 |
550 | {formatTime(realtimeEvent.time)} 551 |
552 |
553 |
{ 556 | // toggle event details 557 | const id = event.event_id; 558 | const expanded = { ...expandedEvents }; 559 | if (expanded[id]) { 560 | delete expanded[id]; 561 | } else { 562 | expanded[id] = true; 563 | } 564 | setExpandedEvents(expanded); 565 | }} 566 | > 567 |
574 | {realtimeEvent.source === 'client' ? ( 575 | 576 | ) : ( 577 | 578 | )} 579 | 580 | {event.type === 'error' 581 | ? 'error!' 582 | : realtimeEvent.source} 583 | 584 |
585 |
586 | {event.type} 587 | {count && ` (${count})`} 588 |
589 |
590 | {!!expandedEvents[event.event_id] && ( 591 |
592 | {JSON.stringify(event, null, 2)} 593 |
594 | )} 595 |
596 |
597 | ); 598 | })} 599 |
600 |
601 |
602 |
conversation
603 |
604 | {!items.length && `awaiting connection...`} 605 | {items.map((conversationItem, i) => { 606 | return ( 607 |
608 |
609 |
610 | {( 611 | conversationItem.role || conversationItem.type 612 | ).replaceAll('_', ' ')} 613 |
614 |
617 | deleteConversationItem(conversationItem.id) 618 | } 619 | > 620 | 621 |
622 |
623 |
624 | {/* tool response */} 625 | {conversationItem.type === 'function_call_output' && ( 626 |
{conversationItem.formatted.output}
627 | )} 628 | {/* tool call */} 629 | {!!conversationItem.formatted.tool && ( 630 |
631 | {conversationItem.formatted.tool.name}( 632 | {conversationItem.formatted.tool.arguments}) 633 |
634 | )} 635 | {!conversationItem.formatted.tool && 636 | conversationItem.role === 'user' && ( 637 |
638 | {conversationItem.formatted.transcript || 639 | (conversationItem.formatted.audio?.length 640 | ? '(awaiting transcript)' 641 | : conversationItem.formatted.text || 642 | '(item sent)')} 643 |
644 | )} 645 | {!conversationItem.formatted.tool && 646 | conversationItem.role === 'assistant' && ( 647 |
648 | {conversationItem.formatted.transcript || 649 | conversationItem.formatted.text || 650 | '(truncated)'} 651 |
652 | )} 653 | {conversationItem.formatted.file && ( 654 |
660 |
661 | ); 662 | })} 663 |
664 |
665 |
666 | changeTurnEndType(value)} 671 | /> 672 |
673 | {isConnected && canPushToTalk && ( 674 |
693 |
694 |
695 |
696 |
get_weather()
697 |
698 | {marker?.location || 'not yet retrieved'} 699 | {!!marker?.temperature && ( 700 | <> 701 |
702 | 🌡️ {marker.temperature.value} {marker.temperature.units} 703 | 704 | )} 705 | {!!marker?.wind_speed && ( 706 | <> 707 | {' '} 708 | 🍃 {marker.wind_speed.value} {marker.wind_speed.units} 709 | 710 | )} 711 |
712 |
713 | {coords && ( 714 | 718 | )} 719 |
720 |
721 |
722 |
set_memory()
723 |
724 | {JSON.stringify(memoryKv, null, 2)} 725 |
726 |
727 |
728 |
729 |
730 | ); 731 | } 732 | -------------------------------------------------------------------------------- /src/pages/globals.d.ts: -------------------------------------------------------------------------------- 1 | interface Window { 2 | webkitAudioContext?: typeof AudioContext; 3 | } -------------------------------------------------------------------------------- /src/react-app-env.d.ts: -------------------------------------------------------------------------------- 1 | /// <reference types="react-scripts" /> 2 | -------------------------------------------------------------------------------- /src/reportWebVitals.ts: -------------------------------------------------------------------------------- 1 | import { ReportHandler } from 'web-vitals'; 2 | 3 | const reportWebVitals = (onPerfEntry?: ReportHandler) => { 4 | if (onPerfEntry && onPerfEntry instanceof Function) { 5 | import('web-vitals').then(({ getCLS, getFID, getFCP, getLCP, getTTFB }) => { 6 | getCLS(onPerfEntry); 7 | getFID(onPerfEntry); 8 | getFCP(onPerfEntry); 9 | getLCP(onPerfEntry); 10 | getTTFB(onPerfEntry); 11 | }); 12 | } 13 | }; 14 | 15 | export default reportWebVitals; 16 | -------------------------------------------------------------------------------- /src/setupTests.ts: -------------------------------------------------------------------------------- 1 | // jest-dom adds custom jest matchers for asserting on DOM nodes. 2 | // allows you to do things like: 3 | // expect(element).toHaveTextContent(/react/i) 4 | // learn more: https://github.com/testing-library/jest-dom 5 | import '@testing-library/jest-dom'; 6 | -------------------------------------------------------------------------------- /src/utils/conversation_config.js: -------------------------------------------------------------------------------- 1 | export const instructions = `System settings: 2 | Tool use: enabled. 3 | 4 | Instructions: 5 | - You are an artificial intelligence agent responsible for helping test realtime voice capabilities 6 | - Please make sure to respond with a helpful voice via audio 7 | - Be kind, helpful, and courteous 8 | - It is okay to ask the user questions 9 | - Use tools and functions you have available liberally, it is part of the training apparatus 10 | - Be open to exploration and conversation 11 | - Remember: this is just for fun and testing! 12 | 13 | Personality: 14 | - Be upbeat and genuine 15 | - Try speaking quickly as if excited 16 | `; 17 | -------------------------------------------------------------------------------- /src/utils/wav_renderer.ts: -------------------------------------------------------------------------------- 1 | const dataMap = new WeakMap(); 2 | 3 | /** 4 | * Normalizes a Float32Array to Array(m): We use this to draw amplitudes on a graph 5 | * If we're rendering the same audio data, then we'll often be using 6 | * the same (data, m, downsamplePeaks) triplets so we give the option to memoize 7 | */ 8 | const normalizeArray = ( 9 | data: Float32Array, 10 | m: number, 11 | downsamplePeaks: boolean = false, 12 | memoize: boolean = false 13 | ) => { 14 | let cache, mKey, dKey; 15 | if (memoize) { 16 | mKey = m.toString(); 17 | dKey = downsamplePeaks.toString(); 18 | cache = dataMap.has(data) ?
dataMap.get(data) : {}; 19 | dataMap.set(data, cache); 20 | cache[mKey] = cache[mKey] || {}; 21 | if (cache[mKey][dKey]) { 22 | return cache[mKey][dKey]; 23 | } 24 | } 25 | const n = data.length; 26 | const result = new Array(m); 27 | if (m <= n) { 28 | // Downsampling 29 | result.fill(0); 30 | const count = new Array(m).fill(0); 31 | for (let i = 0; i < n; i++) { 32 | const index = Math.floor(i * (m / n)); 33 | if (downsamplePeaks) { 34 | // take highest result in the set 35 | result[index] = Math.max(result[index], Math.abs(data[i])); 36 | } else { 37 | result[index] += Math.abs(data[i]); 38 | } 39 | count[index]++; 40 | } 41 | if (!downsamplePeaks) { 42 | for (let i = 0; i < result.length; i++) { 43 | result[i] = result[i] / count[i]; 44 | } 45 | } 46 | } else { 47 | for (let i = 0; i < m; i++) { 48 | const index = (i * (n - 1)) / (m - 1); 49 | const low = Math.floor(index); 50 | const high = Math.ceil(index); 51 | const t = index - low; 52 | if (high >= n) { 53 | result[i] = data[n - 1]; 54 | } else { 55 | result[i] = data[low] * (1 - t) + data[high] * t; 56 | } 57 | } 58 | } 59 | if (memoize) { 60 | cache[mKey as string][dKey as string] = result; 61 | } 62 | return result; 63 | }; 64 | 65 | export const WavRenderer = { 66 | /** 67 | * Renders a point-in-time snapshot of an audio sample, usually frequency values 68 | * @param canvas 69 | * @param ctx 70 | * @param data 71 | * @param color 72 | * @param pointCount number of bars to render 73 | * @param barWidth width of bars in px 74 | * @param barSpacing spacing between bars in px 75 | * @param center vertically center the bars 76 | */ 77 | drawBars: ( 78 | canvas: HTMLCanvasElement, 79 | ctx: CanvasRenderingContext2D, 80 | data: Float32Array, 81 | color: string, 82 | pointCount: number = 0, 83 | barWidth: number = 0, 84 | barSpacing: number = 0, 85 | center: boolean = false 86 | ) => { 87 | pointCount = Math.floor( 88 | Math.min( 89 | pointCount, 90 | (canvas.width - barSpacing) / (Math.max(barWidth, 1) + barSpacing) 91 | ) 92 | ); 93 | if (!pointCount) { 94 | pointCount = Math.floor( 95 | (canvas.width - barSpacing) / (Math.max(barWidth, 1) + barSpacing) 96 | ); 97 | } 98 | if (!barWidth) { 99 | barWidth = (canvas.width - barSpacing) / pointCount - barSpacing; 100 | } 101 | const points = normalizeArray(data, pointCount, true); 102 | for (let i = 0; i < pointCount; i++) { 103 | const amplitude = Math.abs(points[i]); 104 | const height = Math.max(1, amplitude * canvas.height); 105 | const x = barSpacing + i * (barWidth + barSpacing); 106 | const y = center ? (canvas.height - height) / 2 : canvas.height - height; 107 | ctx.fillStyle = color; 108 | ctx.fillRect(x, y, barWidth, height); 109 | } 110 | }, 111 | }; 112 | -------------------------------------------------------------------------------- /tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | "compilerOptions": { 3 | "target": "ES2020", 4 | "lib": ["dom", "dom.iterable", "esnext", "ES2020"], 5 | "allowJs": true, 6 | "skipLibCheck": true, 7 | "esModuleInterop": true, 8 | "allowSyntheticDefaultImports": true, 9 | "strict": true, 10 | "forceConsistentCasingInFileNames": true, 11 | "noFallthroughCasesInSwitch": true, 12 | "module": "esnext", 13 | "moduleResolution": "node", 14 | "resolveJsonModule": true, 15 | "isolatedModules": true, 16 | "noEmit": true, 17 | "jsx": "react-jsx" 18 | }, 19 | "include": ["src", "src/lib"] 20 | } 21 | --------------------------------------------------------------------------------
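
A note on how the worklet files above are consumed: both audio_processor.js and stream_processor.js export their processor code as a template string wrapped in a Blob URL (AudioProcessorSrc, StreamProcessorSrc), so the app can load them with audioWorklet.addModule() without any bundler-specific worklet setup. The sketch below is a minimal, illustrative example of that loading pattern for playback only. It relies solely on the message protocol visible in stream_processor.js ({ event: 'write', buffer, trackId } carrying an Int16Array) plus standard Web Audio APIs; the helper name playInt16, the import path (assumed relative to src/), and the hard-coded 24 kHz sample rate are assumptions for illustration, since the application itself does this wiring through WavStreamPlayer (connect(), add16BitPCM(), interrupt()).

import { StreamProcessorSrc } from './lib/wavtools/lib/worklets/stream_processor.js';

// Illustrative sketch: load the stream worklet from its Blob URL, create a node
// registered under 'stream_processor', and post Int16 PCM to its port using the
// same { event: 'write', buffer, trackId } message the worklet listens for.
// Inside the worklet each Int16 sample is converted to Float32 by dividing by
// 0x8000; once its queued buffers drain it posts { event: 'stop' } and halts.
async function playInt16(pcm: Int16Array, trackId = 'example-track'): Promise<AudioWorkletNode> {
  // 24 kHz matches the sample rate used throughout this project; browsers may
  // require a user gesture before an AudioContext is allowed to produce sound.
  const ctx = new AudioContext({ sampleRate: 24000 });
  await ctx.audioWorklet.addModule(StreamProcessorSrc);
  const node = new AudioWorkletNode(ctx, 'stream_processor');
  node.connect(ctx.destination);
  node.port.postMessage({ event: 'write', buffer: pcm, trackId });
  return node;
}

// Hypothetical usage: play one second of silence.
// playInt16(new Int16Array(24000));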