diff --git a/app/ui.js b/app/ui.js
index 51e57bd3..3ecaf7a1 100644
--- a/app/ui.js
+++ b/app/ui.js
@@ -189,6 +189,7 @@ const UI = {
         UI.initSetting('repeaterID', '');
         UI.initSetting('reconnect', false);
         UI.initSetting('reconnect_delay', 5000);
+        UI.initSetting('enable_audio', true);
     },
     // Adds a link to the label elements on the corresponding input elements
     setupSettingLabels() {
@@ -333,6 +334,12 @@ const UI = {
             .addEventListener('click', UI.rejectServer);
         document.getElementById("noVNC_credentials_button")
             .addEventListener('click', UI.setCredentials);
+
+        document.addEventListener('click', function(event) {
+            if (UI.rfb !== undefined) {
+                UI.rfb.allow_audio();
+            }
+        });
     },
 
     addClipboardHandlers() {
@@ -379,6 +386,8 @@ const UI = {
         UI.addSettingChangeHandler('logging', UI.updateLogging);
         UI.addSettingChangeHandler('reconnect');
         UI.addSettingChangeHandler('reconnect_delay');
+        UI.addSettingChangeHandler('enable_audio');
+        UI.addSettingChangeHandler('enable_audio', UI.updateEnableAudio);
     },
 
     addFullscreenHandlers() {
@@ -892,6 +901,7 @@ const UI = {
         UI.updateSetting('logging');
         UI.updateSetting('reconnect');
         UI.updateSetting('reconnect_delay');
+        UI.updateSetting('enable_audio');
 
         document.getElementById('noVNC_settings')
             .classList.add("noVNC_open");
@@ -1103,6 +1113,8 @@ const UI = {
         UI.rfb.showDotCursor = UI.getSetting('show_dot');
 
         UI.updateViewOnly(); // requires UI.rfb
+        UI.updateEnableAudio(); // requires UI.rfb
+
     },
 
     disconnect() {
@@ -1795,6 +1807,11 @@ const UI = {
         selectbox.options.add(optn);
     },
 
+    updateEnableAudio() {
+        if (!UI.rfb) return;
+        UI.rfb.enable_audio(UI.getSetting('enable_audio'));
+    },
+
 /* ------^-------
  *     /MISC
  * ==============
diff --git a/core/audio.js b/core/audio.js
new file mode 100644
index 00000000..a2baf1eb
--- /dev/null
+++ b/core/audio.js
@@ -0,0 +1,173 @@
+// The RFB protocol (VNC) is designed for real-time user interaction
+// and allows transferring audio data together with screen content.
+// We cannot use large playback buffers, because they would introduce
+// a noticeable delay between user interaction and the displayed content.
+//
+// This is not really a problem for screen content, because the human
+// brain is quite tolerant of slight speed changes in video, and we
+// mostly transfer non-video data anyway.
+//
+// Audio is different: it must be played back at a constant speed, and
+// any delay leads to audible distortion, which is unpleasant for humans.
+//
+// Without buffering, audio frames can always arrive too late or too
+// early due to changing network speeds.
+//
+// We therefore use the following algorithm:
+//
+// - keep a small jitter buffer (20 ms) to tolerate small speed changes
+// - simply discard audio frames that arrive too late
+// - queue early frames with a slight speedup (pitch scaling) to re-sync audio
+// - if too many frames arrive early, skip frames for a fast re-sync
+//
+// ## Audio format
+//
+// We expect raw U16 (unsigned 16-bit), little-endian audio data with
+// interleaved channel data: [L0, R0, L1, R1, ...]
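+//
+// For illustration only: with 2 channels each sample frame is 4 bytes
+// on the wire,
+//
+//   [L0_lo, L0_hi, R0_lo, R0_hi, L1_lo, L1_hi, R1_lo, R1_hi, ...]
+//
+// and a U16 value of 0x0000 maps to -1.0, 0x8000 (32768) to 0.0 and
+// 0xFFFF to ~+1.0 once converted to the Float32 samples expected by the
+// Web Audio API (see _createBuffer() below).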
+
+import * as Log from './util/logging.js';
+
+export default class Audio {
+    constructor(sample_rate, nchannels) {
+        this._next_start = 0;
+        this._context = null;
+        this._jitter = 0.02;
+        this._resample_trigger = 5*this._jitter;
+        this._stable_time = 1.0;
+
+        // ===== PROPERTIES =====
+        this._sample_rate = sample_rate;
+        this._nchannels = nchannels;
+        this._little_endian = true;
+    }
+
+    // ===== PROPERTIES =====
+    get sample_rate() { return this._sample_rate; }
+    get nchannels() { return this._nchannels; }
+
+    // ===== PUBLIC METHODS =====
+
+    // Stop audio playback
+    //
+    // Further audio frames are simply dropped.
+    stop() {
+        this._context = null;
+        this._next_start = 0;
+    }
+
+    start() {
+        this._context = new AudioContext({
+            latencyHint: "interactive",
+            sampleRate: this._sample_rate,
+        });
+        this._next_start = 0;
+    }
+
+    play(payload) {
+        if (this._context === null) {
+            return true;
+        }
+
+        let ctime = this._context.currentTime;
+
+        let time_offset = this._next_start - ctime;
+
+        let sample_bytes = 2*this._nchannels;
+
+        if ((time_offset < this._jitter) && (this._resample_trigger !== 5*this._jitter)) {
+            Log.Debug("Stop resampling because audio is in sync (delay = " + time_offset + " sec)");
+            this._resample_trigger = 5*this._jitter;
+        }
+
+        let buffer = null;
+        if (time_offset > this._resample_trigger && (payload.length > (100*sample_bytes))) {
+            if (this._resample_trigger !== this._jitter) {
+                Log.Debug("Start resampling to re-sync audio (delay = " + time_offset + " sec)");
+                this._resample_trigger = this._jitter;
+            }
+            buffer = this._pitchScale(payload, 1.01); // increase pitch by 1%
+        } else {
+            buffer = this._createBuffer(payload);
+        }
+
+        if (this._next_start > 0) {
+            if (time_offset < -buffer.duration) {
+                Log.Warn("Skip delayed audio frame (delay = " + (-time_offset) + " sec)");
+                this._next_start = ctime + this._jitter;
+                return true; // do not play delayed frame - skip it!
+            }
+            if (time_offset > 0.5) {
+                Log.Warn("Move fast audio frame (offset = " + time_offset + " sec)");
+                this._stable_time = 0;
+                return true; // skip frame.
+            }
+        }
+
+        this._stable_time += buffer.duration;
+
+        if (this._next_start === 0) {
+            this._next_start = ctime + this._jitter;
+        }
+
+        let start_time = this._next_start;
+        this._next_start += buffer.duration;
+
+        if (this._stable_time >= 1.0) {
+            let source = this._context.createBufferSource();
+            source.buffer = buffer;
+            source.connect(this._context.destination);
+            source.start(start_time);
+        }
+
+        return true;
+    }
+
+    // ===== PRIVATE METHODS =====
+
+    // see: https://en.wikipedia.org/wiki/Audio_time_stretching_and_pitch_scaling
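+    //
+    // Resampling reads the input at position i*factor and linearly
+    // interpolates between the two neighbouring samples. With
+    // factor = 1.01 every output sample consumes ~1% more input, so the
+    // resulting buffer is ~1% shorter and playback can catch up with the
+    // incoming stream. Illustrative example: output sample 50 is read
+    // from input position 50.5, i.e. the average of input samples 50 and 51.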
+    _pitchScale(payload, factor) {
+        let sample_bytes = 2*this._nchannels;
+        let new_length = Math.ceil(payload.length/(factor*sample_bytes));
+        const payload_view = new DataView(payload.buffer, payload.byteOffset, payload.byteLength);
+
+        let buffer = this._context.createBuffer(this._nchannels, new_length, this._sample_rate);
+        for (let ch = 0; ch < this._nchannels; ch++) {
+            const channel = buffer.getChannelData(ch);
+            let channel_offset = ch*2;
+            for (let i = 0; i < buffer.length; i++) {
+                let pos_float = i*factor;
+                let j = Math.trunc(pos_float);
+                let second_weight = pos_float % 1;
+                let first_weight = 1 - second_weight;
+                let p = j*sample_bytes + channel_offset;
+                let value0 = payload_view.getUint16(p, this._little_endian);
+                p += sample_bytes;
+                let value1 = value0;
+                if (p < payload.length) {
+                    value1 = payload_view.getUint16(p, this._little_endian);
+                }
+                let value = (value0*first_weight + value1*second_weight);
+                channel[i] = (value - 32768) / 32768.0;
+            }
+        }
+        return buffer;
+    }
+
+    _createBuffer(payload) {
+        let sample_bytes = 2*this._nchannels;
+        let buffer = this._context.createBuffer(
+            this._nchannels, payload.length/sample_bytes, this._sample_rate);
+
+        for (let ch = 0; ch < this._nchannels; ch++) {
+            const channel = buffer.getChannelData(ch);
+            let channel_offset = ch*2;
+            for (let i = 0; i < buffer.length; i++) {
+                let p = i*sample_bytes + channel_offset;
+                let value = payload[p] + payload[p+1]*256;
+                channel[i] = (value / 32768.0) - 1.0;
+            }
+        }
+        return buffer;
+    }
+}
diff --git a/core/encodings.js b/core/encodings.js
index 7afcb17f..a69b4315 100644
--- a/core/encodings.js
+++ b/core/encodings.js
@@ -24,6 +24,7 @@ export const encodings = {
     pseudoEncodingLastRect: -224,
     pseudoEncodingCursor: -239,
     pseudoEncodingQEMUExtendedKeyEvent: -258,
+    pseudoEncodingQEMUAudioEvent: -259,
     pseudoEncodingQEMULedEvent: -261,
     pseudoEncodingDesktopName: -307,
     pseudoEncodingExtendedDesktopSize: -308,
diff --git a/core/rfb.js b/core/rfb.js
index 80011e4a..4b35ce09 100644
--- a/core/rfb.js
+++ b/core/rfb.js
@@ -14,6 +14,7 @@ import { dragThreshold, supportsWebCodecsH264Decode } from './util/browser.js';
 import { clientToElement } from './util/element.js';
 import { setCapture } from './util/events.js';
 import EventTargetMixin from './util/eventtarget.js';
+import Audio from "./audio.js";
 import Display from "./display.js";
 import Inflator from "./inflator.js";
 import Deflator from "./deflator.js";
@@ -154,6 +155,11 @@ export default class RFB extends EventTargetMixin {
 
         this._qemuExtKeyEventSupported = false;
 
+        this._qemuAudioSupported = false;
+        this._page_had_user_interaction = false;
+        this._audio_enable = false;
+        this._audio = new Audio(44100, 2);
+
         this._extendedPointerEventSupported = false;
 
         this._clipboardText = null;
@@ -2252,6 +2258,7 @@ export default class RFB extends EventTargetMixin {
         encs.push(encodings.pseudoEncodingDesktopSize);
         encs.push(encodings.pseudoEncodingLastRect);
         encs.push(encodings.pseudoEncodingQEMUExtendedKeyEvent);
+        encs.push(encodings.pseudoEncodingQEMUAudioEvent);
         encs.push(encodings.pseudoEncodingQEMULedEvent);
         encs.push(encodings.pseudoEncodingExtendedDesktopSize);
         encs.push(encodings.pseudoEncodingXvp);
@@ -2607,6 +2614,9 @@
             case 250: // XVP
                 return this._handleXvpMsg();
 
+            case 255: // QEMU server message
+                return this._handleQemuAudioEvent();
+
             default:
                 this._fail("Unexpected server message (type " + msgType + ")");
                 Log.Debug("sock.rQpeekBytes(30): " + this._sock.rQpeekBytes(30));
@@ -2679,6 +2689,13 @@
                 this._qemuExtKeyEventSupported = true;
                 return true;
 
+            case encodings.pseudoEncodingQEMUAudioEvent:
+                if (!this._qemuAudioSupported) {
+                    RFB.messages.enableQemuAudioUpdates(this._sock, this._audio.nchannels, this._audio.sample_rate);
+                    this._qemuAudioSupported = true;
+                }
+                return true;
+
             case encodings.pseudoEncodingDesktopName:
                 return this._handleDesktopName();
 
@@ -2701,6 +2718,75 @@
         }
     }
 
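+    // QEMU Audio server message (msg-type 255, submessage-type 1), as
+    // parsed below: a U8 submessage type, a U16 operation
+    // (0 = stop playback, 1 = start playback, 2 = audio data) and, for
+    // audio data, a U32 payload length followed by the raw samples in
+    // the format negotiated via RFB.messages.enableQemuAudioUpdates().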
+    _handleQemuAudioEvent() {
+        if (this._sock.rQwait("Qemu Audio Event", 3, 1)) {
+            return false;
+        }
+
+        const submsg = this._sock.rQshift8();
+        if (submsg !== 1) {
+            Log.Warn("The given QEMU submessage type " + submsg + " is not supported.");
+            return false;
+        }
+
+        const operation = this._sock.rQshift16();
+
+        switch (operation) {
+            case 0: {
+                this._audio.stop();
+                return true;
+            }
+            case 1: {
+                this._audio.start();
+                return true;
+            }
+            case 2: break;
+            default: {
+                Log.Warn("The given QEMU audio operation " + operation + " is not supported.");
+                return false;
+            }
+        }
+
+        if (this._sock.rQwait("Qemu Audio payload length", 4, 4)) {
+            return false;
+        }
+
+        const length = this._sock.rQshift32();
+
+        if (length === 0) {
+            return false;
+        }
+
+        if (this._sock.rQwait("audio payload", length, 8)) {
+            return false;
+        }
+
+        let payload = this._sock.rQshiftBytes(length, false);
+
+        if (!this._page_had_user_interaction || !this._audio_enable) {
+            return true;
+        }
+
+        return this._audio.play(payload);
+    }
+
+    enable_audio(value) {
+        if (this._audio_enable !== value) {
+            this._audio_enable = value;
+            if (this._qemuAudioSupported) {
+                if (this._audio_enable) {
+                    RFB.messages.enableQemuAudioUpdates(this._sock, this._audio.nchannels, this._audio.sample_rate);
+                } else {
+                    RFB.messages.disableQemuAudioUpdates(this._sock);
+                }
+            }
+        }
+    }
+
+    allow_audio() {
+        this._page_had_user_interaction = true;
+    }
+
     _handleVMwareCursor() {
         const hotx = this._FBU.x; // hotspot-x
         const hoty = this._FBU.y; // hotspot-y
@@ -3310,6 +3396,30 @@ RFB.messages = {
         sock.flush();
     },
 
+    disableQemuAudioUpdates(sock, nchannels, sample_rate) {
+        sock.sQpush8(255); // msg-type
+        sock.sQpush8(1);   // submessage-type
+        sock.sQpush16(1);  // disable audio
+
+        sock.flush();
+    },
+
+    enableQemuAudioUpdates(sock, nchannels, sample_rate) {
+        sock.sQpush8(255); // msg-type
+        sock.sQpush8(1);   // submessage-type
+        sock.sQpush16(2);  // set sample format
+        sock.sQpush8(2);   // format U16
+        sock.sQpush8(nchannels);
+        sock.sQpush32(sample_rate); // audio frequency
+
+        sock.sQpush8(255); // msg-type
+        sock.sQpush8(1);   // submessage-type
+        sock.sQpush16(0);  // enable audio
+
+        sock.flush();
+    },
+
     pixelFormat(sock, depth, trueColor) {
         let bpp;
diff --git a/vnc.html b/vnc.html
index 82cacd58..f6cab3f9 100644
--- a/vnc.html
+++ b/vnc.html
@@ -219,6 +219,13 @@
                         <li>
                             <label><input id="noVNC_setting_view_only" type="checkbox"> View only</label>
                         </li>
+                        <li>
+                            <label><input id="noVNC_setting_enable_audio" type="checkbox"> Enable audio</label>
+                        </li>