1 files changed, 3460 insertions, 1104 deletions
diff --git a/src/main.cpp b/src/main.cpp
index 2b29d3b..d04b52b 100644
--- a/src/main.cpp
+++ b/src/main.cpp
@@ -1,669 +1,1002 @@
-/*
-    Copyright (C) 2020 dec05eba
-
-    This program is free software: you can redistribute it and/or modify
-    it under the terms of the GNU General Public License as published by
-    the Free Software Foundation, either version 3 of the License, or
-    (at your option) any later version.
-
-    This program is distributed in the hope that it will be useful,
-    but WITHOUT ANY WARRANTY; without even the implied warranty of
-    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-    GNU General Public License for more details.
-
-    You should have received a copy of the GNU General Public License
-    along with this program.  If not, see <https://www.gnu.org/licenses/>.
-*/
+extern "C" {
+#include "../include/capture/nvfbc.h"
+#include "../include/capture/xcomposite.h"
+#include "../include/capture/ximage.h"
+#include "../include/capture/kms.h"
+#ifdef GSR_PORTAL
+#include "../include/capture/portal.h"
+#include "../include/dbus.h"
+#endif
+#ifdef GSR_APP_AUDIO
+#include "../include/pipewire_audio.h"
+#endif
+#include "../include/encoder/encoder.h"
+#include "../include/encoder/video/nvenc.h"
+#include "../include/encoder/video/vaapi.h"
+#include "../include/encoder/video/vulkan.h"
+#include "../include/encoder/video/software.h"
+#include "../include/codec_query/nvenc.h"
+#include "../include/codec_query/vaapi.h"
+#include "../include/codec_query/vulkan.h"
+#include "../include/window/x11.h"
+#include "../include/window/wayland.h"
+#include "../include/egl.h"
+#include "../include/utils.h"
+#include "../include/damage.h"
+#include "../include/color_conversion.h"
+#include "../include/image_writer.h"
+#include "../include/args_parser.h"
+}
 
 #include <assert.h>
 #include <stdio.h>
 #include <stdlib.h>
 #include <string>
-#include <vector>
 #include <thread>
 #include <mutex>
-#include <map>
 #include <signal.h>
 #include <sys/stat.h>
-
 #include <unistd.h>
-#include <fcntl.h>
+#include <sys/wait.h>
+#include <inttypes.h>
+#include <libgen.h>
+#include <malloc.h>
 
 #include "../include/sound.hpp"
 
-#define GLX_GLXEXT_PROTOTYPES
-#include <GL/glew.h>
-#include <GL/glx.h>
-#include <GL/glxext.h>
-#include <GLFW/glfw3.h>
-
-#include <X11/extensions/Xcomposite.h>
-
 extern "C" {
 #include <libavutil/pixfmt.h>
 #include <libavcodec/avcodec.h>
+#include <libavcodec/defs.h>
 #include <libavformat/avformat.h>
-#include <libavutil/hwcontext.h>
-#include <libavutil/hwcontext_cuda.h>
 #include <libavutil/opt.h>
 #include <libswresample/swresample.h>
 #include <libavutil/avutil.h>
 #include <libavutil/time.h>
+#include <libavutil/mastering_display_metadata.h>
+#include <libavfilter/avfilter.h>
+#include <libavfilter/buffersink.h>
+#include <libavfilter/buffersrc.h>
 }
-#include <cudaGL.h>
 
-extern "C" {
-#include <libavutil/hwcontext.h>
-}
+#include <future>
 
-#include "../include/NvFBCLibrary.hpp"
+#ifndef GSR_VERSION
+#define GSR_VERSION "unknown"
+#endif
 
-#include <deque>
-#include <future>
+// TODO: If options are not supported then they are returned (allocated) in the options. They should be freed.
 
-//#include <CL/cl.h>
+// TODO: Remove LIBAVUTIL_VERSION_MAJOR checks in the future when ubuntu, pop os LTS etc update ffmpeg to >= 5.0
+
+static const int AUDIO_SAMPLE_RATE = 48000; // assigned to the audio encoder context's sample_rate in create_audio_codec_context
 
 static const int VIDEO_STREAM_INDEX = 0;
-static const int AUDIO_STREAM_INDEX = 1;
 
 static thread_local char av_error_buffer[AV_ERROR_MAX_STRING_SIZE];
 
-static char* av_error_to_string(int err) {
-    if(av_strerror(err, av_error_buffer, sizeof(av_error_buffer)) < 0)
-        strcpy(av_error_buffer, "Unknown error");
-    return av_error_buffer;
-}
-
-struct ScopedGLXFBConfig {
-    ~ScopedGLXFBConfig() {
-        if (configs)
-            XFree(configs);
+typedef struct {
+    const gsr_window *window; // queried for the display server type while printing a monitor
+} MonitorOutputCallbackUserdata; // userdata consumed by monitor_output_callback_print
+
+static void monitor_output_callback_print(const gsr_monitor *monitor, void *userdata) { // prints one monitor's name, size and position to stderr
+    const MonitorOutputCallbackUserdata *ctx = (MonitorOutputCallbackUserdata*)userdata;
+    vec2i size = monitor->size;
+    vec2i pos = monitor->pos;
+    if(gsr_window_get_display_server(ctx->window) == GSR_DISPLAY_SERVER_WAYLAND) {
+        gsr_monitor_rotation rotation = GSR_MONITOR_ROT_0;
+        drm_monitor_get_display_server_data(ctx->window, monitor, &rotation, &pos); // receives pointers to rotation and pos
+        if(rotation == GSR_MONITOR_ROT_90 || rotation == GSR_MONITOR_ROT_270)
+            std::swap(size.x, size.y); // a quarter-turn rotation exchanges width and height
     }
-
-    GLXFBConfig *configs = nullptr;
-};
-
-struct WindowPixmap {
-    WindowPixmap()
-        : pixmap(None), glx_pixmap(None), texture_id(0), target_texture_id(0),
-          texture_width(0), texture_height(0) {}
-
-    Pixmap pixmap;
-    GLXPixmap glx_pixmap;
-    GLuint texture_id;
-    GLuint target_texture_id;
-
-    GLint texture_width;
-    GLint texture_height;
-};
-
-enum class VideoQuality {
-    MEDIUM,
-    HIGH,
-    ULTRA
-};
-
-static double clock_get_monotonic_seconds() {
-    struct timespec ts;
-    ts.tv_sec = 0;
-    ts.tv_nsec = 0;
-    clock_gettime(CLOCK_MONOTONIC, &ts);
-    return (double)ts.tv_sec + (double)ts.tv_nsec * 0.000000001;
+    fprintf(stderr, "  \"%.*s\"    (%dx%d+%d+%d)\n", monitor->name_len, monitor->name, size.x, size.y, pos.x, pos.y);
 }
 
-static bool x11_supports_composite_named_window_pixmap(Display *dpy) {
-    int extension_major;
-    int extension_minor;
-    if (!XCompositeQueryExtension(dpy, &extension_major, &extension_minor))
-        return false;
+typedef struct {
+    char *output_name; // set by get_first_output_callback via strdup, and only while it is still NULL
+} FirstOutputCallback; // userdata consumed by get_first_output_callback
 
-    int major_version;
-    int minor_version;
-    return XCompositeQueryVersion(dpy, &major_version, &minor_version) &&
-           (major_version > 0 || minor_version >= 2);
+static void get_first_output_callback(const gsr_monitor *monitor, void *userdata) { // stores a copy of the monitor name once
+    FirstOutputCallback *first = (FirstOutputCallback*)userdata;
+    if(first->output_name == NULL) // later invocations leave the stored name untouched
+        first->output_name = strdup(monitor->name); // heap copy; this function never frees it
 }
 
-static int x11_error_handler(Display *dpy, XErrorEvent *ev) {
-#if 0
-    char type_str[128];
-    XGetErrorText(dpy, ev->type, type_str, sizeof(type_str));
+typedef struct {
+    gsr_window *window; // in: queried for the display server type
+    vec2i position; // in: the point to look up
+    char *output_name; // out: strdup'ed name of the matching monitor; only written while it is NULL
+    vec2i monitor_pos; // out: position recorded for the matching monitor
+    vec2i monitor_size; // out: size recorded for the matching monitor
+} MonitorByPositionCallback; // userdata consumed by get_monitor_by_position_callback
+
+static void get_monitor_by_position_callback(const gsr_monitor *monitor, void *userdata) { // records the first monitor whose rectangle contains data->position
+    MonitorByPositionCallback *data = (MonitorByPositionCallback*)userdata;
+
+    vec2i monitor_position = monitor->pos;
+    vec2i monitor_size = monitor->size;
+    if(gsr_window_get_display_server(data->window) == GSR_DISPLAY_SERVER_WAYLAND) {
+        gsr_monitor_rotation monitor_rotation = GSR_MONITOR_ROT_0;
+        drm_monitor_get_display_server_data(data->window, monitor, &monitor_rotation, &monitor_position);
+        if(monitor_rotation == GSR_MONITOR_ROT_90 || monitor_rotation == GSR_MONITOR_ROT_270)
+            std::swap(monitor_size.x, monitor_size.y); // a quarter-turn rotation exchanges width and height
+    }
 
-    char major_opcode_str[128];
-    XGetErrorText(dpy, ev->type, major_opcode_str, sizeof(major_opcode_str));
+    if(!data->output_name && data->position.x >= monitor_position.x && data->position.x <= monitor_position.x + monitor_size.x // test against the rotation-adjusted size, in the same space as monitor_position
+        && data->position.y >= monitor_position.y && data->position.y <= monitor_position.y + monitor_size.y)
+    {
+        data->output_name = strdup(monitor->name); // heap copy; this function never frees it
+        data->monitor_pos = monitor_position;
+        data->monitor_size = monitor->size; // NOTE(review): still the unrotated size; confirm whether consumers expect the rotation-adjusted one
+    }
+}
 
-    char minor_opcode_str[128];
-    XGetErrorText(dpy, ev->type, minor_opcode_str, sizeof(minor_opcode_str));
+static char* av_error_to_string(int err) { // returns the thread_local av_error_buffer filled with a message for err
+    const bool described = av_strerror(err, av_error_buffer, sizeof(av_error_buffer)) >= 0;
+    if(!described) strcpy(av_error_buffer, "Unknown error"); // av_strerror reported failure for this code
+    return av_error_buffer;
+}
 
-    fprintf(stderr,
-        "X Error of failed request:  %s\n"
-        "Major opcode of failed request:  %d (%s)\n"
-        "Minor opcode of failed request:  %d (%s)\n"
-        "Serial number of failed request:  %d\n",
-            type_str,
-            ev->request_code, major_opcode_str,
-            ev->minor_code, minor_opcode_str);
-#endif
+static int x11_error_handler(Display*, XErrorEvent*) { // ignores both arguments and always returns 0
     return 0;
 }
 
-static int x11_io_error_handler(Display *dpy) {
+static int x11_io_error_handler(Display*) { // ignores its argument and always returns 0
     return 0;
 }
 
-static void cleanup_window_pixmap(Display *dpy, WindowPixmap &pixmap) {
-    if (pixmap.target_texture_id) {
-        glDeleteTextures(1, &pixmap.target_texture_id);
-        pixmap.target_texture_id = 0;
-    }
-
-    if (pixmap.texture_id) {
-        glDeleteTextures(1, &pixmap.texture_id);
-        pixmap.texture_id = 0;
-        pixmap.texture_width = 0;
-        pixmap.texture_height = 0;
-    }
-
-    if (pixmap.glx_pixmap) {
-        glXDestroyPixmap(dpy, pixmap.glx_pixmap);
-        glXReleaseTexImageEXT(dpy, pixmap.glx_pixmap, GLX_FRONT_EXT);
-        pixmap.glx_pixmap = None;
-    }
-
-    if (pixmap.pixmap) {
-        XFreePixmap(dpy, pixmap.pixmap);
-        pixmap.pixmap = None;
+static AVCodecID audio_codec_get_id(gsr_audio_codec audio_codec) { // maps a gsr_audio_codec value to the corresponding AVCodecID
+    switch(audio_codec) {
+        case GSR_AUDIO_CODEC_AAC:  return AV_CODEC_ID_AAC;
+        case GSR_AUDIO_CODEC_OPUS: return AV_CODEC_ID_OPUS;
+        case GSR_AUDIO_CODEC_FLAC: return AV_CODEC_ID_FLAC;
     }
+    assert(false); // only reached for a value without a case above
+    return AV_CODEC_ID_AAC; // fallback when asserts are compiled out
 }
 
-static bool recreate_window_pixmap(Display *dpy, Window window_id,
-                                   WindowPixmap &pixmap) {
-    cleanup_window_pixmap(dpy, pixmap);
-
-    XWindowAttributes attr;
-    if (!XGetWindowAttributes(dpy, window_id, &attr)) {
-        fprintf(stderr, "Failed to get window attributes\n");
-        return false;
-    }
+static AVSampleFormat audio_codec_get_sample_format(AVCodecContext *audio_codec_context, gsr_audio_codec audio_codec, const AVCodec *codec, bool mix_audio) { // chooses the AVSampleFormat for the given gsr audio codec
+    (void)audio_codec_context; // only read by the avcodec_get_supported_config branch below
+    switch(audio_codec) {
+        case GSR_AUDIO_CODEC_AAC: {
+            return AV_SAMPLE_FMT_FLTP;
+        }
+        case GSR_AUDIO_CODEC_OPUS: {
+            bool supports_s16 = false;
+            bool supports_flt = false;
+
+            #if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(61, 15, 0)
+            for(size_t i = 0; codec->sample_fmts && codec->sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) { // walks the list until the AV_SAMPLE_FMT_NONE entry
+                if(codec->sample_fmts[i] == AV_SAMPLE_FMT_S16) {
+                    supports_s16 = true;
+                } else if(codec->sample_fmts[i] == AV_SAMPLE_FMT_FLT) {
+                    supports_flt = true;
+                }
+            }
+            #else
+            const enum AVSampleFormat *sample_fmts = NULL;
+            if(avcodec_get_supported_config(audio_codec_context, codec, AV_CODEC_CONFIG_SAMPLE_FORMAT, 0, (const void**)&sample_fmts, NULL) >= 0) { // on failure both flags stay false
+                if(sample_fmts) {
+                    for(size_t i = 0; sample_fmts[i] != AV_SAMPLE_FMT_NONE; ++i) {
+                        if(sample_fmts[i] == AV_SAMPLE_FMT_S16) {
+                            supports_s16 = true;
+                        } else if(sample_fmts[i] == AV_SAMPLE_FMT_FLT) {
+                            supports_flt = true;
+                        }
+                    }
+                } else {
+                    // What a dumb API. It returns NULL if all formats are supported
+                    supports_s16 = true;
+                    supports_flt = true;
+                }
+            }
+            #endif
 
-    const int pixmap_config[] = {
-        GLX_BIND_TO_TEXTURE_RGB_EXT, True,
-        GLX_DRAWABLE_TYPE, GLX_PIXMAP_BIT | GLX_WINDOW_BIT,
-        GLX_BIND_TO_TEXTURE_TARGETS_EXT, GLX_TEXTURE_2D_BIT_EXT,
-        GLX_BUFFER_SIZE, 24,
-        GLX_RED_SIZE, 8,
-        GLX_GREEN_SIZE, 8,
-        GLX_BLUE_SIZE, 8,
-        GLX_ALPHA_SIZE, 0,
-        // GLX_Y_INVERTED_EXT, (int)GLX_DONT_CARE,
-        None};
-
-    const int pixmap_attribs[] = {GLX_TEXTURE_TARGET_EXT,
-                                  GLX_TEXTURE_2D_EXT,
-                                  GLX_TEXTURE_FORMAT_EXT,
-                                  GLX_TEXTURE_FORMAT_RGB_EXT,
-                                  None};
-
-    int c;
-    GLXFBConfig *configs = glXChooseFBConfig(dpy, 0, pixmap_config, &c);
-    if (!configs) {
-        fprintf(stderr, "Failed too choose fb config\n");
-        return false;
-    }
-    ScopedGLXFBConfig scoped_configs;
-    scoped_configs.configs = configs;
+            // Amix only works with float audio
+            if(mix_audio)
+                supports_s16 = false; // forces the flt (or fltp fallback) path below
 
-    bool found = false;
-    GLXFBConfig config;
-    for (int i = 0; i < c; i++) {
-        config = configs[i];
-        XVisualInfo *visual = glXGetVisualFromFBConfig(dpy, config);
-        if (!visual)
-            continue;
+            if(!supports_s16 && !supports_flt) {
+                fprintf(stderr, "gsr warning: opus audio codec is chosen but your ffmpeg version does not support s16/flt sample format and performance might be slightly worse.\n");
+                fprintf(stderr, "  You can either rebuild ffmpeg with libopus instead of the built-in opus, use the flatpak version of gpu screen recorder or record with aac audio codec instead (-ac aac).\n");
+                fprintf(stderr, "  Falling back to fltp audio sample format instead.\n");
+            }
 
-        if (attr.depth != visual->depth) {
-            XFree(visual);
-            continue;
+            if(supports_s16) // s16 takes priority over flt when both are available
+                return AV_SAMPLE_FMT_S16;
+            else if(supports_flt)
+                return AV_SAMPLE_FMT_FLT;
+            else
+                return AV_SAMPLE_FMT_FLTP; // the fallback announced by the warning above
+        }
+        case GSR_AUDIO_CODEC_FLAC: {
+            return AV_SAMPLE_FMT_S32;
         }
-        XFree(visual);
-        found = true;
-        break;
     }
+    assert(false); // only reached for a gsr_audio_codec value without a case above
+    return AV_SAMPLE_FMT_FLTP; // fallback when asserts are compiled out
+}
 
-    if(!found) {
-        fprintf(stderr, "No matching fb config found\n");
-        return false;
+static int64_t audio_codec_get_get_bitrate(gsr_audio_codec audio_codec) { // per-codec default; create_audio_codec_context assigns it to bit_rate when audio_bitrate is 0
+    switch(audio_codec) {
+        case GSR_AUDIO_CODEC_AAC:  return 160000;
+        case GSR_AUDIO_CODEC_OPUS: return 128000;
+        case GSR_AUDIO_CODEC_FLAC: return 128000;
     }
+    assert(false); // only reached for a value without a case above
+    return 128000; // fallback when asserts are compiled out
+}
 
-    Pixmap new_window_pixmap = XCompositeNameWindowPixmap(dpy, window_id);
-    if (!new_window_pixmap) {
-        fprintf(stderr, "Failed to get pixmap for window %ld\n", window_id);
-        return false;
+static AudioFormat audio_codec_context_get_audio_format(const AVCodecContext *audio_codec_context) { // maps the context's sample_fmt to an AudioFormat value
+    switch(audio_codec_context->sample_fmt) {
+        case AV_SAMPLE_FMT_FLT:   return F32;
+        case AV_SAMPLE_FMT_FLTP:  return S32; // NOTE(review): planar float maps to S32 rather than F32 — presumably intentional; confirm
+        case AV_SAMPLE_FMT_S16:   return S16;
+        case AV_SAMPLE_FMT_S32:   return S32;
+        default:                  return S16; // every other sample format falls back to S16
     }
+}
 
-    GLXPixmap glx_pixmap =
-        glXCreatePixmap(dpy, config, new_window_pixmap, pixmap_attribs);
-    if (!glx_pixmap) {
-        fprintf(stderr, "Failed to create glx pixmap\n");
-        XFreePixmap(dpy, new_window_pixmap);
-        return false;
+static AVSampleFormat audio_format_to_sample_format(const AudioFormat audio_format) { // maps an AudioFormat value to an AVSampleFormat
+    switch(audio_format) {
+        case S16:   return AV_SAMPLE_FMT_S16;
+        case S32:   return AV_SAMPLE_FMT_S32;
+        case F32:   return AV_SAMPLE_FMT_FLT;
     }
-
-    pixmap.pixmap = new_window_pixmap;
-    pixmap.glx_pixmap = glx_pixmap;
-
-    //glEnable(GL_TEXTURE_2D);
-    glGenTextures(1, &pixmap.texture_id);
-    glBindTexture(GL_TEXTURE_2D, pixmap.texture_id);
-
-    // glEnable(GL_BLEND);
-    // glBlendFunc(GL_SRC_ALPHA, GL_ONE_MINUS_SRC_ALPHA);
-
-    glXBindTexImageEXT(dpy, pixmap.glx_pixmap, GLX_FRONT_EXT, NULL);
-    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER,
-                    GL_NEAREST); // GL_LINEAR );
-    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER,
-                    GL_NEAREST); // GL_LINEAR);//GL_LINEAR_MIPMAP_LINEAR );
-    //glTexEnvf(GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, GL_MODULATE);
-
-    glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_WIDTH,
-                             &pixmap.texture_width);
-    glGetTexLevelParameteriv(GL_TEXTURE_2D, 0, GL_TEXTURE_HEIGHT,
-                             &pixmap.texture_height);
-
-    if(pixmap.texture_width == 0 || pixmap.texture_height == 0) {
-        pixmap.texture_width = attr.width;
-        pixmap.texture_height = attr.height;
-        fprintf(stderr, "Warning: failed to get texture size. You are probably running an unsupported compositor and recording the selected window doesn't work at the moment. This could also happen if you are trying to record a window with client-side decorations (GNOME issue). A black window will be displayed instead. A workaround is to record the whole monitor (which use NvFBC).\n");
-    }
-
-    fprintf(stderr, "texture width: %d, height: %d\n", pixmap.texture_width,
-           pixmap.texture_height);
-
-    // Generating this second texture is needed because
-    // cuGraphicsGLRegisterImage cant be used with the texture that is mapped
-    // directly to the pixmap.
-    // TODO: Investigate if it's somehow possible to use the pixmap texture
-    // directly, this should improve performance since only less image copy is
-    // then needed every frame.
-    glGenTextures(1, &pixmap.target_texture_id);
-    glBindTexture(GL_TEXTURE_2D, pixmap.target_texture_id);
-    glTexImage2D(GL_TEXTURE_2D, 0, GL_RGB, pixmap.texture_width,
-                 pixmap.texture_height, 0, GL_RGB, GL_UNSIGNED_BYTE, NULL);
-    int err2 = glGetError();
-    //fprintf(stderr, "error: %d\n", err2);
-    // glXBindTexImageEXT(dpy, pixmap.glx_pixmap, GLX_FRONT_EXT, NULL);
-    // glGenerateTextureMipmapEXT(glxpixmap, GL_TEXTURE_2D);
-
-    // glGenerateMipmap(GL_TEXTURE_2D);
-
-    // glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE );
-    // glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE );
-
-    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER,
-                    GL_NEAREST); // GL_LINEAR );
-    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER,
-                    GL_NEAREST); // GL_LINEAR);//GL_LINEAR_MIPMAP_LINEAR );
-    //glTexEnvf(GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, GL_MODULATE);
-
-    glBindTexture(GL_TEXTURE_2D, 0);
-
-    return pixmap.texture_id != 0 && pixmap.target_texture_id != 0;
-}
-
-// |stream| is only required for non-replay mode
-static void receive_frames(AVCodecContext *av_codec_context, int stream_index, AVStream *stream, AVFrame *frame,
-                           AVFormatContext *av_format_context,
-                           double replay_start_time,
-                           std::deque<AVPacket> &frame_data_queue,
-                           int replay_buffer_size_secs,
-                           bool &frames_erased,
-						   std::mutex &write_output_mutex) {
-    AVPacket av_packet;
-    memset(&av_packet, 0, sizeof(av_packet));
-    for (;;) {
-        av_packet.data = NULL;
-        av_packet.size = 0;
-        int res = avcodec_receive_packet(av_codec_context, &av_packet);
-        if (res == 0) { // we have a packet, send the packet to the muxer
-            av_packet.stream_index = stream_index;
-            av_packet.pts = av_packet.dts = frame->pts;
-
-			std::lock_guard<std::mutex> lock(write_output_mutex);
-            if(replay_buffer_size_secs != -1) {
-                double time_now = glfwGetTime();
-                double replay_time_elapsed = time_now - replay_start_time;
-
-                AVPacket new_pack;
-                av_packet_move_ref(&new_pack, &av_packet);
-                frame_data_queue.push_back(std::move(new_pack));
-                if(replay_time_elapsed >= replay_buffer_size_secs) {
-                    av_packet_unref(&frame_data_queue.front());
-                    frame_data_queue.pop_front();
-                    frames_erased = true;
-                }
-            } else {
-                av_packet_rescale_ts(&av_packet, av_codec_context->time_base, stream->time_base);
-                av_packet.stream_index = stream->index;
-                int ret = av_interleaved_write_frame(av_format_context, &av_packet);
-                if(ret < 0) {
-                    fprintf(stderr, "Error: Failed to write frame index %d to muxer, reason: %s (%d)\n", av_packet.stream_index, av_error_to_string(ret), ret);
-                }
-            }
-            av_packet_unref(&av_packet);
-        } else if (res == AVERROR(EAGAIN)) { // we have no packet
-                                             // fprintf(stderr, "No packet!\n");
-            break;
-        } else if (res == AVERROR_EOF) { // this is the end of the stream
-            fprintf(stderr, "End of stream!\n");
-            break;
-        } else {
-            fprintf(stderr, "Unexpected error: %d\n", res);
-            break;
-        }
-    }
-    //av_packet_unref(&av_packet);
+    assert(false); // only reached for a value without a case above
+    return AV_SAMPLE_FMT_S16; // fallback when asserts are compiled out
 }
 
-static AVCodecContext* create_audio_codec_context(AVFormatContext *av_format_context, int fps) {
-    const AVCodec *codec = avcodec_find_encoder(AV_CODEC_ID_AAC);
+static AVCodecContext* create_audio_codec_context(int /*fps*/, gsr_audio_codec audio_codec, bool mix_audio, int64_t audio_bitrate) { // allocates and fills a 2-channel audio encoder context; the fps argument is unused; exits the process if the encoder or the context is unavailable
+    const AVCodec *codec = avcodec_find_encoder(audio_codec_get_id(audio_codec));
     if (!codec) {
-        fprintf(
-            stderr,
-            "Error: Could not find aac encoder\n");
-        exit(1);
+        fprintf(stderr, "gsr error: Could not find %s audio encoder\n", audio_codec_get_name(audio_codec));
+        _exit(1);
     }
 
     AVCodecContext *codec_context = avcodec_alloc_context3(codec);
 
     assert(codec->type == AVMEDIA_TYPE_AUDIO);
-    /*
-    codec_context->sample_fmt = (*codec)->sample_fmts
-                                    ? (*codec)->sample_fmts[0]
-                                    : AV_SAMPLE_FMT_FLTP;
-    */
-	codec_context->codec_id = AV_CODEC_ID_AAC;
-    codec_context->sample_fmt = AV_SAMPLE_FMT_FLTP;
-    //codec_context->bit_rate = 64000;
-    codec_context->sample_rate = 48000;
+    if(!codec_context) { fprintf(stderr, "gsr error: Failed to allocate %s audio codec context\n", audio_codec_get_name(audio_codec)); _exit(1); } // the allocation result is dereferenced on the following lines
+    codec_context->codec_id = codec->id;
+    codec_context->sample_fmt = audio_codec_get_sample_format(codec_context, audio_codec, codec, mix_audio);
+    codec_context->bit_rate = audio_bitrate == 0 ? audio_codec_get_get_bitrate(audio_codec) : audio_bitrate; // 0 selects the per-codec default
+    codec_context->sample_rate = AUDIO_SAMPLE_RATE;
+    if(audio_codec == GSR_AUDIO_CODEC_AAC) {
+#if LIBAVCODEC_VERSION_MAJOR < 62
+        codec_context->profile = FF_PROFILE_AAC_LOW;
+#else
+        codec_context->profile = AV_PROFILE_AAC_LOW;
+#endif
+    }
+#if LIBAVCODEC_VERSION_MAJOR < 60
     codec_context->channel_layout = AV_CH_LAYOUT_STEREO;
     codec_context->channels = 2;
+#else
+    av_channel_layout_default(&codec_context->ch_layout, 2);
+#endif
 
     codec_context->time_base.num = 1;
-    codec_context->time_base.den = AV_TIME_BASE;
-    codec_context->framerate.num = fps;
-    codec_context->framerate.den = 1;
-
-    // Some formats want stream headers to be seperate
-    if (av_format_context->oformat->flags & AVFMT_GLOBALHEADER)
-        av_format_context->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
+    codec_context->time_base.den = codec_context->sample_rate; // time base is 1/sample_rate
+    codec_context->thread_count = 1;
+    codec_context->flags |= AV_CODEC_FLAG_GLOBAL_HEADER; // set unconditionally, without consulting any output format
 
     return codec_context;
 }
 
-static AVCodecContext *create_video_codec_context(AVFormatContext *av_format_context, 
-                            VideoQuality video_quality,
-                            int record_width, int record_height,
-                            int fps, bool use_hevc) {
-    const AVCodec *codec = avcodec_find_encoder_by_name(use_hevc ? "hevc_nvenc" : "h264_nvenc");
-    if (!codec) {
-        codec = avcodec_find_encoder_by_name(use_hevc ? "nvenc_hevc" : "nvenc_h264");
-    }
-    if (!codec) {
-        fprintf(
-            stderr,
-            "Error: Could not find %s encoder\n", use_hevc ? "hevc" : "h264");
-        exit(1);
+static int vbr_get_quality_parameter(AVCodecContext *codec_context, gsr_video_quality video_quality, bool hdr) { // returns the value create_video_codec_context assigns to both qmin and qmax in VBR mode
+    // 8 bit / 10 bit = 80%
+    const float qp_multiply = hdr ? 8.0f/10.0f : 1.0f;
+    if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                return 160 * qp_multiply; // the float product is converted to int by the return type
+            case GSR_VIDEO_QUALITY_HIGH:
+                return 130 * qp_multiply;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                return 110 * qp_multiply;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                return 90 * qp_multiply;
+        }
+    } else if(codec_context->codec_id == AV_CODEC_ID_H264) { // same table as the HEVC and VP8/VP9 branches below
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                return 35 * qp_multiply;
+            case GSR_VIDEO_QUALITY_HIGH:
+                return 30 * qp_multiply;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                return 25 * qp_multiply;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                return 22 * qp_multiply;
+        }
+    } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                return 35 * qp_multiply;
+            case GSR_VIDEO_QUALITY_HIGH:
+                return 30 * qp_multiply;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                return 25 * qp_multiply;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                return 22 * qp_multiply;
+        }
+    } else if(codec_context->codec_id == AV_CODEC_ID_VP8 || codec_context->codec_id == AV_CODEC_ID_VP9) {
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                return 35 * qp_multiply;
+            case GSR_VIDEO_QUALITY_HIGH:
+                return 30 * qp_multiply;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                return 25 * qp_multiply;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                return 22 * qp_multiply;
+        }
     }
+    assert(false); // reached for a codec id or quality value not handled above
+    return 22 * qp_multiply; // fallback when asserts are compiled out
+}
 
+static AVCodecContext *create_video_codec_context(AVPixelFormat pix_fmt, const AVCodec *codec, const gsr_egl &egl, const args_parser &arg_parser) {
+    const bool use_software_video_encoder = arg_parser.video_encoder == GSR_VIDEO_ENCODER_HW_CPU;
+    const bool hdr = video_codec_is_hdr(arg_parser.video_codec);
     AVCodecContext *codec_context = avcodec_alloc_context3(codec);
 
     //double fps_ratio = (double)fps / 30.0;
 
     assert(codec->type == AVMEDIA_TYPE_VIDEO);
     codec_context->codec_id = codec->id;
-    codec_context->width = record_width & ~1;
-    codec_context->height = record_height & ~1;
-	codec_context->bit_rate = 12500000 + (codec_context->width * codec_context->height) / 2;
     // Timebase: This is the fundamental unit of time (in seconds) in terms
     // of which frame timestamps are represented. For fixed-fps content,
     // timebase should be 1/framerate and timestamp increments should be
     // identical to 1
     codec_context->time_base.num = 1;
-    codec_context->time_base.den = AV_TIME_BASE;
-    codec_context->framerate.num = fps;
+    codec_context->time_base.den = arg_parser.framerate_mode == GSR_FRAMERATE_MODE_CONSTANT ? arg_parser.fps : AV_TIME_BASE;
+    codec_context->framerate.num = arg_parser.fps;
     codec_context->framerate.den = 1;
     codec_context->sample_aspect_ratio.num = 0;
     codec_context->sample_aspect_ratio.den = 0;
-    codec_context->gop_size = fps * 2;
+    if(arg_parser.low_latency_recording) {
+        codec_context->flags |= (AV_CODEC_FLAG_CLOSED_GOP | AV_CODEC_FLAG_LOW_DELAY);
+        codec_context->flags2 |= AV_CODEC_FLAG2_FAST;
+        //codec_context->gop_size = std::numeric_limits<int>::max();
+        //codec_context->keyint_min = std::numeric_limits<int>::max();
+        codec_context->gop_size = arg_parser.fps * arg_parser.keyint;
+    } else {
+        // High values reduce file size but increases time it takes to seek
+        codec_context->gop_size = arg_parser.fps * arg_parser.keyint;
+    }
     codec_context->max_b_frames = 0;
-    codec_context->pix_fmt = AV_PIX_FMT_CUDA;
-    codec_context->color_range = AVCOL_RANGE_JPEG;
-    switch(video_quality) {
-        case VideoQuality::MEDIUM:
-	        codec_context->bit_rate = 10000000 + (codec_context->width * codec_context->height) / 2;
-            if(use_hevc) {
-                codec_context->qmin = 20;
-                codec_context->qmax = 35;
-            } else {
-                codec_context->qmin = 5;
-                codec_context->qmax = 20;
+    codec_context->pix_fmt = pix_fmt;
+    codec_context->color_range = arg_parser.color_range == GSR_COLOR_RANGE_LIMITED ? AVCOL_RANGE_MPEG : AVCOL_RANGE_JPEG;
+    if(hdr) {
+        codec_context->color_primaries = AVCOL_PRI_BT2020;
+        codec_context->color_trc = AVCOL_TRC_SMPTE2084;
+        codec_context->colorspace = AVCOL_SPC_BT2020_NCL;
+    } else {
+        codec_context->color_primaries = AVCOL_PRI_BT709;
+        codec_context->color_trc = AVCOL_TRC_BT709;
+        codec_context->colorspace = AVCOL_SPC_BT709;
+    }
+    //codec_context->chroma_sample_location = AVCHROMA_LOC_CENTER;
+    if(codec->id == AV_CODEC_ID_HEVC)
+        codec_context->codec_tag = MKTAG('h', 'v', 'c', '1'); // QuickTime on MacOS requires this or the video wont be playable
+
+    if(arg_parser.bitrate_mode == GSR_BITRATE_MODE_CBR) {
+        codec_context->bit_rate = arg_parser.video_bitrate;
+        codec_context->rc_max_rate = codec_context->bit_rate;
+        //codec_context->rc_min_rate = codec_context->bit_rate;
+        codec_context->rc_buffer_size = codec_context->bit_rate;//codec_context->bit_rate / 10;
+        codec_context->rc_initial_buffer_occupancy = 0;//codec_context->bit_rate;//codec_context->bit_rate * 1000;
+    } else if(arg_parser.bitrate_mode == GSR_BITRATE_MODE_VBR) {
+        const int quality = vbr_get_quality_parameter(codec_context, arg_parser.video_quality, hdr);
+        switch(arg_parser.video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                codec_context->qmin = quality;
+                codec_context->qmax = quality;
+                codec_context->bit_rate = 100000;//4500000 + (codec_context->width * codec_context->height)*0.75;
+                break;
+            case GSR_VIDEO_QUALITY_HIGH:
+                codec_context->qmin = quality;
+                codec_context->qmax = quality;
+                codec_context->bit_rate = 100000;//10000000-9000000 + (codec_context->width * codec_context->height)*0.75;
+                break;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                codec_context->qmin = quality;
+                codec_context->qmax = quality;
+                codec_context->bit_rate = 100000;//10000000-9000000 + (codec_context->width * codec_context->height)*0.75;
+                break;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                codec_context->qmin = quality;
+                codec_context->qmax = quality;
+                codec_context->bit_rate = 100000;//10000000-9000000 + (codec_context->width * codec_context->height)*0.75;
+                break;
+        }
+
+        codec_context->rc_max_rate = codec_context->bit_rate;
+        //codec_context->rc_min_rate = codec_context->bit_rate;
+        codec_context->rc_buffer_size = codec_context->bit_rate;//codec_context->bit_rate / 10;
+        codec_context->rc_initial_buffer_occupancy = codec_context->bit_rate;//codec_context->bit_rate * 1000;
+    } else {
+        //codec_context->rc_buffer_size = 50000 * 1000;
+    }
+    //codec_context->profile = FF_PROFILE_H264_MAIN;
+    if (codec_context->codec_id == AV_CODEC_ID_MPEG1VIDEO)
+        codec_context->mb_decision = 2;
+
+    if(!use_software_video_encoder && egl.gpu_info.vendor != GSR_GPU_VENDOR_NVIDIA && arg_parser.bitrate_mode != GSR_BITRATE_MODE_CBR) {
+        // 8 bit / 10 bit = 80%, and increase it even more
+        const float quality_multiply = hdr ? (8.0f/10.0f * 0.7f) : 1.0f;
+        if(codec_context->codec_id == AV_CODEC_ID_AV1 || codec_context->codec_id == AV_CODEC_ID_H264 || codec_context->codec_id == AV_CODEC_ID_HEVC) {
+            switch(arg_parser.video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    codec_context->global_quality = 130 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    codec_context->global_quality = 110 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    codec_context->global_quality = 95 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    codec_context->global_quality = 85 * quality_multiply;
+                    break;
             }
-            //av_opt_set(codec_context->priv_data, "preset", "slow", 0);
-            //av_opt_set(codec_context->priv_data, "profile", "high", 0);
-            //codec_context->profile = FF_PROFILE_H264_HIGH;
-            //av_opt_set(codec_context->priv_data, "preset", "p4", 0);
-            break;
-        case VideoQuality::HIGH:
-            if(use_hevc) {
-                codec_context->qmin = 17;
-                codec_context->qmax = 30;
-            } else {
-                codec_context->qmin = 5;
-                codec_context->qmax = 15;
+        } else if(codec_context->codec_id == AV_CODEC_ID_VP8) {
+            switch(arg_parser.video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    codec_context->global_quality = 35 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    codec_context->global_quality = 30 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    codec_context->global_quality = 25 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    codec_context->global_quality = 10 * quality_multiply;
+                    break;
             }
-            //av_opt_set(codec_context->priv_data, "preset", "slow", 0);
-            //av_opt_set(codec_context->priv_data, "profile", "high", 0);
-            //codec_context->profile = FF_PROFILE_H264_HIGH;
-            //av_opt_set(codec_context->priv_data, "preset", "p5", 0);
-            break;
-        case VideoQuality::ULTRA:
-	        codec_context->bit_rate = 15000000 + (codec_context->width * codec_context->height) / 2;
-            if(use_hevc) {
-                codec_context->qmin = 16;
-                codec_context->qmax = 25;
-            } else {
-                codec_context->qmin = 3;
-                codec_context->qmax = 13;
+        } else if(codec_context->codec_id == AV_CODEC_ID_VP9) {
+            switch(arg_parser.video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    codec_context->global_quality = 35 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    codec_context->global_quality = 30 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    codec_context->global_quality = 25 * quality_multiply;
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    codec_context->global_quality = 10 * quality_multiply;
+                    break;
             }
-            //av_opt_set(codec_context->priv_data, "preset", "veryslow", 0);
-            //av_opt_set(codec_context->priv_data, "profile", "high", 0);
-            //codec_context->profile = FF_PROFILE_H264_HIGH;
-            //av_opt_set(codec_context->priv_data, "preset", "p7", 0);
-            break;
+        }
     }
-    if (codec_context->codec_id == AV_CODEC_ID_MPEG1VIDEO)
-        codec_context->mb_decision = 2;
 
-    // stream->time_base = codec_context->time_base;
-    // codec_context->ticks_per_frame = 30;
-    //av_opt_set(codec_context->priv_data, "tune", "hq", 0);
-    //av_opt_set(codec_context->priv_data, "rc", "vbr", 0);
+    av_opt_set_int(codec_context->priv_data, "b_ref_mode", 0, 0);
+    //av_opt_set_int(codec_context->priv_data, "cbr", true, 0);
+
+    if(egl.gpu_info.vendor != GSR_GPU_VENDOR_NVIDIA) {
+        // TODO: More options, better options
+        //codec_context->bit_rate = codec_context->width * codec_context->height;
+        switch(arg_parser.bitrate_mode) {
+            case GSR_BITRATE_MODE_QP: {
+                if(video_codec_is_vulkan(arg_parser.video_codec))
+                    av_opt_set(codec_context->priv_data, "rc_mode", "cqp", 0);
+                else if(egl.gpu_info.vendor == GSR_GPU_VENDOR_NVIDIA)
+                    av_opt_set(codec_context->priv_data, "rc", "constqp", 0);
+                else
+                    av_opt_set(codec_context->priv_data, "rc_mode", "CQP", 0);
+                break;
+            }
+            case GSR_BITRATE_MODE_VBR: {
+                if(video_codec_is_vulkan(arg_parser.video_codec))
+                    av_opt_set(codec_context->priv_data, "rc_mode", "vbr", 0);
+                else if(egl.gpu_info.vendor == GSR_GPU_VENDOR_NVIDIA)
+                    av_opt_set(codec_context->priv_data, "rc", "vbr", 0);
+                else
+                    av_opt_set(codec_context->priv_data, "rc_mode", "VBR", 0);
+                break;
+            }
+            case GSR_BITRATE_MODE_CBR: {
+                if(video_codec_is_vulkan(arg_parser.video_codec))
+                    av_opt_set(codec_context->priv_data, "rc_mode", "cbr", 0);
+                else if(egl.gpu_info.vendor == GSR_GPU_VENDOR_NVIDIA)
+                    av_opt_set(codec_context->priv_data, "rc", "cbr", 0);
+                else
+                    av_opt_set(codec_context->priv_data, "rc_mode", "CBR", 0);
+                break;
+            }
+        }
+        //codec_context->global_quality = 4;
+        //codec_context->compression_level = 2;
+    }
 
-    // Some formats want stream headers to be seperate
-    if (av_format_context->oformat->flags & AVFMT_GLOBALHEADER)
-        av_format_context->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
+    //av_opt_set(codec_context->priv_data, "bsf", "hevc_metadata=colour_primaries=9:transfer_characteristics=16:matrix_coefficients=9", 0);
+
+    codec_context->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
 
     return codec_context;
 }
 
-static AVFrame* open_audio(AVCodecContext *audio_codec_context) {
+static void open_audio(AVCodecContext *audio_codec_context) { // Opens the audio encoder attached to |audio_codec_context|; prints the reason and terminates the process if avcodec_open2 fails
+    AVDictionary *options = nullptr;
+    av_dict_set(&options, "strict", "experimental", 0); // Handed to avcodec_open2 below; presumably permits encoders flagged experimental - TODO confirm
+
     int ret;
-    ret = avcodec_open2(audio_codec_context, audio_codec_context->codec, nullptr);
+    ret = avcodec_open2(audio_codec_context, audio_codec_context->codec, &options); // NOTE(review): |options| is not released with av_dict_free anywhere in this function
     if(ret < 0) {
         fprintf(stderr, "failed to open codec, reason: %s\n", av_error_to_string(ret));
-        exit(1);
+        _exit(1); // _exit rather than exit; presumably to avoid running atexit handlers/static destructors - TODO confirm
     }
+}
 
+static AVFrame* create_audio_frame(AVCodecContext *audio_codec_context) { // Allocates an AVFrame whose sample rate, sample count, format and channel setup are copied from |audio_codec_context|; terminates the process on allocation failure
     AVFrame *frame = av_frame_alloc();
     if(!frame) {
         fprintf(stderr, "failed to allocate audio frame\n");
-        exit(1);
+        _exit(1); // Same termination style as the other failure paths in this function
     }
 
+    frame->sample_rate = audio_codec_context->sample_rate; // Copied from the codec context like the fields below
     frame->nb_samples = audio_codec_context->frame_size;
     frame->format = audio_codec_context->sample_fmt;
-	frame->channels = audio_codec_context->channels;
+#if LIBAVCODEC_VERSION_MAJOR < 60 // libavcodec major version below 60: use the channels/channel_layout fields
+    frame->channels = audio_codec_context->channels;
     frame->channel_layout = audio_codec_context->channel_layout;
+#else // libavcodec major version 60 or newer: use the ch_layout field instead
+    av_channel_layout_copy(&frame->ch_layout, &audio_codec_context->ch_layout); // NOTE(review): the return value is ignored
+#endif
 
-    ret = av_frame_get_buffer(frame, 0);
+    int ret = av_frame_get_buffer(frame, 0); // Allocates the sample buffers for the frame configured above
     if(ret < 0) {
         fprintf(stderr, "failed to allocate audio data buffers, reason: %s\n", av_error_to_string(ret));
-        exit(1);
+        _exit(1); // Terminate immediately; the frame is not freed on this path
     }
 
     return frame;
 }
 
-static void open_video(AVCodecContext *codec_context,
-                       WindowPixmap &window_pixmap, AVBufferRef **device_ctx,
-                       CUgraphicsResource *cuda_graphics_resource, CUcontext cuda_context) {
-    int ret;
+static void dict_set_profile(AVCodecContext *codec_context, gsr_gpu_vendor vendor, gsr_color_depth color_depth, gsr_video_codec video_codec, AVDictionary **options) { // Adds the "profile" entry (or "highbitdepth" for NVIDIA AV1) matching codec_context->codec_id to |options|; codec ids other than H264/AV1/HEVC add nothing
+    #if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(61, 17, 100) // Older libavcodec: profiles are given by name; |video_codec| is not read in this branch
+    if(codec_context->codec_id == AV_CODEC_ID_H264) {
+        // TODO: Only for vaapi
+        //if(color_depth == GSR_COLOR_DEPTH_10_BITS)
+        //    av_dict_set(options, "profile", "high10", 0);
+        //else
+        av_dict_set(options, "profile", "high", 0); // H264 always gets "high", regardless of |color_depth|
+    } else if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+        if(vendor == GSR_GPU_VENDOR_NVIDIA) {
+            if(color_depth == GSR_COLOR_DEPTH_10_BITS)
+                av_dict_set_int(options, "highbitdepth", 1, 0); // NVIDIA AV1: no profile entry, only this flag and only for 10-bit
+        } else {
+            av_dict_set(options, "profile", "main", 0); // TODO: use professional instead?
+        }
+    } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+        if(color_depth == GSR_COLOR_DEPTH_10_BITS)
+            av_dict_set(options, "profile", "main10", 0);
+        else
+            av_dict_set(options, "profile", "main", 0);
+    }
+    #else // libavcodec 61.17.100 or newer: profiles are given as integers
+    const bool use_nvidia_values = vendor == GSR_GPU_VENDOR_NVIDIA && !video_codec_is_vulkan(video_codec); // NVIDIA with a non-Vulkan codec gets literal numbers instead of the AV_PROFILE_* constants
+    if(codec_context->codec_id == AV_CODEC_ID_H264) {
+        // TODO: Only for vaapi
+        //if(color_depth == GSR_COLOR_DEPTH_10_BITS)
+        //    av_dict_set_int(options, "profile", AV_PROFILE_H264_HIGH_10, 0);
+        //else
+        av_dict_set_int(options, "profile", use_nvidia_values ? 2 : AV_PROFILE_H264_HIGH, 0); // presumably 2 is the encoder-specific value for the high profile on NVIDIA - TODO confirm
+    } else if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+        if(use_nvidia_values) {
+            if(color_depth == GSR_COLOR_DEPTH_10_BITS)
+                av_dict_set_int(options, "highbitdepth", 1, 0); // Same handling as in the older-libavcodec branch
+        } else {
+            av_dict_set_int(options, "profile", AV_PROFILE_AV1_MAIN, 0); // TODO: use professional instead?
+        }
+    } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+        if(color_depth == GSR_COLOR_DEPTH_10_BITS)
+            av_dict_set_int(options, "profile", use_nvidia_values ? 1 : AV_PROFILE_HEVC_MAIN_10, 0); // presumably 1 is the encoder-specific main10 value on NVIDIA - TODO confirm
+        else
+            av_dict_set_int(options, "profile", use_nvidia_values ? 0 : AV_PROFILE_HEVC_MAIN, 0); // presumably 0 is the encoder-specific main value on NVIDIA - TODO confirm
+    }
+    #endif
+}
 
-    *device_ctx = av_hwdevice_ctx_alloc(AV_HWDEVICE_TYPE_CUDA);
-    if(!*device_ctx) {
-        fprintf(stderr, "Error: Failed to create hardware device context\n");
-        exit(1);
+static void video_software_set_qp(AVCodecContext *codec_context, gsr_video_quality video_quality, bool hdr, AVDictionary **options) { // Adds a "qp" entry to |options| chosen from the codec id and |video_quality|, scaled down when |hdr| is set
+    // 8 bit / 10 bit = 80%
+    const float qp_multiply = hdr ? 8.0f/10.0f : 1.0f;
+    if(codec_context->codec_id == AV_CODEC_ID_AV1) { // Same values as the fallback branch at the bottom
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                av_dict_set_int(options, "qp", 35 * qp_multiply, 0); // The float product is converted to the integer argument of av_dict_set_int
+                break;
+            case GSR_VIDEO_QUALITY_HIGH:
+                av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                break;
+        }
+    } else if(codec_context->codec_id == AV_CODEC_ID_H264) { // Differs from the other branches only in the medium value (34 instead of 35)
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                av_dict_set_int(options, "qp", 34 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_HIGH:
+                av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                break;
+        }
+    } else { // Every other codec id
+        switch(video_quality) {
+            case GSR_VIDEO_QUALITY_MEDIUM:
+                av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_HIGH:
+                av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_VERY_HIGH:
+                av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                break;
+            case GSR_VIDEO_QUALITY_ULTRA:
+                av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                break;
+        }
     }
+}
+
+static void open_video_software(AVCodecContext *codec_context, const args_parser &arg_parser) { // Opens the software video encoder for |codec_context| with a fixed set of options; terminates the process if avcodec_open2 fails
+    const bool hdr = video_codec_is_hdr(arg_parser.video_codec);
+    AVDictionary *options = nullptr;
 
-    AVHWDeviceContext *hw_device_context = (AVHWDeviceContext *)(*device_ctx)->data;
-    AVCUDADeviceContext *cuda_device_context = (AVCUDADeviceContext *)hw_device_context->hwctx;
-    cuda_device_context->cuda_ctx = cuda_context;
-    if(av_hwdevice_ctx_init(*device_ctx) < 0) {
-        fprintf(stderr, "Error: Failed to create hardware device context\n");
-        exit(1);
+    if(arg_parser.bitrate_mode == GSR_BITRATE_MODE_QP) // A "qp" entry is only added in QP bitrate mode
+        video_software_set_qp(codec_context, arg_parser.video_quality, hdr, &options);
+
+    av_dict_set(&options, "preset", "veryfast", 0); // Set for every codec id, not only H264
+    av_dict_set(&options, "tune", "film", 0);
+
+    if(codec_context->codec_id == AV_CODEC_ID_H264) {
+        av_dict_set(&options, "coder", "cabac", 0); // TODO: cavlc is faster than cabac but worse compression. Which to use?
     }
 
-    AVBufferRef *frame_context = av_hwframe_ctx_alloc(*device_ctx);
-    if (!frame_context) {
-        fprintf(stderr, "Error: Failed to create hwframe context\n");
-        exit(1);
+    av_dict_set(&options, "strict", "experimental", 0); // presumably permits encoders flagged experimental - TODO confirm
+
+    int ret = avcodec_open2(codec_context, codec_context->codec, &options); // NOTE(review): |options| is not released with av_dict_free anywhere in this function
+    if (ret < 0) {
+        fprintf(stderr, "gsr error: Could not open video codec: %s\n", av_error_to_string(ret));
+        _exit(1); // Terminate immediately on failure
     }
+}
 
-    AVHWFramesContext *hw_frame_context =
-        (AVHWFramesContext *)frame_context->data;
-    hw_frame_context->width = codec_context->width;
-    hw_frame_context->height = codec_context->height;
-    hw_frame_context->sw_format = AV_PIX_FMT_0RGB32;
-    hw_frame_context->format = codec_context->pix_fmt;
-    hw_frame_context->device_ref = *device_ctx;
-    hw_frame_context->device_ctx = (AVHWDeviceContext *)(*device_ctx)->data;
+static void video_set_rc(gsr_video_codec video_codec, gsr_gpu_vendor vendor, gsr_bitrate_mode bitrate_mode, AVDictionary **options) { // Adds the rate-control entry for |bitrate_mode| to |options|: Vulkan codecs use "rc_mode" with lowercase values, NVIDIA uses "rc", everything else uses "rc_mode" with uppercase values
+    switch(bitrate_mode) {
+        case GSR_BITRATE_MODE_QP: {
+            if(video_codec_is_vulkan(video_codec)) // The Vulkan check comes first, so it wins even when |vendor| is NVIDIA
+                av_dict_set(options, "rc_mode", "cqp", 0);
+            else if(vendor == GSR_GPU_VENDOR_NVIDIA)
+                av_dict_set(options, "rc", "constqp", 0);
+            else
+                av_dict_set(options, "rc_mode", "CQP", 0);
+            break;
+        }
+        case GSR_BITRATE_MODE_VBR: {
+            if(video_codec_is_vulkan(video_codec))
+                av_dict_set(options, "rc_mode", "vbr", 0);
+            else if(vendor == GSR_GPU_VENDOR_NVIDIA)
+                av_dict_set(options, "rc", "vbr", 0);
+            else
+                av_dict_set(options, "rc_mode", "VBR", 0);
+            break;
+        }
+        case GSR_BITRATE_MODE_CBR: {
+            if(video_codec_is_vulkan(video_codec))
+                av_dict_set(options, "rc_mode", "cbr", 0);
+            else if(vendor == GSR_GPU_VENDOR_NVIDIA)
+                av_dict_set(options, "rc", "cbr", 0);
+            else
+                av_dict_set(options, "rc_mode", "CBR", 0);
+            break;
+        }
+    } // Any other |bitrate_mode| value adds nothing
+}
 
-    if (av_hwframe_ctx_init(frame_context) < 0) {
-        fprintf(stderr, "Error: Failed to initialize hardware frame context "
-                        "(note: ffmpeg version needs to be > 4.0\n");
-        exit(1);
+static void video_hardware_set_qp(AVCodecContext *codec_context, gsr_video_quality video_quality, gsr_gpu_vendor vendor, bool hdr, AVDictionary **options) { // Adds a "qp" entry to |options| chosen from vendor, codec id and |video_quality|; every switch below currently uses 35/30/25/22
+    // 8 bit / 10 bit = 80%
+    const float qp_multiply = hdr ? 8.0f/10.0f : 1.0f;
+    if(vendor == GSR_GPU_VENDOR_NVIDIA) {
+        // TODO: Test if these should be in the same range as vaapi
+        if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0); // The float product is converted to the integer argument of av_dict_set_int
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        } else if(codec_context->codec_id == AV_CODEC_ID_H264) {
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        } else if(codec_context->codec_id == AV_CODEC_ID_VP8 || codec_context->codec_id == AV_CODEC_ID_VP9) {
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        }
+    } else { // Any vendor other than NVIDIA
+        if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+            // Using global_quality option
+        } else if(codec_context->codec_id == AV_CODEC_ID_H264) { // AV1 above adds no "qp" entry for non-NVIDIA vendors
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        } else if(codec_context->codec_id == AV_CODEC_ID_VP8 || codec_context->codec_id == AV_CODEC_ID_VP9) {
+            switch(video_quality) {
+                case GSR_VIDEO_QUALITY_MEDIUM:
+                    av_dict_set_int(options, "qp", 35 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_HIGH:
+                    av_dict_set_int(options, "qp", 30 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_VERY_HIGH:
+                    av_dict_set_int(options, "qp", 25 * qp_multiply, 0);
+                    break;
+                case GSR_VIDEO_QUALITY_ULTRA:
+                    av_dict_set_int(options, "qp", 22 * qp_multiply, 0);
+                    break;
+            }
+        }
+    }
+}
+
+static void open_video_hardware(AVCodecContext *codec_context, bool low_power, const gsr_egl &egl, const args_parser &arg_parser) { // Opens the hardware video encoder for |codec_context| with options built from |arg_parser| and the GPU vendor; terminates the process if avcodec_open2 fails
+    const gsr_color_depth color_depth = video_codec_to_bit_depth(arg_parser.video_codec);
+    const bool hdr = video_codec_is_hdr(arg_parser.video_codec);
+    AVDictionary *options = nullptr;
+
+    if(arg_parser.bitrate_mode == GSR_BITRATE_MODE_QP) // A "qp" entry is only added in QP bitrate mode
+        video_hardware_set_qp(codec_context, arg_parser.video_quality, egl.gpu_info.vendor, hdr, &options);
+
+    video_set_rc(arg_parser.video_codec, egl.gpu_info.vendor, arg_parser.bitrate_mode, &options);
+
+    // TODO: Enable multipass
+
+    dict_set_profile(codec_context, egl.gpu_info.vendor, color_depth, arg_parser.video_codec, &options);
+
+    if(video_codec_is_vulkan(arg_parser.video_codec)) { // Vulkan codecs are handled first, whatever the GPU vendor
+        av_dict_set_int(&options, "async_depth", 3, 0);
+        av_dict_set(&options, "tune", "hq", 0);
+        av_dict_set(&options, "usage", "record", 0); // TODO: Set to stream when streaming
+        av_dict_set(&options, "content", "rendered", 0);
+    } else if(egl.gpu_info.vendor == GSR_GPU_VENDOR_NVIDIA) {
+        // TODO: These dont seem to be necessary
+        // av_dict_set_int(&options, "zerolatency", 1, 0);
+        // if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+        //     av_dict_set(&options, "tune", "ll", 0);
+        // } else if(codec_context->codec_id == AV_CODEC_ID_H264 || codec_context->codec_id == AV_CODEC_ID_HEVC) {
+        //     av_dict_set(&options, "preset", "llhq", 0);
+        //     av_dict_set(&options, "tune", "ll", 0);
+        // }
+        av_dict_set(&options, "tune", "hq", 0);
+
+        switch(arg_parser.tune) {
+            case GSR_TUNE_PERFORMANCE: // Adds no extra entries
+                //av_dict_set(&options, "multipass", "qres", 0);
+                break;
+            case GSR_TUNE_QUALITY:
+                av_dict_set(&options, "multipass", "fullres", 0);
+                av_dict_set(&options, "preset", "p6", 0);
+                av_dict_set_int(&options, "rc-lookahead", 0, 0);
+                break;
+        }
+
+        if(codec_context->codec_id == AV_CODEC_ID_H264) { // Intentionally empty apart from the TODO notes
+            // TODO: h264 10bit?
+            // TODO:
+            // switch(pixel_format) {
+            //     case GSR_PIXEL_FORMAT_YUV420:
+            //         av_dict_set_int(&options, "profile", AV_PROFILE_H264_HIGH, 0);
+            //         break;
+            //     case GSR_PIXEL_FORMAT_YUV444:
+            //         av_dict_set_int(&options, "profile", AV_PROFILE_H264_HIGH_444, 0);
+            //         break;
+            // }
+        } else if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+            switch(arg_parser.pixel_format) { // Maps the requested pixel format to the "rgb_mode" entry
+                case GSR_PIXEL_FORMAT_YUV420:
+                    av_dict_set(&options, "rgb_mode", "yuv420", 0);
+                    break;
+                case GSR_PIXEL_FORMAT_YUV444:
+                    av_dict_set(&options, "rgb_mode", "yuv444", 0);
+                    break;
+            }
+        } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+            //av_dict_set(&options, "pix_fmt", "yuv420p16le", 0);
+        }
+    } else { // Neither a Vulkan codec nor an NVIDIA GPU
+        // TODO: More quality options
+        if(low_power)
+            av_dict_set_int(&options, "low_power", 1, 0);
+        // Improves performance but increases vram.
+        // TODO: Might need a different async_depth for optimal performance on different amd/intel gpus
+        av_dict_set_int(&options, "async_depth", 3, 0);
+
+        if(codec_context->codec_id == AV_CODEC_ID_H264) {
+            // Removed because it causes stutter in games for some people
+            //av_dict_set_int(&options, "quality", 5, 0); // quality preset
+        } else if(codec_context->codec_id == AV_CODEC_ID_AV1) {
+            av_dict_set(&options, "tier", "main", 0);
+        } else if(codec_context->codec_id == AV_CODEC_ID_HEVC) {
+            if(hdr)
+                av_dict_set(&options, "sei", "hdr", 0); // Only added for HDR codecs
+        }
+
+        // TODO: vp8/vp9 10bit
     }
 
-    codec_context->hw_device_ctx = *device_ctx;
-    codec_context->hw_frames_ctx = frame_context;
+    if(codec_context->codec_id == AV_CODEC_ID_H264) { // Applies to all three paths above
+        av_dict_set(&options, "coder", "cabac", 0); // TODO: cavlc is faster than cabac but worse compression. Which to use?
+    }
+
+    av_dict_set(&options, "strict", "experimental", 0); // presumably permits encoders flagged experimental - TODO confirm
 
-    ret = avcodec_open2(codec_context, codec_context->codec, nullptr);
+    int ret = avcodec_open2(codec_context, codec_context->codec, &options); // NOTE(review): |options| is not released with av_dict_free anywhere in this function
     if (ret < 0) {
-        fprintf(stderr, "Error: Could not open video codec: %s\n",
-                "blabla"); // av_err2str(ret));
-        exit(1);
-    }
-
-    if(window_pixmap.target_texture_id != 0) {
-        CUresult res;
-        CUcontext old_ctx;
-        res = cuCtxPopCurrent(&old_ctx);
-        res = cuCtxPushCurrent(cuda_context);
-        res = cuGraphicsGLRegisterImage(
-            cuda_graphics_resource, window_pixmap.target_texture_id, GL_TEXTURE_2D,
-            CU_GRAPHICS_REGISTER_FLAGS_READ_ONLY);
-        // cuGraphicsUnregisterResource(*cuda_graphics_resource);
-        if (res != CUDA_SUCCESS) {
-            const char *err_str;
-            cuGetErrorString(res, &err_str);
-            fprintf(stderr,
-                    "Error: cuGraphicsGLRegisterImage failed, error %s, texture "
-                    "id: %u\n",
-                    err_str, window_pixmap.target_texture_id);
-            exit(1);
-        }
-        res = cuCtxPopCurrent(&old_ctx);
-    }
-}
-
-static void close_video(AVStream *video_stream, AVFrame *frame) {
-    // avcodec_close(video_stream->codec);
-    // av_frame_free(&frame);
-}
-
-static void usage() {
-    fprintf(stderr, "usage: gpu-screen-recorder -w <window_id> -c <container_format> -f <fps> [-a <audio_input>] [-q <quality>] [-r <replay_buffer_size_sec>] [-o <output_file>]\n");
-    fprintf(stderr, "OPTIONS:\n");
-    fprintf(stderr, "  -w    Window to record or a display, \"screen\" or \"screen-direct\". The display is the display name in xrandr and if \"screen\" or \"screen-direct\" is selected then all displays are recorded and they are recorded in h265 (aka hevc)."
-        "\"screen-direct\" skips one texture copy for fullscreen applications so it may lead to better performance and it works with VRR monitors when recording fullscreen application but may break some applications, such as mpv in fullscreen mode. Recording a display requires a gpu with NvFBC support.\n");
-    fprintf(stderr, "  -s    The size (area) to record at in the format WxH, for example 1920x1080. Usually you want to set this to the size of the window. Optional, by default the size of the window, monitor or screen is used (which is passed to -w).\n");
-    fprintf(stderr, "  -c    Container format for output file, for example mp4, or flv.\n");
-    fprintf(stderr, "  -f    Framerate to record at. Clamped to [1,250].\n");
-    fprintf(stderr, "  -a    Audio device to record from (pulse audio device). Optional, disabled by default.\n");
-    fprintf(stderr, "  -q    Video quality. Should either be 'medium', 'high' or 'ultra'. Optional, set to 'medium' be default.\n");
-    fprintf(stderr, "  -r    Replay buffer size in seconds. If this is set, then only the last seconds as set by this option will be stored"
-        " and the video will only be saved when the gpu-screen-recorder is closed. This feature is similar to Nvidia's instant replay feature."
-        " This option has be between 5 and 1200. Note that the replay buffer size will not always be precise, because of keyframes. Optional, disabled by default.\n");
-    fprintf(stderr, "  -o    The output file path. If omitted then the encoded data is sent to stdout. Required in replay mode (when using -r). In replay mode this has to be an existing directory instead of a file.\n");
-    fprintf(stderr, "NOTES:\n");
-    fprintf(stderr, "  Send signal SIGINT (Ctrl+C) to gpu-screen-recorder to stop and save the recording (when not using replay mode).\n");
-    fprintf(stderr, "  Send signal SIGUSR1 (killall -SIGUSR1 gpu-screen-recorder) to gpu-screen-recorder to save a replay.\n");
-    exit(1);
-}
-
-static sig_atomic_t started = 0;
+        fprintf(stderr, "gsr error: Could not open video codec: %s\n", av_error_to_string(ret));
+        _exit(1); // Terminate immediately on failure
+    }
+}
+
+static const int save_replay_seconds_full = -1; // Value that save_replay_handler stores in save_replay_seconds; presumably means "save the entire replay buffer" - TODO confirm
+
 static sig_atomic_t running = 1;
-static sig_atomic_t save_replay = 0;
-static const char *pid_file = "/tmp/gpu-screen-recorder";
+static volatile sig_atomic_t toggle_pause = 0; // Set to 1 by toggle_pause_handler. volatile because it is written from a signal handler, so reads outside the handler must not be cached
+static volatile sig_atomic_t toggle_replay_recording = 0; // Set to 1 by toggle_replay_recording_handler; volatile for the same reason
+static volatile sig_atomic_t save_replay_seconds = 0; // Set by the save_replay_*_handler functions to a number of seconds or to save_replay_seconds_full; volatile for the same reason
 
-static void term_handler(int) {
-    if(started)
-        unlink(pid_file);
-    exit(0);
+static void stop_handler(int) { // Signal handler (signal number unused): requests shutdown by clearing |running|
+    running = 0;
 }
 
-static void int_handler(int) {
-    running = 0;
+static void toggle_pause_handler(int) { // Signal handler (signal number unused): raises the |toggle_pause| flag
+    toggle_pause = 1; // presumably consumed and reset by the main loop - TODO confirm
+}
+
+static void toggle_replay_recording_handler(int) { // Signal handler (signal number unused): raises the |toggle_replay_recording| flag
+    toggle_replay_recording = 1; // presumably consumed and reset by the main loop - TODO confirm
 }
 
 static void save_replay_handler(int) {
-    save_replay = 1;
+    save_replay_seconds = save_replay_seconds_full; // Signal handler body: stores save_replay_seconds_full (-1) rather than a number of seconds
 }
 
-struct Arg {
-    const char *value;
-    bool optional;
-};
+static void save_replay_10_seconds_handler(int) { // Signal handler (signal number unused): stores 10 in |save_replay_seconds|
+    save_replay_seconds = 10;
+}
+
+static void save_replay_30_seconds_handler(int) { // Signal handler (signal number unused): stores 30 in |save_replay_seconds|
+    save_replay_seconds = 30;
+}
+
+static void save_replay_1_minute_handler(int) { // Signal handler (signal number unused): stores 60 (one minute in seconds) in |save_replay_seconds|
+    save_replay_seconds = 60;
+}
+
+static void save_replay_5_minutes_handler(int) { // Signal handler (signal number unused): stores 300 (five minutes in seconds) in |save_replay_seconds|
+    save_replay_seconds = 60*5;
+}
+
+static void save_replay_10_minutes_handler(int) { // Signal handler (signal number unused): stores 600 (ten minutes in seconds) in |save_replay_seconds|
+    save_replay_seconds = 60*10;
+}
+
+static void save_replay_30_minutes_handler(int) { // Signal handler (signal number unused): stores 1800 (thirty minutes in seconds) in |save_replay_seconds|
+    save_replay_seconds = 60*30;
+}
 
 static bool is_hex_num(char c) {
     return (c >= 'A' && c <= 'F') || (c >= 'a' && c <= 'f') || (c >= '0' && c <= '9');
 }
 
 static bool contains_non_hex_number(const char *str) {
+    bool hex_start = false; // Becomes true when |str| begins with the "0x" prefix
     size_t len = strlen(str);
     if(len >= 2 && memcmp(str, "0x", 2) == 0) {
         str += 2;
         len -= 2;
+        hex_start = true;
     }
 
+    bool is_hex = false; // Becomes true once a letter digit (A-F or a-f) has been seen
     for(size_t i = 0; i < len; ++i) {
         char c = str[i];
         if(c == '\0')
             return false;
         if(!is_hex_num(c))
             return true;
+        if((c >= 'A' && c <= 'F') || (c >= 'a' && c <= 'f')) // Digits 0-9 alone do not set the flag
+            is_hex = true;
     }
-    return false;
+
+    return is_hex && !hex_start; // All characters were hex digits: still report true when letter digits appear without a "0x" prefix
 }
 
 static std::string get_date_str() {
@@ -671,14 +1004,30 @@ static std::string get_date_str() {
     time_t now = time(NULL);
     struct tm *t = localtime(&now);
     strftime(str, sizeof(str)-1, "%Y-%m-%d_%H-%M-%S", t);
-    return str; 
+    return str;
+}
+
+static std::string get_date_only_str() { // Returns the current local date formatted as "%Y-%m-%d"
+    char str[128];
+    time_t now = time(NULL);
+    struct tm *t = localtime(&now); // NOTE(review): localtime returns a pointer to shared static storage and its result is not null-checked here
+    strftime(str, sizeof(str)-1, "%Y-%m-%d", t);
+    return str; // converted to std::string up to the first NUL byte
+}
+
+static std::string get_time_only_str() { // Returns the current local time of day formatted as "%H-%M-%S"
+    char str[128];
+    time_t now = time(NULL);
+    struct tm *t = localtime(&now); // NOTE(review): localtime returns a pointer to shared static storage and its result is not null-checked here
+    strftime(str, sizeof(str)-1, "%H-%M-%S", t);
+    return str; // converted to std::string up to the first NUL byte
 }
 
 static AVStream* create_stream(AVFormatContext *av_format_context, AVCodecContext *codec_context) {
     AVStream *stream = avformat_new_stream(av_format_context, nullptr);
     if (!stream) {
-        fprintf(stderr, "Error: Could not allocate stream\n");
-        exit(1);
+        fprintf(stderr, "gsr error: Could not allocate stream\n");
+        _exit(1);
     }
     stream->id = av_format_context->nb_streams - 1;
     stream->time_base = codec_context->time_base;
@@ -686,824 +1035,2831 @@ static AVStream* create_stream(AVFormatContext *av_format_context, AVCodecContex
     return stream;
 }
 
+static void run_recording_saved_script_async(const char *script_file, const char *video_file, const char *type) { // Runs |script_file| with arguments (video_file, type) in a double-forked child so this process does not wait for the script
+    char script_file_full[PATH_MAX];
+    script_file_full[0] = '\0';
+    if(!realpath(script_file, script_file_full)) { // resolve to an absolute path; fails when the script does not exist
+        fprintf(stderr, "gsr error: script file not found: %s\n", script_file);
+        return;
+    }
+
+    const char *args[7]; // sized for the longest (flatpak) argument list plus the NULL terminator
+    const bool inside_flatpak = getenv("FLATPAK_ID") != NULL;
+
+    if(inside_flatpak) { // FLATPAK_ID is set: launch the script through flatpak-spawn --host
+        args[0] = "flatpak-spawn";
+        args[1] = "--host";
+        args[2] = "--";
+        args[3] = script_file_full;
+        args[4] = video_file;
+        args[5] = type;
+        args[6] = NULL;
+    } else {
+        args[0] = script_file_full;
+        args[1] = video_file;
+        args[2] = type;
+        args[3] = NULL;
+    }
+
+    pid_t pid = fork();
+    if(pid == -1) {
+        perror(script_file_full);
+        return;
+    } else if(pid == 0) { // child
+        setsid();
+        signal(SIGHUP, SIG_IGN);
+
+        pid_t second_child = fork();
+        if(second_child == 0) { // child
+            execvp(args[0], (char* const*)args);
+            perror(script_file_full); // only reached when execvp failed
+            _exit(127);
+        } else { // intermediate child: exit in every case, including a failed second fork, so it never returns into the caller's code
+            _exit(second_child == -1 ? 1 : 0);
+        }
+    } else { // parent
+        waitpid(pid, NULL, 0); // reaps the intermediate child, which exits right after its own fork
+    }
+}
+
+static double audio_codec_get_desired_delay(gsr_audio_codec audio_codec, int fps) { // Returns a codec-specific delay value, clamped so it is never negative (presumably seconds -- TODO confirm with callers)
+    const double fps_inv = 1.0 / (double)fps; // 1/fps, i.e. the length of one frame when fps is frames per second
+    const double base = 0.01 + 1.0/165.0; // NOTE(review): origin of these constants is not documented in this file
+    switch(audio_codec) {
+        case GSR_AUDIO_CODEC_OPUS:
+            return std::max(0.0, base - fps_inv);
+        case GSR_AUDIO_CODEC_AAC:
+            return std::max(0.0, (base + 0.008) * 2.0 - fps_inv);
+        case GSR_AUDIO_CODEC_FLAC:
+            // TODO: Test
+            return std::max(0.0, base - fps_inv);
+    }
+    assert(false); // every codec listed in the switch returns above
+    return std::max(0.0, base - fps_inv); // fallback used when asserts are compiled out
+}
+
+struct AudioDeviceData { // One audio source of an AudioTrack (stored in AudioTrack::audio_devices)
+    SoundDevice sound_device;
+    AudioInput audio_input;
+    AVFilterContext *src_filter_ctx = nullptr; // presumably one of the abuffer sources created by init_filter_graph -- TODO confirm
+    AVFrame *frame = nullptr;
+    std::thread thread; // TODO: Instead of having a thread for each track, have one thread for all threads and read the data with non-blocking read
+};
+
+// TODO: Cleanup
+struct AudioTrack { // One output audio track together with the sources feeding it
+    std::string name; // written as the stream "title" metadata by start_recording_create_streams when not empty
+    AVCodecContext *codec_context = nullptr; // codec parameters and time base are taken from this when streams are created
+
+    std::vector<AudioDeviceData> audio_devices;
+    AVFilterGraph *graph = nullptr;
+    AVFilterContext *sink = nullptr;
+    int stream_index = 0;
+    int64_t pts = 0;
+};
+
+static bool add_hdr_metadata_to_video_stream(gsr_capture *cap, AVStream *video_stream) { // Attaches content-light and mastering-display side data to |video_stream|; false only when allocation or gsr_capture_set_hdr_metadata fails
+    size_t light_metadata_size = 0;
+    size_t mastering_display_metadata_size = 0;
+    AVContentLightMetadata *light_metadata = av_content_light_metadata_alloc(&light_metadata_size);
+    #if LIBAVUTIL_VERSION_INT < AV_VERSION_INT(59, 37, 100)
+    AVMasteringDisplayMetadata *mastering_display_metadata = av_mastering_display_metadata_alloc();
+    mastering_display_metadata_size = sizeof(*mastering_display_metadata); // this allocator variant does not report the size itself
+    #else
+    AVMasteringDisplayMetadata *mastering_display_metadata = av_mastering_display_metadata_alloc_size(&mastering_display_metadata_size);
+    #endif
+
+    if(!light_metadata || !mastering_display_metadata) { // one allocation failed: release whichever one succeeded
+        if(light_metadata)
+            av_freep(&light_metadata);
+
+        if(mastering_display_metadata)
+            av_freep(&mastering_display_metadata);
+
+        return false;
+    }
+
+    if(!gsr_capture_set_hdr_metadata(cap, mastering_display_metadata, light_metadata)) { // the capture backend fills in both structures
+        av_freep(&light_metadata);
+        av_freep(&mastering_display_metadata);
+        return false;
+    }
+
+    // TODO: More error checking
+
+    #if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(60, 31, 102)
+    const bool content_light_level_added = av_stream_add_side_data(video_stream, AV_PKT_DATA_CONTENT_LIGHT_LEVEL, (uint8_t*)light_metadata, light_metadata_size) == 0;
+    #else
+    const bool content_light_level_added = av_packet_side_data_add(&video_stream->codecpar->coded_side_data, &video_stream->codecpar->nb_coded_side_data, AV_PKT_DATA_CONTENT_LIGHT_LEVEL, light_metadata, light_metadata_size, 0) != NULL;
+    #endif
+
+    #if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(60, 31, 102)
+    const bool mastering_display_metadata_added = av_stream_add_side_data(video_stream, AV_PKT_DATA_MASTERING_DISPLAY_METADATA, (uint8_t*)mastering_display_metadata, mastering_display_metadata_size) == 0;
+    #else
+    const bool mastering_display_metadata_added = av_packet_side_data_add(&video_stream->codecpar->coded_side_data, &video_stream->codecpar->nb_coded_side_data, AV_PKT_DATA_MASTERING_DISPLAY_METADATA, mastering_display_metadata, mastering_display_metadata_size, 0) != NULL;
+    #endif
+
+    if(!content_light_level_added) // the buffer is freed here only when it was not attached to the stream
+        av_freep(&light_metadata);
+
+    if(!mastering_display_metadata_added) // same rule for the mastering display buffer
+        av_freep(&mastering_display_metadata);
+
+    // Return true even on failure because we dont want to retry adding hdr metadata on failure
+    return true;
+}
+
+struct RecordingStartAudio { // Pairs an audio track with the output stream created for it in start_recording_create_streams
+    const AudioTrack *audio_track; // points into the caller's track list; not owned
+    AVStream *stream; // stream created in the output format context for this track
+};
+
+struct RecordingStartResult { // Result of start_recording_create_streams
+    AVFormatContext *av_format_context = nullptr; // stays nullptr when opening the output or writing the header failed
+    AVStream *video_stream = nullptr; // set together with av_format_context on success
+    std::vector<RecordingStartAudio> audio_inputs; // one entry per audio track, filled before the output file is opened
+};
+
+static RecordingStartResult start_recording_create_streams(const char *filename, const char *container_format, AVCodecContext *video_codec_context, const std::vector<AudioTrack> &audio_tracks, bool hdr, gsr_capture *capture) { // Creates the muxer, one video stream plus one stream per audio track, opens |filename| and writes the header
+    RecordingStartResult result; // av_format_context stays nullptr on every failure path; audio_inputs must not be used in that case
+    AVFormatContext *av_format_context = nullptr;
+    const int alloc_ret = avformat_alloc_output_context2(&av_format_context, nullptr, container_format, filename);
+    if(alloc_ret < 0 || !av_format_context) { // previously unchecked: create_stream would have dereferenced a null context
+        fprintf(stderr, "gsr error: start: could not create output context for '%s': %s\n", filename, av_error_to_string(alloc_ret));
+        return result;
+    }
+
+    AVStream *video_stream = create_stream(av_format_context, video_codec_context);
+    avcodec_parameters_from_context(video_stream->codecpar, video_codec_context);
+    result.audio_inputs.reserve(audio_tracks.size());
+    for(const AudioTrack &audio_track : audio_tracks) {
+        AVStream *audio_stream = create_stream(av_format_context, audio_track.codec_context);
+        if(!audio_track.name.empty())
+            av_dict_set(&audio_stream->metadata, "title", audio_track.name.c_str(), 0);
+        avcodec_parameters_from_context(audio_stream->codecpar, audio_track.codec_context);
+        result.audio_inputs.push_back({&audio_track, audio_stream});
+    }
+
+    const int open_ret = avio_open(&av_format_context->pb, filename, AVIO_FLAG_WRITE);
+    if(open_ret < 0) {
+        fprintf(stderr, "gsr error: start: could not open '%s': %s\n", filename, av_error_to_string(open_ret));
+        avformat_free_context(av_format_context); // previously leaked on this path
+        return result;
+    }
+
+    AVDictionary *options = nullptr;
+    av_dict_set(&options, "strict", "experimental", 0);
+    const int header_write_ret = avformat_write_header(av_format_context, &options);
+    av_dict_free(&options);
+    if(header_write_ret < 0) {
+        fprintf(stderr, "gsr error: start: error occurred when writing header to output file: %s\n", av_error_to_string(header_write_ret));
+        avio_close(av_format_context->pb);
+        avformat_free_context(av_format_context);
+        return result;
+    }
+
+    if(hdr)
+        add_hdr_metadata_to_video_stream(capture, video_stream);
+    result.av_format_context = av_format_context; // success: ownership of the context passes to the caller
+    result.video_stream = video_stream;
+    return result;
+}
+
+static bool stop_recording_close_streams(AVFormatContext *av_format_context) { // Writes the trailer, closes the output and frees the context; true only when both the trailer write and the close succeeded
+    bool trailer_written = true;
+    if(av_write_trailer(av_format_context) != 0) {
+        fprintf(stderr, "gsr error: end: failed to write trailer\n");
+        trailer_written = false; // keep going so the file is still closed and the context freed
+    }
+
+    const bool closed = avio_close(av_format_context->pb) == 0;
+    avformat_free_context(av_format_context); // |av_format_context| must not be used by the caller after this call
+    return trailer_written && closed;
+}
+
 static std::future<void> save_replay_thread;
-static std::vector<AVPacket> save_replay_packets;
 static std::string save_replay_output_filepath;
 
-static void save_replay_async(AVCodecContext *video_codec_context, AVCodecContext *audio_codec_context, int video_stream_index, int audio_stream_index, const std::deque<AVPacket> &frame_data_queue, bool frames_erased, std::string output_dir, std::string container_format) {
+static std::string create_new_recording_filepath_from_timestamp(std::string directory, const char *filename_prefix, const std::string &file_extension, bool date_folders) { // Builds "<dir>/<prefix>_<timestamp>.<ext>" and creates the target directory
+    std::string output_filepath;
+    if(date_folders) { // layout: <directory>/<date>/<prefix>_<time>.<ext>
+        std::string output_folder = directory + '/' + get_date_only_str();
+        if(create_directory_recursive(&output_folder[0]) != 0) // a failure is only logged; the path is still returned
+            fprintf(stderr, "gsr error: failed to create directory: %s\n", output_folder.c_str());
+        output_filepath = output_folder + "/" + filename_prefix + "_" + get_time_only_str() + "." + file_extension;
+    } else { // layout: <directory>/<prefix>_<date>_<time>.<ext>
+        if(create_directory_recursive(&directory[0]) != 0) // a failure is only logged; the path is still returned
+            fprintf(stderr, "gsr error: failed to create directory: %s\n", directory.c_str());
+        output_filepath = directory + "/" + filename_prefix + "_" + get_date_str() + "." + file_extension;
+    }
+    return output_filepath;
+}
+
+static RecordingStartAudio* get_recording_start_item_by_stream_index(RecordingStartResult &result, int stream_index) { // Linear search for the audio entry whose stream has index |stream_index|
+    for(auto &audio_input : result.audio_inputs) {
+        if(audio_input.stream->index == stream_index)
+            return &audio_input; // points into result.audio_inputs
+    }
+    return nullptr; // no audio stream has that index
+}
+
+static void save_replay_async(AVCodecContext *video_codec_context, int video_stream_index, const std::vector<AudioTrack> &audio_tracks, gsr_replay_buffer *replay_buffer, std::string output_dir, const char *container_format, const std::string &file_extension, bool date_folders, bool hdr, gsr_capture *capture, int current_save_replay_seconds) { // Clones the replay buffer and writes it to a new "Replay" file on a worker task; does nothing while a previous save is pending
     if(save_replay_thread.valid())
         return;
-    
-    size_t start_index = (size_t)-1;
-    for(size_t i = 0; i < frame_data_queue.size(); ++i) {
-        const AVPacket &av_packet = frame_data_queue[i];
-        if((av_packet.flags & AV_PKT_FLAG_KEY) && av_packet.stream_index == video_stream_index) {
-            start_index = i;
-            break;
-        }
-    }
 
-    if(start_index == (size_t)-1)
+    const gsr_replay_buffer_iterator search_start_iterator = current_save_replay_seconds == save_replay_seconds_full ? gsr_replay_buffer_iterator{0, 0} : gsr_replay_buffer_find_packet_index_by_time_passed(replay_buffer, current_save_replay_seconds);
+    const gsr_replay_buffer_iterator video_start_iterator = gsr_replay_buffer_find_keyframe(replay_buffer, search_start_iterator, video_stream_index, false);
+    if(video_start_iterator.packet_index == (size_t)-1) { // (size_t)-1 marks "not found"
+        fprintf(stderr, "gsr error: failed to save replay: failed to find a video keyframe. perhaps replay was saved too fast, before anything has been recorded\n");
         return;
+    }
 
-    int64_t pts_offset = 0;
-    if(frames_erased)
-        pts_offset = frame_data_queue[start_index].pts;
+    const gsr_replay_buffer_iterator audio_start_iterator = gsr_replay_buffer_find_keyframe(replay_buffer, video_start_iterator, video_stream_index, true);
+    // if(audio_start_index == (size_t)-1) {
+    //     fprintf(stderr, "gsr error: failed to save replay: failed to find an audio keyframe. perhaps replay was saved too fast, before anything has been recorded\n");
+    //     return;
+    // }
 
-    save_replay_packets.resize(frame_data_queue.size());
-    for(size_t i = 0; i < frame_data_queue.size(); ++i) {
-        av_packet_ref(&save_replay_packets[i], &frame_data_queue[i]);
+    const int64_t video_pts_offset = gsr_replay_buffer_iterator_get_packet(replay_buffer, video_start_iterator)->pts; // subtracted from every video packet below
+    const int64_t audio_pts_offset = audio_start_iterator.packet_index == (size_t)-1 ? 0 : gsr_replay_buffer_iterator_get_packet(replay_buffer, audio_start_iterator)->pts; // 0 when no audio start packet was found
+
+    gsr_replay_buffer *cloned_replay_buffer = gsr_replay_buffer_clone(replay_buffer); // the worker reads from this clone, not from |replay_buffer|
+    if(!cloned_replay_buffer) {
+        // TODO: Return this error to mark the replay as failed
+        fprintf(stderr, "gsr error: failed to save replay: failed to clone replay buffer\n");
+        return;
     }
 
-    save_replay_output_filepath = output_dir + "/Replay_" + get_date_str() + "." + container_format;
-    save_replay_thread = std::async(std::launch::async, [video_stream_index, container_format, start_index, pts_offset, video_codec_context, audio_codec_context]() mutable {
-        AVFormatContext *av_format_context;
-        // The output format is automatically guessed from the file extension
-        avformat_alloc_output_context2(&av_format_context, nullptr, container_format.c_str(), nullptr);
+    std::string output_filepath = create_new_recording_filepath_from_timestamp(output_dir, "Replay", file_extension, date_folders);
+    RecordingStartResult recording_start_result = start_recording_create_streams(output_filepath.c_str(), container_format, video_codec_context, audio_tracks, hdr, capture);
+    if(!recording_start_result.av_format_context) {
+        gsr_replay_buffer_destroy(cloned_replay_buffer); // previously leaked: no worker exists yet to release the clone
+        return;
+    }
 
-        av_format_context->flags |= AVFMT_FLAG_GENPTS;
-        if (av_format_context->oformat->flags & AVFMT_GLOBALHEADER)
-            av_format_context->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
+    save_replay_output_filepath = std::move(output_filepath);
 
-        AVStream *video_stream = create_stream(av_format_context, video_codec_context);
-        AVStream *audio_stream = audio_codec_context ? create_stream(av_format_context, audio_codec_context) : nullptr;
+    save_replay_thread = std::async(std::launch::async, [video_stream_index, recording_start_result, video_start_iterator, video_pts_offset, audio_pts_offset, video_codec_context, cloned_replay_buffer]() mutable {
+        gsr_replay_buffer_iterator replay_iterator = video_start_iterator;
+        for(bool has_packet = true; has_packet; has_packet = gsr_replay_buffer_iterator_next(cloned_replay_buffer, &replay_iterator)) { // advancing in the loop header means `continue` also moves to the next packet
+            AVPacket *replay_packet = gsr_replay_buffer_iterator_get_packet(cloned_replay_buffer, replay_iterator);
+            uint8_t *replay_packet_data = NULL;
+            if(replay_packet)
+                replay_packet_data = gsr_replay_buffer_iterator_get_packet_data(cloned_replay_buffer, replay_iterator); // released with free() below
 
-        avcodec_parameters_from_context(video_stream->codecpar, video_codec_context);
-        if(audio_stream)
-            avcodec_parameters_from_context(audio_stream->codecpar, audio_codec_context);
+            if(!replay_packet) {
+                fprintf(stderr, "gsr error: save_replay_async: no replay packet\n");
+                break;
+            }
 
-        int ret = avio_open(&av_format_context->pb, save_replay_output_filepath.c_str(), AVIO_FLAG_WRITE);
-        if (ret < 0) {
-            fprintf(stderr, "Error: Could not open '%s': %s. Make sure %s is an existing directory with write access\n", save_replay_output_filepath.c_str(), av_error_to_string(ret), save_replay_output_filepath.c_str());
-            return;
-        }
+            if(!replay_packet->data && !replay_packet_data) {
+                fprintf(stderr, "gsr error: save_replay_async: no replay packet data\n");
+                break;
+            }
 
-        ret = avformat_write_header(av_format_context, nullptr);
-        if (ret < 0) {
-            fprintf(stderr, "Error occurred when writing header to output file: %s\n", av_error_to_string(ret));
-            return;
-        }
+            // TODO: Check if successful
+            AVPacket av_packet; // shallow packet that borrows the buffer data; only the fields set below are used
+            memset(&av_packet, 0, sizeof(av_packet));
+            //av_packet_from_data(av_packet, replay_packet->data, replay_packet->size);
+            av_packet.data = replay_packet->data ? replay_packet->data : replay_packet_data;
+            av_packet.size = replay_packet->size;
+            av_packet.stream_index = replay_packet->stream_index;
+            av_packet.pts = replay_packet->pts;
+            av_packet.dts = replay_packet->pts;
+            av_packet.flags = replay_packet->flags;
+            //av_packet.duration = replay_packet->duration;
+
+            AVStream *stream = recording_start_result.video_stream;
+            AVCodecContext *codec_context = video_codec_context;
+
+            if(av_packet.stream_index == video_stream_index) {
+                av_packet.pts -= video_pts_offset;
+                av_packet.dts -= video_pts_offset;
+            } else {
+                RecordingStartAudio *recording_start_audio = get_recording_start_item_by_stream_index(recording_start_result, av_packet.stream_index);
+                if(!recording_start_audio) {
+                    fprintf(stderr, "gsr error: save_replay_async: failed to find audio stream by index: %d\n", av_packet.stream_index);
+                    free(replay_packet_data);
+                    continue; // skip this packet; the loop header advances the iterator (the old for(;;) retried the same packet forever)
+                }
 
-        for(size_t i = start_index; i < save_replay_packets.size(); ++i) {
-            AVPacket &av_packet = save_replay_packets[i];
+                const AudioTrack *audio_track = recording_start_audio->audio_track;
+                stream = recording_start_audio->stream;
+                codec_context = audio_track->codec_context;
 
-            AVStream *stream = av_packet.stream_index == video_stream_index ? video_stream : audio_stream;
-            AVCodecContext *codec_context = av_packet.stream_index == video_stream_index ? video_codec_context : audio_codec_context;
+                av_packet.pts -= audio_pts_offset;
+                av_packet.dts -= audio_pts_offset;
+            }
 
-            av_packet.stream_index = stream->index;
-            av_packet.pts -= pts_offset;
-            av_packet.dts -= pts_offset;
+            //av_packet.stream_index = stream->index;
             av_packet_rescale_ts(&av_packet, codec_context->time_base, stream->time_base);
 
-            int ret = av_interleaved_write_frame(av_format_context, &av_packet);
+            const int ret = av_write_frame(recording_start_result.av_format_context, &av_packet);
             if(ret < 0)
-                fprintf(stderr, "Error: Failed to write frame index %d to muxer, reason: %s (%d)\n", stream->index, av_error_to_string(ret), ret);
+                fprintf(stderr, "gsr error: Failed to write frame index %d to muxer, reason: %s (%d)\n", av_packet.stream_index, av_error_to_string(ret), ret);
+
+            free(replay_packet_data);
+
+            //av_packet_free(&av_packet);
         }
 
-        if (av_write_trailer(av_format_context) != 0)
-            fprintf(stderr, "Failed to write trailer\n");
+        stop_recording_close_streams(recording_start_result.av_format_context);
+        gsr_replay_buffer_destroy(cloned_replay_buffer); // the worker releases the clone once writing is done
+    });
+}
 
-        avio_close(av_format_context->pb);
-        avformat_free_context(av_format_context);
+static void split_string(const std::string &str, char delimiter, std::function<bool(const char*,size_t)> callback) { // Calls |callback|(ptr, length) for each |delimiter|-separated piece of |str|; stops early when it returns false
+    size_t index = 0;
+    while(index < str.size()) { // an empty string produces no callback at all
+        size_t end_index = str.find(delimiter, index);
+        if(end_index == std::string::npos) // last piece: runs to the end of the string
+            end_index = str.size();
+
+        if(!callback(&str[index], end_index - index)) // the piece is not NUL-terminated at its length; it may also be empty
+            break;
+
+        index = end_index + 1; // continue after the delimiter
+    }
+}
+
+static bool string_starts_with(const std::string &str, const char *substr) { // True when |str| begins with the NUL-terminated |substr| (byte-wise comparison)
+    int len = strlen(substr);
+    return (int)str.size() >= len && memcmp(str.data(), substr, len) == 0;
+}
+
+static bool string_ends_with(const char *str, const char *substr) { // True when |str| ends with |substr|; both must be NUL-terminated (byte-wise comparison)
+    int str_len = strlen(str);
+    int substr_len = strlen(substr);
+    return str_len >= substr_len && memcmp(str + str_len - substr_len, substr, substr_len) == 0; // compare the last substr_len bytes
+}
+
+static const AudioDevice* get_audio_device_by_name(const std::vector<AudioDevice> &audio_devices, const char *name) { // Linear search for the first device whose name equals |name| exactly
+    for(const auto &audio_device : audio_devices) {
+        if(strcmp(audio_device.name.c_str(), name) == 0)
+            return &audio_device; // points into |audio_devices|
+    }
+    return nullptr; // no device with that name
+}
+
+static MergedAudioInputs parse_audio_input_arg(const char *str) { // Splits |str| on '|' and turns each piece into an AudioInput, using the "app:", "app-inverse:" and "device:" prefixes to pick the type
+    MergedAudioInputs result;
+
+    split_string(str, '|', [&](const char *sub, size_t size) {
+        AudioInput audio_input;
+        audio_input.name.assign(sub, size);
+
+        if(string_starts_with(audio_input.name, "app:")) { // pass the string itself: going through c_str() built a temporary std::string per check
+            audio_input.name.erase(audio_input.name.begin(), audio_input.name.begin() + 4); // drop the "app:" prefix
+            audio_input.type = AudioInputType::APPLICATION;
+            audio_input.inverted = false;
+            result.audio_inputs.push_back(std::move(audio_input));
+            return true;
+        } else if(string_starts_with(audio_input.name, "app-inverse:")) {
+            audio_input.name.erase(audio_input.name.begin(), audio_input.name.begin() + 12); // drop the "app-inverse:" prefix
+            audio_input.type = AudioInputType::APPLICATION;
+            audio_input.inverted = true;
+            result.audio_inputs.push_back(std::move(audio_input));
+            return true;
+        } else if(string_starts_with(audio_input.name, "device:")) {
+            audio_input.name.erase(audio_input.name.begin(), audio_input.name.begin() + 7); // drop the "device:" prefix
+            audio_input.type = AudioInputType::DEVICE;
+            result.audio_inputs.push_back(std::move(audio_input));
+            return true;
+        } else { // no recognized prefix: the whole piece is used as a device name
+            audio_input.type = AudioInputType::DEVICE;
+            result.audio_inputs.push_back(std::move(audio_input));
+            return true;
+        }
     });
+
+    return result;
 }
 
-static bool is_process_running_program(pid_t pid, const char *program_name) {
-    char filepath[256];
-    snprintf(filepath, sizeof(filepath), "/proc/%ld/exe", (long)pid);
+static int init_filter_graph(AVCodecContext* audio_codec_context, AVFilterGraph** graph, AVFilterContext** sink, std::vector<AVFilterContext*>& src_filter_ctx, size_t num_sources) { // Builds |num_sources| abuffer sources -> amix -> abuffersink; returns 0 on success or a negative AVERROR code
+    char ch_layout[64];
+    int err = 0;
+    ch_layout[0] = '\0';
+
+    // C89-style variable declaration to
+    // avoid problems because of goto
+    AVFilterGraph* filter_graph = nullptr;
+    AVFilterContext* mix_ctx = nullptr;
+
+    const AVFilter* mix_filter = nullptr;
+    const AVFilter* abuffersink = nullptr;
+    AVFilterContext* abuffersink_ctx = nullptr;
+    char args[512] = { 0 };
+#if LIBAVFILTER_VERSION_INT >= AV_VERSION_INT(7, 107, 100)
+    bool normalize = false; // passed to amix as normalize=false below
+#endif
 
-    char resolved_path[PATH_MAX];
-    const ssize_t resolved_path_len = readlink(filepath, resolved_path, sizeof(resolved_path) - 1);
-    if(resolved_path_len == -1)
-        return false;
-    
-    resolved_path[resolved_path_len] = '\0';
+    filter_graph = avfilter_graph_alloc();
+    if (!filter_graph) {
+        fprintf(stderr, "Unable to create filter graph.\n");
+        err = AVERROR(ENOMEM);
+        goto fail;
+    }
 
-    const int program_name_len = strlen(program_name);
-    return resolved_path_len >= program_name_len && memcmp(resolved_path + resolved_path_len - program_name_len, program_name, program_name_len) == 0;
+    for(size_t i = 0; i < num_sources; ++i) { // one abuffer source per input, all configured from |audio_codec_context|
+        const AVFilter *abuffer = avfilter_get_by_name("abuffer");
+        if (!abuffer) {
+            fprintf(stderr, "Could not find the abuffer filter.\n");
+            err = AVERROR_FILTER_NOT_FOUND;
+            goto fail;
+        }
+
+        AVFilterContext *abuffer_ctx = avfilter_graph_alloc_filter(filter_graph, abuffer, NULL);
+        if (!abuffer_ctx) {
+            fprintf(stderr, "Could not allocate the abuffer instance.\n");
+            err = AVERROR(ENOMEM);
+            goto fail;
+        }
+
+        #if LIBAVCODEC_VERSION_MAJOR < 60
+        av_get_channel_layout_string(ch_layout, sizeof(ch_layout), 0, AV_CH_LAYOUT_STEREO);
+        #else
+        av_channel_layout_describe(&audio_codec_context->ch_layout, ch_layout, sizeof(ch_layout));
+        #endif
+        av_opt_set    (abuffer_ctx, "channel_layout", ch_layout,                                               AV_OPT_SEARCH_CHILDREN);
+        av_opt_set    (abuffer_ctx, "sample_fmt",     av_get_sample_fmt_name(audio_codec_context->sample_fmt), AV_OPT_SEARCH_CHILDREN);
+        av_opt_set_q  (abuffer_ctx, "time_base",      audio_codec_context->time_base,                          AV_OPT_SEARCH_CHILDREN);
+        av_opt_set_int(abuffer_ctx, "sample_rate",    audio_codec_context->sample_rate,                        AV_OPT_SEARCH_CHILDREN);
+        av_opt_set_int(abuffer_ctx, "bit_rate",       audio_codec_context->bit_rate,                           AV_OPT_SEARCH_CHILDREN);
+
+        err = avfilter_init_str(abuffer_ctx, NULL); // the return values of the av_opt_set* calls above are not checked
+        if (err < 0) {
+            fprintf(stderr, "Could not initialize the abuffer filter.\n");
+            goto fail;
+        }
+
+        src_filter_ctx.push_back(abuffer_ctx); // appended to the caller's vector in source order
+    }
+
+    mix_filter = avfilter_get_by_name("amix");
+    if (!mix_filter) {
+        av_log(NULL, AV_LOG_ERROR, "Could not find the mix filter.\n");
+        err = AVERROR_FILTER_NOT_FOUND;
+        goto fail;
+    }
+
+#if LIBAVFILTER_VERSION_INT >= AV_VERSION_INT(7, 107, 100)
+    snprintf(args, sizeof(args), "inputs=%d:normalize=%s", (int)num_sources, normalize ? "true" : "false");
+#else
+    snprintf(args, sizeof(args), "inputs=%d", (int)num_sources);
+    fprintf(stderr, "gsr warning: your ffmpeg version doesn't support disabling normalizing of mixed audio. Volume might be lower than expected\n");
+#endif
+
+    err = avfilter_graph_create_filter(&mix_ctx, mix_filter, "amix", args, NULL, filter_graph);
+    if (err < 0) {
+        av_log(NULL, AV_LOG_ERROR, "Cannot create audio amix filter\n");
+        goto fail;
+    }
+
+    abuffersink = avfilter_get_by_name("abuffersink");
+    if (!abuffersink) {
+        fprintf(stderr, "Could not find the abuffersink filter.\n");
+        err = AVERROR_FILTER_NOT_FOUND;
+        goto fail;
+    }
+
+    abuffersink_ctx = avfilter_graph_alloc_filter(filter_graph, abuffersink, "sink");
+    if (!abuffersink_ctx) {
+        fprintf(stderr, "Could not allocate the abuffersink instance.\n");
+        err = AVERROR(ENOMEM);
+        goto fail;
+    }
+
+    err = avfilter_init_str(abuffersink_ctx, NULL);
+    if (err < 0) {
+        fprintf(stderr, "Could not initialize the abuffersink instance.\n");
+        goto fail;
+    }
+
+    err = 0;
+    for(size_t i = 0; i < src_filter_ctx.size(); ++i) { // links every entry of the caller's vector to amix input pad i; stops linking after the first error
+        AVFilterContext *src_ctx = src_filter_ctx[i];
+        if (err >= 0)
+            err = avfilter_link(src_ctx, 0, mix_ctx, i);
+    }
+    if (err >= 0)
+        err = avfilter_link(mix_ctx, 0, abuffersink_ctx, 0);
+    if (err < 0) {
+        av_log(NULL, AV_LOG_ERROR, "Error connecting filters\n");
+        goto fail;
+    }
+
+    err = avfilter_graph_config(filter_graph, NULL);
+    if (err < 0) {
+        av_log(NULL, AV_LOG_ERROR, "Error configuring the filter graph\n");
+        goto fail;
+    }
+
+    *graph = filter_graph; // outputs are written only on success
+    *sink = abuffersink_ctx;
+
+    return 0;
+
+fail:
+    avfilter_graph_free(&filter_graph); // accepts a graph that was never allocated (filter_graph is still nullptr then)
+    src_filter_ctx.clear();  // possibly unnecessary?
+    return err;
 }
 
-static void handle_existing_pid_file() {
-    char buffer[256];
-    int fd = open(pid_file, O_RDONLY);
-    if(fd == -1)
-        return;
+static gsr_video_encoder* create_video_encoder(gsr_egl *egl, const args_parser &arg_parser) { // Picks the encoder backend: software first, then vulkan, otherwise by GPU vendor
+    const gsr_color_depth color_depth = video_codec_to_bit_depth(arg_parser.video_codec);
+    gsr_video_encoder *video_encoder = nullptr; // stays nullptr when no vendor case below matches
 
-    ssize_t bytes_read = read(fd, buffer, sizeof(buffer) - 1);
-    if(bytes_read < 0) {
-        perror("failed to read gpu-screen-recorder pid file");
-        exit(1);
+    if(arg_parser.video_encoder == GSR_VIDEO_ENCODER_HW_CPU) { // software encoder requested
+        gsr_video_encoder_software_params params;
+        params.egl = egl;
+        params.color_depth = color_depth;
+        video_encoder = gsr_video_encoder_software_create(&params);
+        return video_encoder;
     }
-    buffer[bytes_read] = '\0';
-    close(fd);
 
-    long pid = 0;
-    if(sscanf(buffer, "%ld %120s", &pid, buffer) == 2) {
-        if(is_process_running_program(pid, "gpu-screen-recorder")) {
-            fprintf(stderr, "Error: gpu-screen-recorder is already running\n");
-            exit(1);
+    if(video_codec_is_vulkan(arg_parser.video_codec)) { // vulkan codecs use the vulkan encoder regardless of vendor
+        gsr_video_encoder_vulkan_params params;
+        params.egl = egl;
+        params.color_depth = color_depth;
+        video_encoder = gsr_video_encoder_vulkan_create(&params);
+        return video_encoder;
+    }
+
+    switch(egl->gpu_info.vendor) {
+        case GSR_GPU_VENDOR_AMD:
+        case GSR_GPU_VENDOR_INTEL:
+        case GSR_GPU_VENDOR_BROADCOM: { // these three vendors share the vaapi encoder
+            gsr_video_encoder_vaapi_params params;
+            params.egl = egl;
+            params.color_depth = color_depth;
+            video_encoder = gsr_video_encoder_vaapi_create(&params);
+            break;
         }
+        case GSR_GPU_VENDOR_NVIDIA: {
+            gsr_video_encoder_nvenc_params params;
+            params.egl = egl;
+            params.overclock = arg_parser.overclock; // only the nvenc parameters carry the overclock setting
+            params.color_depth = color_depth;
+            video_encoder = gsr_video_encoder_nvenc_create(&params);
+            break;
+        }
+    }
+
+    return video_encoder;
+}
+
+static bool get_supported_video_codecs(gsr_egl *egl, gsr_video_codec video_codec, bool use_software_video_encoder, bool cleanup, gsr_supported_video_codecs *video_codecs) { // Fills |video_codecs| from the backend that matches the encoder choice; false when the query fails or the vendor is unknown
+    memset(video_codecs, 0, sizeof(*video_codecs)); // start with every field zeroed
+
+    if(use_software_video_encoder) { // the software path reports h264 as the only supported codec
+        video_codecs->h264.supported = true;
+        return true;
+    }
+
+    if(video_codec_is_vulkan(video_codec))
+        return gsr_get_supported_video_codecs_vulkan(video_codecs, egl->card_path, cleanup);
+
+    switch(egl->gpu_info.vendor) {
+        case GSR_GPU_VENDOR_AMD:
+        case GSR_GPU_VENDOR_INTEL:
+        case GSR_GPU_VENDOR_BROADCOM:
+            return gsr_get_supported_video_codecs_vaapi(video_codecs, egl->card_path, cleanup);
+        case GSR_GPU_VENDOR_NVIDIA:
+            return gsr_get_supported_video_codecs_nvenc(video_codecs, cleanup);
+    }
+
+    return false; // vendor not covered by the switch
+}
+
+static void xwayland_check_callback(const gsr_monitor *monitor, void *userdata) { // Monitor callback: sets the bool behind |userdata| when the monitor name looks like an Xwayland output
+    bool *xwayland_found = (bool*)userdata; // the caller passes the address of a bool
+    if(monitor->name_len >= 8 && strncmp(monitor->name, "XWAYLAND", 8) == 0) // name starts with "XWAYLAND"
+        *xwayland_found = true;
+    else if(memmem(monitor->name, monitor->name_len, "X11", 3)) // name contains "X11" anywhere
+        *xwayland_found = true;
+}
+
+static bool is_xwayland(Display *display) { // True when the X server has the "XWAYLAND" extension or an active monitor name matches xwayland_check_callback
+    int opcode, event, error; // required outputs of XQueryExtension; not used afterwards
+    if(XQueryExtension(display, "XWAYLAND", &opcode, &event, &error))
+        return true;
+
+    bool xwayland_found = false; // fallback: inspect the monitor output names
+    for_each_active_monitor_output_x11_not_cached(display, xwayland_check_callback, &xwayland_found);
+    return xwayland_found;
+}
+
+static bool is_using_prime_run() { // True when __NV_PRIME_RENDER_OFFLOAD equals "1" or DRI_PRIME is set
+    const char *prime_render_offload = getenv("__NV_PRIME_RENDER_OFFLOAD");
+    return (prime_render_offload && strcmp(prime_render_offload, "1") == 0) || getenv("DRI_PRIME"); // DRI_PRIME only has to exist; its value is not inspected
+}
+
+static void disable_prime_run() { // Removes the variables listed below from this process' environment
+    unsetenv("__NV_PRIME_RENDER_OFFLOAD"); // Checked by is_using_prime_run()
+    unsetenv("__NV_PRIME_RENDER_OFFLOAD_PROVIDER");
+    unsetenv("__GLX_VENDOR_LIBRARY_NAME");
+    unsetenv("__VK_LAYER_NV_optimus");
+    unsetenv("DRI_PRIME"); // Checked by is_using_prime_run()
+}
+
+static gsr_window* gsr_window_create(Display *display, bool wayland) { // Creates the wayland window backend when |wayland| is true, otherwise the X11 backend on |display|; callers in this file treat a null result as failure
+    if(wayland)
+        return gsr_window_wayland_create(); // |display| is not used on this path
+    else
+        return gsr_window_x11_create(display);
+}
+
+static void list_system_info(bool wayland) { // Prints the display_server and supports_app_audio lines to stdout
+    printf("display_server|%s\n", wayland ? "wayland" : "x11");
+    bool supports_app_audio = false; // Stays false when built without GSR_APP_AUDIO
+#ifdef GSR_APP_AUDIO
+    supports_app_audio = pulseaudio_server_is_pipewire();
+    if(supports_app_audio) { // Additionally require that a pipewire audio instance can be initialized
+        gsr_pipewire_audio audio;
+        if(gsr_pipewire_audio_init(&audio))
+            gsr_pipewire_audio_deinit(&audio); // The init was only a probe; release it right away
+        else
+            supports_app_audio = false;
+    }
+#endif
+    printf("supports_app_audio|%s\n", supports_app_audio ? "yes" : "no");
+}
+
+static void list_gpu_info(gsr_egl *egl) { // Prints the vendor and card_path lines for the GPU described by |egl|
+    switch(egl->gpu_info.vendor) { // No vendor line is printed for a value without a case
+        case GSR_GPU_VENDOR_AMD:
+            printf("vendor|amd\n");
+            break;
+        case GSR_GPU_VENDOR_INTEL:
+            printf("vendor|intel\n");
+            break;
+        case GSR_GPU_VENDOR_NVIDIA:
+            printf("vendor|nvidia\n");
+            break;
+        case GSR_GPU_VENDOR_BROADCOM:
+            printf("vendor|broadcom\n");
+            break;
+    }
+    printf("card_path|%s\n", egl->card_path); // info_command resets card_path to "" and only fills it when DRM monitor capture is used, so this can print an empty path
+}
+
+static const AVCodec* get_ffmpeg_video_codec(gsr_video_codec video_codec, gsr_gpu_vendor vendor) { // Looks up the FFmpeg encoder for |video_codec| by name: "*_nvenc" for NVIDIA, "*_vaapi" for any other vendor; callers treat a null result as "encoder not available"
+    switch(video_codec) {
+        case GSR_VIDEO_CODEC_H264:
+            return avcodec_find_encoder_by_name(vendor == GSR_GPU_VENDOR_NVIDIA ? "h264_nvenc" : "h264_vaapi");
+        case GSR_VIDEO_CODEC_HEVC:
+        case GSR_VIDEO_CODEC_HEVC_HDR:
+        case GSR_VIDEO_CODEC_HEVC_10BIT: // All HEVC variants map to the same encoder name
+            return avcodec_find_encoder_by_name(vendor == GSR_GPU_VENDOR_NVIDIA ? "hevc_nvenc" : "hevc_vaapi");
+        case GSR_VIDEO_CODEC_AV1:
+        case GSR_VIDEO_CODEC_AV1_HDR:
+        case GSR_VIDEO_CODEC_AV1_10BIT: // All AV1 variants map to the same encoder name
+            return avcodec_find_encoder_by_name(vendor == GSR_GPU_VENDOR_NVIDIA ? "av1_nvenc" : "av1_vaapi");
+        case GSR_VIDEO_CODEC_VP8:
+            return avcodec_find_encoder_by_name(vendor == GSR_GPU_VENDOR_NVIDIA ? "vp8_nvenc" : "vp8_vaapi");
+        case GSR_VIDEO_CODEC_VP9:
+            return avcodec_find_encoder_by_name(vendor == GSR_GPU_VENDOR_NVIDIA ? "vp9_nvenc" : "vp9_vaapi");
+        case GSR_VIDEO_CODEC_H264_VULKAN: // Vulkan encoder names do not depend on |vendor|
+            return avcodec_find_encoder_by_name("h264_vulkan");
+        case GSR_VIDEO_CODEC_HEVC_VULKAN:
+            return avcodec_find_encoder_by_name("hevc_vulkan");
+    }
+    return nullptr; // |video_codec| value without a case above
+}
+
+static void set_supported_video_codecs_ffmpeg(gsr_supported_video_codecs *supported_video_codecs, gsr_supported_video_codecs *supported_video_codecs_vulkan, gsr_gpu_vendor vendor) { // Clears the supported flag of every codec for which get_ffmpeg_video_codec finds no encoder; flags are only cleared here, never set
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_H264, vendor)) {
+        supported_video_codecs->h264.supported = false;
+    }
+
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_HEVC, vendor)) { // One lookup decides hevc, hevc_hdr and hevc_10bit
+        supported_video_codecs->hevc.supported = false;
+        supported_video_codecs->hevc_hdr.supported = false;
+        supported_video_codecs->hevc_10bit.supported = false;
+    }
+
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_AV1, vendor)) { // One lookup decides av1, av1_hdr and av1_10bit
+        supported_video_codecs->av1.supported = false;
+        supported_video_codecs->av1_hdr.supported = false;
+        supported_video_codecs->av1_10bit.supported = false;
+    }
+
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_VP8, vendor)) {
+        supported_video_codecs->vp8.supported = false;
+    }
+
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_VP9, vendor)) {
+        supported_video_codecs->vp9.supported = false;
+    }
+
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_H264_VULKAN, vendor)) { // Vulkan results live in the separate |supported_video_codecs_vulkan| struct
+        supported_video_codecs_vulkan->h264.supported = false;
+    }
+
+    if(!get_ffmpeg_video_codec(GSR_VIDEO_CODEC_HEVC_VULKAN, vendor)) {
+        supported_video_codecs_vulkan->hevc.supported = false;
+        supported_video_codecs_vulkan->hevc_hdr.supported = false;
+        supported_video_codecs_vulkan->hevc_10bit.supported = false;
+    }
+}
+
+static void list_supported_video_codecs(gsr_egl *egl, bool wayland) { // Prints one line per usable video codec name to stdout
+    // Don't clean up on purpose (cleanup=false in the queries below) to increase shutdown speed
+    gsr_supported_video_codecs supported_video_codecs;
+    get_supported_video_codecs(egl, GSR_VIDEO_CODEC_H264, false, false, &supported_video_codecs); // Return value is ignored; the struct is zeroed before any backend query
+
+    gsr_supported_video_codecs supported_video_codecs_vulkan;
+    get_supported_video_codecs(egl, GSR_VIDEO_CODEC_H264_VULKAN, false, false, &supported_video_codecs_vulkan); // A vulkan codec value routes the query to the vulkan backend
+
+    set_supported_video_codecs_ffmpeg(&supported_video_codecs, &supported_video_codecs_vulkan, egl->gpu_info.vendor); // Drop codecs that have no matching FFmpeg encoder
+
+    if(supported_video_codecs.h264.supported)
+        puts("h264");
+    if(avcodec_find_encoder_by_name("libx264")) // Software h264 depends only on FFmpeg having libx264, not on the GPU query
+        puts("h264_software");
+    if(supported_video_codecs.hevc.supported)
+        puts("hevc");
+    if(supported_video_codecs.hevc_hdr.supported && wayland) // HDR variants are only listed on wayland
+        puts("hevc_hdr");
+    if(supported_video_codecs.hevc_10bit.supported)
+        puts("hevc_10bit");
+    if(supported_video_codecs.av1.supported)
+        puts("av1");
+    if(supported_video_codecs.av1_hdr.supported && wayland) // HDR variants are only listed on wayland
+        puts("av1_hdr");
+    if(supported_video_codecs.av1_10bit.supported)
+        puts("av1_10bit");
+    if(supported_video_codecs.vp8.supported)
+        puts("vp8");
+    if(supported_video_codecs.vp9.supported)
+        puts("vp9");
+    //if(supported_video_codecs_vulkan.h264.supported)
+    //    puts("h264_vulkan");
+    //if(supported_video_codecs_vulkan.hevc.supported)
+    //    puts("hevc_vulkan"); // TODO: hdr, 10 bit
+}
+
+static bool monitor_capture_use_drm(const gsr_window *window, gsr_gpu_vendor vendor) { // True on wayland for every vendor; on any other display server only for non-NVIDIA vendors
+    return gsr_window_get_display_server(window) == GSR_DISPLAY_SERVER_WAYLAND || vendor != GSR_GPU_VENDOR_NVIDIA;
+}
+
+typedef struct { // Userdata handed to output_monitor_info through for_each_active_monitor_output
+    const gsr_window *window; // Used to determine the display server and to query per-monitor data
+    int num_monitors; // Incremented once per monitor reported by output_monitor_info
+} capture_options_callback;
+
+static void output_monitor_info(const gsr_monitor *monitor, void *userdata) { // Prints one "name|WIDTHxHEIGHT" line for |monitor| and counts it in the capture_options_callback behind |userdata|
+    capture_options_callback *options = (capture_options_callback*)userdata;
+    if(gsr_window_get_display_server(options->window) == GSR_DISPLAY_SERVER_WAYLAND) {
+        vec2i monitor_size = monitor->size;
+        gsr_monitor_rotation monitor_rotation = GSR_MONITOR_ROT_0; // Initialized before the query so it holds a defined value either way
+        vec2i monitor_position = {0, 0}; // Required by the query below but otherwise unused here
+        drm_monitor_get_display_server_data(options->window, monitor, &monitor_rotation, &monitor_position);
+        if(monitor_rotation == GSR_MONITOR_ROT_90 || monitor_rotation == GSR_MONITOR_ROT_270) // Quarter-turn rotation: report width and height swapped
+            std::swap(monitor_size.x, monitor_size.y);
+        printf("%.*s|%dx%d\n", monitor->name_len, monitor->name, monitor_size.x, monitor_size.y);
     } else {
-        fprintf(stderr, "Warning: gpu-screen-recorder pid file is in incorrect format, it's possible that its corrupt. Replacing file and continuing...\n");
+        printf("%.*s|%dx%d\n", monitor->name_len, monitor->name, monitor->size.x, monitor->size.y); // Not wayland: report the size unmodified
     }
-    unlink(pid_file);
+    ++options->num_monitors; // Counted on both paths
 }
 
-static void handle_new_pid_file(const char *mode) {
-    int fd = open(pid_file, O_WRONLY|O_CREAT|O_TRUNC, 0777);
-    if(fd == -1) {
-        perror("failed to create gpu-screen-recorder pid file");
-        exit(1);
+static void list_supported_capture_options(const gsr_window *window, const char *card_path, bool list_monitors) { // Prints the available capture targets to stdout, one per line
+    const bool wayland = gsr_window_get_display_server(window) == GSR_DISPLAY_SERVER_WAYLAND;
+    if(!wayland) { // "window" and "focused" are only offered when not on wayland
+        puts("window");
+        puts("focused");
     }
 
-    char buffer[256];
-    const int buffer_size = snprintf(buffer, sizeof(buffer), "%ld %s", (long)getpid(), mode);
-    if(write(fd, buffer, buffer_size) == -1) {
-        perror("failed to write gpu-screen-recorder pid file");
-        exit(1);
+    capture_options_callback options;
+    options.window = window;
+    options.num_monitors = 0;
+    if(list_monitors) { // Callers in this file pass false only when gsr_get_valid_card_path failed
+        const bool is_x11 = gsr_window_get_display_server(window) == GSR_DISPLAY_SERVER_X11;
+        const gsr_connection_type connection_type = is_x11 ? GSR_CONNECTION_X11 : GSR_CONNECTION_DRM;
+        for_each_active_monitor_output(window, card_path, connection_type, output_monitor_info, &options); // Prints each monitor and counts it in options.num_monitors
     }
-    close(fd);
+
+    if(options.num_monitors > 0) // "region" is only offered when at least one monitor was listed
+        puts("region");
+
+#ifdef GSR_PORTAL
+    // Desktop portal capture on x11 doesn't seem to be hardware accelerated
+    if(!wayland)
+        return;
+
+    gsr_dbus dbus;
+    if(!gsr_dbus_init(&dbus, NULL))
+        return;
+
+    char *session_handle = NULL;
+    if(gsr_dbus_screencast_create_session(&dbus, &session_handle) == 0) // "portal" is offered only when a screencast session can be created
+        puts("portal");
+
+    gsr_dbus_deinit(&dbus); // NOTE(review): session_handle is never released in this function; if the callee hands ownership to the caller it should be freed - confirm against gsr_dbus_screencast_create_session
+#endif
 }
 
-int main(int argc, char **argv) {
-    signal(SIGTERM, term_handler);
-    signal(SIGINT, int_handler);
-    signal(SIGUSR1, save_replay_handler);
+static void version_command(void *userdata) { // Prints GSR_VERSION to stdout and terminates the process with status 0; never returns
+    (void)userdata; // Unused
+    puts(GSR_VERSION);
+    fflush(stdout); // _exit() does not flush stdio buffers, so flush explicitly first
+    _exit(0);
+}
 
-    handle_existing_pid_file();
+static void info_command(void *userdata) { // Prints system, GPU, video codec, image format and capture option info as "section=..." groups to stdout, then terminates the process; never returns
+    (void)userdata; // Unused
+    bool wayland = false;
+    Display *dpy = XOpenDisplay(nullptr);
+    if (!dpy) { // No X connection is treated as wayland without Xwayland
+        wayland = true;
+        fprintf(stderr, "gsr warning: failed to connect to the X server. Assuming wayland is running without Xwayland\n");
+    }
 
-    std::map<std::string, Arg> args = {
-        { "-w", Arg { nullptr, false } },
-        //{ "-s", Arg { nullptr, true } },
-        { "-c", Arg { nullptr, false } },
-        { "-f", Arg { nullptr, false } },
-        { "-s", Arg { nullptr, true } },
-        { "-a", Arg { nullptr, true } },
-        { "-q", Arg { nullptr, true } },
-        { "-o", Arg { nullptr, true } },
-        { "-r", Arg { nullptr, true } }
-    };
+    XSetErrorHandler(x11_error_handler);
+    XSetIOErrorHandler(x11_io_error_handler);
 
-    for(int i = 1; i < argc - 1; i += 2) {
-        auto it = args.find(argv[i]);
-        if(it == args.end()) {
-            fprintf(stderr, "Invalid argument '%s'\n", argv[i]);
-            usage();
-        }
-        it->second.value = argv[i + 1];
+    if(!wayland)
+        wayland = is_xwayland(dpy); // An X connection that is_xwayland() recognizes is also treated as wayland
+
+    if(!wayland && is_using_prime_run()) {
+        // Disable prime-run and similar options as it doesn't work, the monitor to capture has to be run on the same device.
+        // This is fine on wayland since nvidia uses drm interface there and the monitor query checks the monitors connected
+        // to the drm device.
+        fprintf(stderr, "gsr warning: use of prime-run on X11 is not supported. Disabling prime-run\n");
+        disable_prime_run();
+    }
+
+    gsr_window *window = gsr_window_create(dpy, wayland);
+    if(!window) {
+        fprintf(stderr, "gsr error: failed to create window\n");
+        _exit(1);
+    }
+
+    gsr_egl egl;
+    if(!gsr_egl_load(&egl, window, false, false)) {
+        fprintf(stderr, "gsr error: failed to load opengl\n");
+        _exit(22); // Exit status differs from the window creation failure above
     }
 
-    for(auto &it : args) {
-        if(!it.second.optional && !it.second.value) {
-            fprintf(stderr, "Missing argument '%s'\n", it.first.c_str());
-            usage();
+    bool list_monitors = true;
+    egl.card_path[0] = '\0'; // Stays empty unless DRM monitor capture is used
+    if(monitor_capture_use_drm(window, egl.gpu_info.vendor)) {
+        // TODO: Allow specifying another card, and in other places
+        if(!gsr_get_valid_card_path(&egl, egl.card_path, true)) {
+            fprintf(stderr, "gsr error: no /dev/dri/cardX device found. Make sure that you have at least one monitor connected\n");
+            list_monitors = false; // Not fatal: the rest of the info is still printed, only monitor listing is skipped
         }
     }
 
-    Arg &audio_input_arg = args["-a"];
+    av_log_set_level(AV_LOG_FATAL); // Restrict FFmpeg logging to fatal messages for the encoder lookups below
+
+    puts("section=system_info");
+    list_system_info(wayland);
+    if(egl.gpu_info.is_steam_deck)
+        puts("is_steam_deck|yes");
+    else
+        puts("is_steam_deck|no");
+    printf("gsr_version|%s\n", GSR_VERSION);
+    puts("section=gpu_info");
+    list_gpu_info(&egl);
+    puts("section=video_codecs");
+    list_supported_video_codecs(&egl, wayland);
+    puts("section=image_formats");
+    puts("jpeg");
+    puts("png");
+    puts("section=capture_options");
+    list_supported_capture_options(window, egl.card_path, list_monitors);
+
+    fflush(stdout); // _exit() below does not flush stdio buffers
+
+    // Not needed as this will just slow down shutdown
+    //gsr_egl_unload(&egl);
+    //gsr_window_destroy(&window);
+    //if(dpy)
+    //    XCloseDisplay(dpy);
+
+    _exit(0);
+}
+
+static void list_audio_devices_command(void *userdata) { // Prints the available audio devices as "name|description" lines to stdout, then terminates the process with status 0
+    (void)userdata; // Unused
+    const AudioDevices audio_devices = get_pulseaudio_inputs();
 
-    uint32_t region_x = 0;
-    uint32_t region_y = 0;
-    uint32_t region_width = 0;
-    uint32_t region_height = 0;
+    if(!audio_devices.default_output.empty()) // Listed under a fixed alias, only when default_output is non-empty
+        puts("default_output|Default output");
 
-    /*
-    TODO: Fix this. Doesn't work for some reason
-    const char *screen_region = args["-s"].value;
-    if(screen_region) {
-        if(sscanf(screen_region, "%ux%u+%u+%u", &region_x, &region_y, &region_width, &region_height) != 4) {
-            fprintf(stderr, "Invalid value for -s '%s', expected a value in format WxH+X+Y\n", screen_region);
-            return 1;
+    if(!audio_devices.default_input.empty()) // Listed under a fixed alias, only when default_input is non-empty
+        puts("default_input|Default input");
+
+    for(const auto &audio_input : audio_devices.audio_inputs) {
+        printf("%s|%s\n", audio_input.name.c_str(), audio_input.description.c_str());
+    }
+
+    fflush(stdout); // _exit() below does not flush stdio buffers
+    _exit(0);
+}
+
+static bool app_audio_query_callback(const char *app_name, void*) { // Callback for gsr_pipewire_audio_for_each_app: prints one application name per line
+    puts(app_name);
+    return true; // Presumably tells the iteration to continue - confirm against gsr_pipewire_audio_for_each_app
+}
+
+static void list_application_audio_command(void *userdata) { // Prints application names reported by pipewire audio, one per line, then terminates the process with status 0
+    (void)userdata; // Unused
+#ifdef GSR_APP_AUDIO
+    if(pulseaudio_server_is_pipewire()) { // Nothing is printed when this check fails or when built without GSR_APP_AUDIO
+        gsr_pipewire_audio audio;
+        if(gsr_pipewire_audio_init(&audio)) {
+            gsr_pipewire_audio_for_each_app(&audio, app_audio_query_callback, NULL);
+            gsr_pipewire_audio_deinit(&audio);
         }
     }
-    */
+#endif
+
+    fflush(stdout); // _exit() below does not flush stdio buffers
+    _exit(0);
+}
 
-    const char *container_format = args["-c"].value;
-    int fps = atoi(args["-f"].value);
-    if(fps == 0) {
-        fprintf(stderr, "Invalid fps argument: %s\n", args["-f"].value);
-        return 1;
+// Prints the supported capture options and exits. |card_path| can be NULL, in which case opengl is loaded to look up a valid card path
+static void list_capture_options_command(const char *card_path, void *userdata) {
+    (void)userdata; // Unused
+    bool wayland = false;
+    Display *dpy = XOpenDisplay(nullptr);
+    if (!dpy) { // No X connection is treated as wayland without Xwayland
+        wayland = true;
+        fprintf(stderr, "gsr warning: failed to connect to the X server. Assuming wayland is running without Xwayland\n");
     }
-    if(fps > 250)
-        fps = 250;
 
-    const char *quality_str = args["-q"].value;
-    if(!quality_str)
-        quality_str = "medium";
+    XSetErrorHandler(x11_error_handler);
+    XSetIOErrorHandler(x11_io_error_handler);
 
-    VideoQuality quality;
-    if(strcmp(quality_str, "medium") == 0) {
-        quality = VideoQuality::MEDIUM;
-    } else if(strcmp(quality_str, "high") == 0) {
-        quality = VideoQuality::HIGH;
-    } else if(strcmp(quality_str, "ultra") == 0) {
-        quality = VideoQuality::ULTRA;
-    } else {
-        fprintf(stderr, "Error: -q should either be either 'medium', 'high' or 'ultra', got: '%s'\n", quality_str);
-        usage();
+    if(!wayland)
+        wayland = is_xwayland(dpy); // An X connection that is_xwayland() recognizes is also treated as wayland
+
+    if(!wayland && is_using_prime_run()) {
+        // Disable prime-run and similar options as it doesn't work, the monitor to capture has to be run on the same device.
+        // This is fine on wayland since nvidia uses drm interface there and the monitor query checks the monitors connected
+        // to the drm device.
+        fprintf(stderr, "gsr warning: use of prime-run on X11 is not supported. Disabling prime-run\n");
+        disable_prime_run();
+    }
+
+    gsr_window *window = gsr_window_create(dpy, wayland);
+    if(!window) {
+        fprintf(stderr, "gsr error: failed to create window\n");
+        _exit(1);
     }
 
-    int replay_buffer_size_secs = -1;
-    const char *replay_buffer_size_secs_str = args["-r"].value;
-    if(replay_buffer_size_secs_str) {
-        replay_buffer_size_secs = atoi(replay_buffer_size_secs_str);
-        if(replay_buffer_size_secs < 5 || replay_buffer_size_secs > 1200) {
-            fprintf(stderr, "Error: option -r has to be between 5 and 1200, was: %s\n", replay_buffer_size_secs_str);
-            return 1;
+    if(card_path) { // Caller supplied the card: opengl is not loaded and monitors are always listed
+        list_supported_capture_options(window, card_path, true);
+    } else {
+        gsr_egl egl;
+        if(!gsr_egl_load(&egl, window, false, false)) {
+            fprintf(stderr, "gsr error: failed to load opengl\n");
+            _exit(1);
+        }
+
+        bool list_monitors = true;
+        egl.card_path[0] = '\0'; // Stays empty unless DRM monitor capture is used
+        if(monitor_capture_use_drm(window, egl.gpu_info.vendor)) {
+            // TODO: Allow specifying another card, and in other places
+            if(!gsr_get_valid_card_path(&egl, egl.card_path, true)) {
+                fprintf(stderr, "gsr error: no /dev/dri/cardX device found. Make sure that you have at least one monitor connected\n");
+                list_monitors = false; // Not fatal: the remaining options are still printed
+            }
         }
-        replay_buffer_size_secs += 5; // Add a few seconds to account of lost packets because of non-keyframe packets skipped
+        list_supported_capture_options(window, egl.card_path, list_monitors);
     }
 
-    CUresult res;
+    fflush(stdout); // _exit() below does not flush stdio buffers
+
+    // Not needed as this will just slow down shutdown
+    //gsr_egl_unload(&egl);
+    //gsr_window_destroy(&window);
+    //if(dpy)
+    //    XCloseDisplay(dpy);
+
+    _exit(0);
+}
+
+static std::string validate_monitor_get_valid(const gsr_egl *egl, const char* window) { // Resolves a monitor capture target: "screen" becomes the first active output's name, other names are checked to exist; exits the process with status 51 on failure
+    const bool is_x11 = gsr_window_get_display_server(egl->window) == GSR_DISPLAY_SERVER_X11;
+    const gsr_connection_type connection_type = is_x11 ? GSR_CONNECTION_X11 : GSR_CONNECTION_DRM;
+    const bool capture_use_drm = monitor_capture_use_drm(egl->window, egl->gpu_info.vendor);
+
+    std::string window_result = window;
+    if(strcmp(window_result.c_str(), "screen") == 0) {
+        FirstOutputCallback data;
+        data.output_name = NULL; // Still NULL after the iteration when no output was found
+        for_each_active_monitor_output(egl->window, egl->card_path, connection_type, get_first_output_callback, &data);
 
-    res = cuInit(0);
-    if(res != CUDA_SUCCESS) {
-        const char *err_str;
-        cuGetErrorString(res, &err_str);
-        fprintf(stderr, "Error: cuInit failed, error %s (result: %d)\n", err_str, res);
-        return 1;
+        if(data.output_name) {
+            window_result = data.output_name;
+            free(data.output_name); // The name was copied into window_result above
+        } else {
+            fprintf(stderr, "gsr error: no usable output found\n");
+            _exit(51);
+        }
+    } else if(capture_use_drm || (strcmp(window_result.c_str(), "screen-direct") != 0 && strcmp(window_result.c_str(), "screen-direct-force") != 0)) { // "screen-direct" and "screen-direct-force" skip the name lookup only when DRM capture is not used
+        gsr_monitor gmon;
+        if(!get_monitor_by_name(egl, connection_type, window_result.c_str(), &gmon)) {
+            fprintf(stderr, "gsr error: display \"%s\" not found, expected one of:\n", window_result.c_str());
+            fprintf(stderr, "  \"screen\"\n");
+            if(!capture_use_drm) // "screen-direct" is only suggested when DRM capture is not used
+                fprintf(stderr, "  \"screen-direct\"\n");
+
+            MonitorOutputCallbackUserdata userdata;
+            userdata.window = egl->window;
+            for_each_active_monitor_output(egl->window, egl->card_path, connection_type, monitor_output_callback_print, &userdata); // Presumably prints the available monitor names - confirm against monitor_output_callback_print
+            _exit(51);
+        }
     }
+    return window_result;
+}
 
-    int nGpu = 0;
-    cuDeviceGetCount(&nGpu);
-    if (nGpu <= 0) {
-        fprintf(stderr, "Error: no cuda supported devices found\n");
-        return 1;
+static std::string get_monitor_by_region_center(const gsr_egl *egl, vec2i region_position, vec2i region_size, vec2i *monitor_pos, vec2i *monitor_size) { // Looks up a monitor for the region's center point; returns its name (empty when the callback found none) and always writes |monitor_pos| and |monitor_size|
+    const bool is_x11 = gsr_window_get_display_server(egl->window) == GSR_DISPLAY_SERVER_X11;
+    const gsr_connection_type connection_type = is_x11 ? GSR_CONNECTION_X11 : GSR_CONNECTION_DRM;
+
+    MonitorByPositionCallback data;
+    data.window = egl->window;
+    data.position = { region_position.x + region_size.x / 2, region_position.y + region_size.y / 2 }; // Center point of the region (integer division)
+    data.output_name = NULL; // Still NULL after the iteration when no monitor was selected
+    data.monitor_pos = {0, 0}; // Defaults that are returned when the callback does not set them
+    data.monitor_size = {0, 0};
+    for_each_active_monitor_output(egl->window, egl->card_path, connection_type, get_monitor_by_position_callback, &data);
+
+    std::string result;
+    if(data.output_name) {
+        result = data.output_name;
+        free(data.output_name); // The name was copied into result above
     }
+    *monitor_pos = data.monitor_pos;
+    *monitor_size = data.monitor_size;
+    return result;
+}
 
-    CUdevice cu_dev;
-    res = cuDeviceGet(&cu_dev, 0);
-    if(res != CUDA_SUCCESS) {
-        const char *err_str;
-        cuGetErrorString(res, &err_str);
-        fprintf(stderr, "Error: unable to get CUDA device, error: %s (result: %d)\n", err_str, res);
-        return 1;
+static gsr_capture* create_monitor_capture(const args_parser &arg_parser, gsr_egl *egl, bool prefer_ximage) { // Creates a monitor capture backend: ximage (X11 with |prefer_ximage|), else kms (when DRM capture is used), else nvfbc; returns the backend creator's result, which callers check for null
+    if(gsr_window_get_display_server(egl->window) == GSR_DISPLAY_SERVER_X11 && prefer_ximage) { // |prefer_ximage| only has an effect on X11
+        gsr_capture_ximage_params ximage_params;
+        ximage_params.egl = egl;
+        ximage_params.display_to_capture = arg_parser.window;
+        ximage_params.record_cursor = arg_parser.record_cursor;
+        ximage_params.output_resolution = arg_parser.output_resolution;
+        ximage_params.region_size = arg_parser.region_size;
+        ximage_params.region_position = arg_parser.region_position;
+        return gsr_capture_ximage_create(&ximage_params);
     }
 
-    CUcontext cu_ctx;
-    res = cuCtxCreate_v2(&cu_ctx, CU_CTX_SCHED_AUTO, cu_dev);
-    if(res != CUDA_SUCCESS) {
-        const char *err_str;
-        cuGetErrorString(res, &err_str);
-        fprintf(stderr, "Error: unable to create CUDA context, error: %s (result: %d)\n", err_str, res);
-        return 1;
+    if(monitor_capture_use_drm(egl->window, egl->gpu_info.vendor)) {
+        gsr_capture_kms_params kms_params;
+        kms_params.egl = egl;
+        kms_params.display_to_capture = arg_parser.window;
+        kms_params.record_cursor = arg_parser.record_cursor;
+        kms_params.hdr = video_codec_is_hdr(arg_parser.video_codec); // HDR is derived from the selected video codec
+        kms_params.fps = arg_parser.fps;
+        kms_params.output_resolution = arg_parser.output_resolution;
+        kms_params.region_size = arg_parser.region_size;
+        kms_params.region_position = arg_parser.region_position;
+        return gsr_capture_kms_create(&kms_params);
+    } else {
+        const char *capture_target = arg_parser.window;
+        const bool direct_capture = strcmp(arg_parser.window, "screen-direct") == 0 || strcmp(arg_parser.window, "screen-direct-force") == 0;
+        if(direct_capture) {
+            capture_target = "screen"; // nvfbc receives "screen" as the target; directness is passed separately through direct_capture
+            fprintf(stderr, "gsr warning: %s capture option is not recommended unless you use G-SYNC as Nvidia has driver issues that can cause your system or games to freeze/crash.\n", arg_parser.window);
+        }
+
+        gsr_capture_nvfbc_params nvfbc_params;
+        nvfbc_params.egl = egl;
+        nvfbc_params.display_to_capture = capture_target;
+        nvfbc_params.fps = arg_parser.fps;
+        nvfbc_params.direct_capture = direct_capture;
+        nvfbc_params.record_cursor = arg_parser.record_cursor;
+        nvfbc_params.output_resolution = arg_parser.output_resolution;
+        nvfbc_params.region_size = arg_parser.region_size;
+        nvfbc_params.region_position = arg_parser.region_position;
+        return gsr_capture_nvfbc_create(&nvfbc_params);
     }
+}
 
-    uint32_t window_width = 0;
-    uint32_t window_height = 0;
+static std::string region_get_data(gsr_egl *egl, vec2i *region_size, vec2i *region_position) { // Finds the monitor for the region's center and rewrites |region_position| relative to it; returns the monitor name, exits the process with status 51 when no monitor matches
+    vec2i monitor_pos = {0, 0};
+    vec2i monitor_size = {0, 0}; // Filled by the lookup below but not used afterwards in this function
+    std::string window = get_monitor_by_region_center(egl, *region_position, *region_size, &monitor_pos, &monitor_size);
+    if(window.empty()) { // Empty name means no monitor was found for the region's center
+        const bool is_x11 = gsr_window_get_display_server(egl->window) == GSR_DISPLAY_SERVER_X11;
+        const gsr_connection_type connection_type = is_x11 ? GSR_CONNECTION_X11 : GSR_CONNECTION_DRM;
+        fprintf(stderr, "gsr error: the region %dx%d+%d+%d doesn't match any monitor. Available monitors and their regions:\n", region_size->x, region_size->y, region_position->x, region_position->y);
+
+        MonitorOutputCallbackUserdata userdata;
+        userdata.window = egl->window;
+        for_each_active_monitor_output(egl->window, egl->card_path, connection_type, monitor_output_callback_print, &userdata); // Presumably prints the available monitors - confirm against monitor_output_callback_print
+        _exit(51);
+    }
 
-    NvFBCLibrary nv_fbc_library;
+    // Capture whole monitor when region size is set to 0x0
+    if(region_size->x == 0 && region_size->y == 0) {
+        region_position->x = 0;
+        region_position->y = 0;
+    } else {
+        region_position->x -= monitor_pos.x; // Make the position relative to the monitor's own position
+        region_position->y -= monitor_pos.y;
+    }
+    return window;
+}
 
-    const char *window_str = args["-w"].value;
+static gsr_capture* create_capture_impl(args_parser &arg_parser, gsr_egl *egl, bool prefer_ximage) { // Creates the capture backend selected by arg_parser.window ("focused", "portal", "region", a monitor name or a window id); exits the process on failure and may overwrite arg_parser.window with the resolved monitor name
     Window src_window_id = None;
-    if(contains_non_hex_number(window_str)) {
-        if(!nv_fbc_library.load())
-            return 1;
+    bool follow_focused = false;
+    const bool wayland = gsr_window_get_display_server(egl->window) == GSR_DISPLAY_SERVER_WAYLAND;
+
+    gsr_capture *capture = nullptr; // Left null by the "focused" and window-id branches; the xcomposite fallback at the end handles those
+    if(strcmp(arg_parser.window, "focused") == 0) {
+        if(wayland) {
+            fprintf(stderr, "gsr error: GPU Screen Recorder window capture only works in a pure X11 session. Xwayland is not supported. You can record a monitor instead on wayland\n");
+            _exit(2);
+        }
 
-        const char *capture_target = window_str;
-        const bool direct_capture = strcmp(window_str, "screen-direct") == 0;
-        if(direct_capture)
-            capture_target = "screen";
+        if(arg_parser.output_resolution.x <= 0 || arg_parser.output_resolution.y <= 0) { // An explicit positive output size is required with "focused"
+            fprintf(stderr, "gsr error: invalid value for option -s '%dx%d' when using -w focused option. expected width and height to be greater than 0\n", arg_parser.output_resolution.x, arg_parser.output_resolution.y);
+            args_parser_print_usage();
+            _exit(1);
+        }
 
-        if(!nv_fbc_library.create(capture_target, fps, &window_width, &window_height, region_x, region_y, region_width, region_height, direct_capture))
-            return 1;
+        follow_focused = true;
+    } else if(strcmp(arg_parser.window, "portal") == 0) {
+#ifdef GSR_PORTAL
+        // Desktop portal capture on x11 doesn't seem to be hardware accelerated
+        if(!wayland) {
+            fprintf(stderr, "gsr error: desktop portal capture is not supported on X11\n");
+            _exit(1);
+        }
+
+        gsr_capture_portal_params portal_params;
+        portal_params.egl = egl;
+        portal_params.record_cursor = arg_parser.record_cursor;
+        portal_params.restore_portal_session = arg_parser.restore_portal_session;
+        portal_params.portal_session_token_filepath = arg_parser.portal_session_token_filepath;
+        portal_params.output_resolution = arg_parser.output_resolution;
+        capture = gsr_capture_portal_create(&portal_params);
+        if(!capture)
+            _exit(1);
+#else
+        fprintf(stderr, "gsr error: option '-w portal' used but GPU Screen Recorder was compiled without desktop portal support. Please recompile GPU Screen recorder with the -Dportal=true option\n");
+        _exit(2);
+#endif
+    } else if(strcmp(arg_parser.window, "region") == 0) {
+        const std::string window = region_get_data(egl, &arg_parser.region_size, &arg_parser.region_position); // Also rewrites region_position relative to the resolved monitor
+        snprintf(arg_parser.window, sizeof(arg_parser.window), "%s", window.c_str()); // Replace "region" with the resolved monitor name
+        capture = create_monitor_capture(arg_parser, egl, prefer_ximage);
+        if(!capture)
+            _exit(1);
+    } else if(contains_non_hex_number(arg_parser.window)) { // Not a plain hex number: treat the value as a monitor name
+        const std::string window = validate_monitor_get_valid(egl, arg_parser.window);
+        snprintf(arg_parser.window, sizeof(arg_parser.window), "%s", window.c_str()); // Store the validated (possibly resolved) monitor name
+        capture = create_monitor_capture(arg_parser, egl, prefer_ximage);
+        if(!capture)
+            _exit(1);
     } else {
+        if(wayland) {
+            fprintf(stderr, "gsr error: GPU Screen Recorder window capture only works in a pure X11 session. Xwayland is not supported. You can record a monitor instead on wayland or use -w portal option which supports window capture if your wayland compositor supports window capture\n");
+            _exit(2);
+        }
+
         errno = 0;
-        src_window_id = strtol(window_str, nullptr, 0);
+        src_window_id = strtol(arg_parser.window, nullptr, 0); // Base 0: strtol picks decimal, 0x-prefixed hex or 0-prefixed octal from the text
         if(src_window_id == None || errno == EINVAL) {
-            fprintf(stderr, "Invalid window number %s\n", window_str);
-            usage();
+            fprintf(stderr, "gsr error: invalid window number %s\n", arg_parser.window);
+            args_parser_print_usage();
+            _exit(1);
         }
     }
 
-    int record_width = window_width;
-    int record_height = window_height;
-    const char *record_area = args["-s"].value;
-    if(record_area) {
-        if(sscanf(record_area, "%dx%d", &record_width, &record_height) != 2) {
-            fprintf(stderr, "Invalid value for -s '%s', expected a value in format WxH\n", record_area);
-            return 1;
+    if(!capture) { // Only the "focused" and window-id branches get here without a capture
+        gsr_capture_xcomposite_params xcomposite_params;
+        xcomposite_params.egl = egl;
+        xcomposite_params.window = src_window_id; // Still None when following the focused window
+        xcomposite_params.follow_focused = follow_focused;
+        xcomposite_params.record_cursor = arg_parser.record_cursor;
+        xcomposite_params.output_resolution = arg_parser.output_resolution;
+        capture = gsr_capture_xcomposite_create(&xcomposite_params);
+        if(!capture)
+            _exit(1);
+    }
+
+    return capture; // Never null: every failure path above exits the process
+}
+
+static gsr_color_range image_format_to_color_range(gsr_image_format image_format) { // Maps an image format to a color range: JPEG -> limited, PNG -> full
+    switch(image_format) {
+        case GSR_IMAGE_FORMAT_JPEG: return GSR_COLOR_RANGE_LIMITED;
+        case GSR_IMAGE_FORMAT_PNG:  return GSR_COLOR_RANGE_FULL;
+    }
+    assert(false); // Reached only for a value without a case above
+    return GSR_COLOR_RANGE_FULL; // Fallback when asserts are compiled out
+}
+
+static int video_quality_to_image_quality_value(gsr_video_quality video_quality) { // Maps a video quality preset to an integer image quality value (75, 85, 90 or 97)
+    switch(video_quality) {
+        case GSR_VIDEO_QUALITY_MEDIUM:
+            return 75;
+        case GSR_VIDEO_QUALITY_HIGH:
+            return 85;
+        case GSR_VIDEO_QUALITY_VERY_HIGH:
+            return 90;
+        case GSR_VIDEO_QUALITY_ULTRA:
+            return 97;
+    }
+    assert(false); // Reached only for a value without a case above
+    return 90; // Fallback when asserts are compiled out; same value as the very-high preset
+}
+
+// TODO: 10-bit and hdr.
+static void capture_image_to_file(args_parser &arg_parser, gsr_egl *egl, gsr_image_format image_format) { // Captures one frame and writes it to arg_parser.filename. Never returns: every path ends in _exit().
+    const gsr_color_range color_range = image_format_to_color_range(image_format);
+    const int fps = 60;
+    const bool prefer_ximage = true;
+    gsr_capture *capture = create_capture_impl(arg_parser, egl, prefer_ximage);
+
+    gsr_capture_metadata capture_metadata;
+    capture_metadata.width = 0; // Presumably filled in by gsr_capture_start(); width/height are read below to size the image writer.
+    capture_metadata.height = 0;
+    capture_metadata.fps = fps;
+    capture_metadata.video_codec_context = nullptr; // No video encoder is involved when taking a screenshot.
+    capture_metadata.frame = nullptr;
+
+    int capture_result = gsr_capture_start(capture, &capture_metadata);
+    if(capture_result != 0) {
+        fprintf(stderr, "gsr error: capture_image_to_file: gsr_capture_start failed\n");
+        _exit(capture_result); // The capture backend's error code becomes the process exit status.
+    }
+
+    gsr_image_writer image_writer;
+    if(!gsr_image_writer_init_opengl(&image_writer, egl, capture_metadata.width, capture_metadata.height)) {
+        fprintf(stderr, "gsr error: capture_image_to_file: gsr_image_writer_init_opengl failed\n");
+        _exit(1);
+    }
+
+    gsr_color_conversion_params color_conversion_params;
+    memset(&color_conversion_params, 0, sizeof(color_conversion_params));
+    color_conversion_params.color_range = color_range;
+    color_conversion_params.egl = egl;
+    color_conversion_params.load_external_image_shader = gsr_capture_uses_external_image(capture);
+
+    color_conversion_params.destination_textures[0] = image_writer.texture; // The color conversion renders straight into the image writer's texture.
+    color_conversion_params.num_destination_textures = 1;
+    color_conversion_params.destination_color = GSR_DESTINATION_COLOR_RGB8;
+
+    gsr_color_conversion color_conversion;
+    if(gsr_color_conversion_init(&color_conversion, &color_conversion_params) != 0) {
+        fprintf(stderr, "gsr error: capture_image_to_file: failed to create color conversion\n");
+        _exit(1);
+    }
+
+    gsr_color_conversion_clear(&color_conversion);
+
+    bool should_stop_error = false;
+    egl->glClear(0);
+
+    while(running) { // Retry every 30 ms until one capture succeeds, the capture asks to stop, or running is cleared.
+        should_stop_error = false;
+        if(gsr_capture_should_stop(capture, &should_stop_error)) {
+            running = 0;
+            break;
         }
+
+        // It can fail, for example when capturing portal and the target is a monitor that hasn't been updated.
+        // Desktop portal wont refresh the image until there is an update.
+        // TODO: Find out if there is a way to force update desktop portal image.
+        // This can also happen for example if the system suspends and the monitor to capture's framebuffer is gone, or if the target window disappeared.
+        if(gsr_capture_capture(capture, &capture_metadata, &color_conversion) == 0)
+            break;
+
+        usleep(30 * 1000); // 30 ms
+    }
+
+    gsr_egl_swap_buffers(egl);
+    
+    const int image_quality = video_quality_to_image_quality_value(arg_parser.video_quality);
+    if(!gsr_image_writer_write_to_file(&image_writer, arg_parser.filename, image_format, image_quality)) { // NOTE(review): also reached when the loop ended without a successful capture.
+        fprintf(stderr, "gsr error: capture_image_to_file: failed to write opengl texture to image output file %s\n", arg_parser.filename);
+        _exit(1);
+    }
+
+    gsr_image_writer_deinit(&image_writer);
+    gsr_capture_destroy(capture);
+    _exit(should_stop_error ? 3 : 0); // Exit status 3 when gsr_capture_should_stop() reported an error, otherwise 0.
+}
+
+static AVPixelFormat get_pixel_format(gsr_video_codec video_codec, gsr_gpu_vendor vendor, bool use_software_video_encoder) { // Chooses the AVPixelFormat for the selected encoder path.
+    if(use_software_video_encoder) {
+        return AV_PIX_FMT_NV12; // The software encoder path always uses NV12.
+    } else {
+        if(video_codec_is_vulkan(video_codec))
+            return AV_PIX_FMT_VULKAN;
+        else
+            return vendor == GSR_GPU_VENDOR_NVIDIA ? AV_PIX_FMT_CUDA : AV_PIX_FMT_VAAPI; // CUDA frames on NVIDIA, VAAPI frames for every other vendor.
     }
+}
+
+static void match_app_audio_input_to_available_apps(const std::vector<AudioInput> &requested_audio_inputs, const std::vector<std::string> &app_audio_names) { // Warns on stderr about requested app audio names that match no entry in app_audio_names; never fails.
+    for(const AudioInput &request_audio_input : requested_audio_inputs) {
+        if(request_audio_input.type != AudioInputType::APPLICATION || request_audio_input.inverted) // Only non-inverted application inputs are checked.
+            continue;
 
-    const char *filename = args["-o"].value;
-    if(filename) {
-        if(replay_buffer_size_secs != -1) {
-            struct stat buf;
-            if(stat(filename, &buf) == -1 || !S_ISDIR(buf.st_mode)) {
-                fprintf(stderr, "%s does not exist or is not a directory\n", filename);
-                usage();
+        bool match = false;
+        for(const std::string &app_name : app_audio_names) {
+            if(strcasecmp(app_name.c_str(), request_audio_input.name.c_str()) == 0) { // Case-insensitive name comparison.
+                match = true;
+                break;
             }
         }
-    } else {
-        if(replay_buffer_size_secs == -1) {
-            filename = "/dev/stdout";
-        } else {
-            fprintf(stderr, "Option -o is required when using option -r\n");
-            usage();
+
+        if(!match) { // Only a warning: the application may simply not have started yet.
+            fprintf(stderr, "gsr warning: no audio application with the name \"%s\" was found, expected one of the following:\n", request_audio_input.name.c_str());
+            for(const std::string &app_name : app_audio_names) {
+                fprintf(stderr, "  * %s\n", app_name.c_str());
+            }
+            fprintf(stderr, "  assuming this is intentional (if you are trying to record audio for applications that haven't started yet).\n");
         }
     }
+}
+
+// Manually check if the audio inputs we give exist. This is only needed for pipewire, not pulseaudio.
+// Pipewire falls back to the default audio input when the requested audio input doesn't exist,
+// so a misspelled audio input name would otherwise silently record from the wrong device.
+static std::vector<MergedAudioInputs> parse_audio_inputs(const AudioDevices &audio_devices, const Arg *audio_input_arg) { // Parses every value of the audio argument and validates DEVICE inputs; exits the process on an invalid device.
+    std::vector<MergedAudioInputs> requested_audio_inputs;
+
+    for(int i = 0; i < audio_input_arg->num_values; ++i) {
+        const char *audio_input = audio_input_arg->values[i];
+        if(!audio_input || audio_input[0] == '\0') // Null or empty values are skipped.
+            continue;
 
-    const double target_fps = 1.0 / (double)fps;
+        requested_audio_inputs.push_back(parse_audio_input_arg(audio_input));
+        for(AudioInput &request_audio_input : requested_audio_inputs.back().audio_inputs) {
+            if(request_audio_input.type != AudioInputType::DEVICE) // Only device inputs are validated here.
+                continue;
 
-    WindowPixmap window_pixmap;
-    Display *dpy = nullptr;
-    GLFWwindow *window = nullptr;
-    if(src_window_id) {
-        dpy = XOpenDisplay(nullptr);
-        if (!dpy) {
-            fprintf(stderr, "Error: Failed to open display\n");
-            return 1;
+            bool match = false;
+
+            if(request_audio_input.name == "default_output") { // Special name: valid only when a default output is known.
+                if(audio_devices.default_output.empty()) {
+                    fprintf(stderr, "gsr error: -a default_output was specified but no default audio output is specified in the audio server\n");
+                    _exit(2);
+                }
+                match = true;
+            } else if(request_audio_input.name == "default_input") { // Special name: valid only when a default input is known.
+                if(audio_devices.default_input.empty()) {
+                    fprintf(stderr, "gsr error: -a default_input was specified but no default audio input is specified in the audio server\n");
+                    _exit(2);
+                }
+                match = true;
+            } else {
+                const bool name_is_existing_audio_device = get_audio_device_by_name(audio_devices.audio_inputs, request_audio_input.name.c_str()) != nullptr;
+                if(name_is_existing_audio_device)
+                    match = true;
+            }
+
+            if(!match) { // Unknown device: list the valid choices, then exit with status 50.
+                fprintf(stderr, "gsr error: Audio device '%s' is not a valid audio device, expected one of:\n", request_audio_input.name.c_str());
+                if(!audio_devices.default_output.empty())
+                    fprintf(stderr, "    default_output (Default output)\n");
+                if(!audio_devices.default_input.empty())
+                    fprintf(stderr, "    default_input (Default input)\n");
+                for(const auto &audio_device_input : audio_devices.audio_inputs) {
+                    fprintf(stderr, "    %s (%s)\n", audio_device_input.name.c_str(), audio_device_input.description.c_str());
+                }
+                _exit(50);
+            }
         }
+    }
+
+    return requested_audio_inputs;
+}
 
-        bool has_name_pixmap = x11_supports_composite_named_window_pixmap(dpy);
-        if (!has_name_pixmap) {
-            fprintf(stderr, "Error: XCompositeNameWindowPixmap is not supported by "
-                            "your X11 server\n");
-            return 1;
+static bool audio_inputs_has_app_audio(const std::vector<AudioInput> &audio_inputs) { // True when at least one input is of type APPLICATION.
+    for(const auto &audio_input : audio_inputs) {
+        if(audio_input.type == AudioInputType::APPLICATION)
+            return true;
+    }
+    return false; // Also the result for an empty list.
+}
+
+static bool merged_audio_inputs_has_app_audio(const std::vector<MergedAudioInputs> &merged_audio_inputs) { // True when any merged audio input contains an APPLICATION input.
+    for(const auto &merged_audio_input : merged_audio_inputs) {
+        if(audio_inputs_has_app_audio(merged_audio_input.audio_inputs))
+            return true;
+    }
+    return false; // Also the result for an empty list.
+}
+
+// Should use amix if more than 1 audio device and 0 application audio, merged
+static bool audio_inputs_should_use_amix(const std::vector<AudioInput> &audio_inputs) { // Decides this for the inputs of a single merged audio input.
+    int num_audio_devices = 0;
+    int num_app_audio = 0;
+
+    for(const auto &audio_input : audio_inputs) { // Count DEVICE and APPLICATION inputs; any other type is ignored.
+        if(audio_input.type == AudioInputType::DEVICE)
+            ++num_audio_devices;
+        else if(audio_input.type == AudioInputType::APPLICATION)
+            ++num_app_audio;
+    }
+
+    return num_audio_devices > 1 && num_app_audio == 0;
+}
+
+static bool merged_audio_inputs_should_use_amix(const std::vector<MergedAudioInputs> &merged_audio_inputs) { // True when any merged audio input satisfies audio_inputs_should_use_amix().
+    for(const auto &merged_audio_input : merged_audio_inputs) {
+        if(audio_inputs_should_use_amix(merged_audio_input.audio_inputs))
+            return true;
+    }
+    return false; // Also the result for an empty list.
+}
+
+static void validate_merged_audio_inputs_app_audio(const std::vector<MergedAudioInputs> &merged_audio_inputs, const std::vector<std::string> &app_audio_names) { // Per merged audio input: warns about unknown app names and exits with status 2 when normal and inverted app inputs are mixed.
+    for(const auto &merged_audio_input : merged_audio_inputs) {
+        int num_app_audio = 0;
+        int num_app_inverted_audio = 0;
+
+        for(const auto &audio_input : merged_audio_input.audio_inputs) { // Count inverted and non-inverted APPLICATION inputs separately.
+            if(audio_input.type == AudioInputType::APPLICATION) {
+                if(audio_input.inverted)
+                    ++num_app_inverted_audio;
+                else
+                    ++num_app_audio;
+            }
         }
 
-        XWindowAttributes attr;
-        if (!XGetWindowAttributes(dpy, src_window_id, &attr)) {
-            fprintf(stderr, "Error: Invalid window id: %lu\n", src_window_id);
-            return 1;
+        match_app_audio_input_to_available_apps(merged_audio_input.audio_inputs, app_audio_names); // Only prints warnings; runs before the fatal check below.
+
+        if(num_app_audio > 0 && num_app_inverted_audio > 0) {
+            fprintf(stderr, "gsr error: argument -a was provided with both app: and app-inverse:, only one of them can be used for one audio track\n");
+            _exit(2);
+        }
+    }
+}
+
+static gsr_audio_codec select_audio_codec_with_fallback(gsr_audio_codec audio_codec, const std::string &file_extension, bool uses_amix) { // Returns audio_codec, or a replacement codec (with a warning on stderr) when the container extension can't hold it.
+    switch(audio_codec) {
+        case GSR_AUDIO_CODEC_AAC: {
+            if(file_extension == "webm") {
+                //audio_codec_to_use = "opus";
+                audio_codec = GSR_AUDIO_CODEC_OPUS;
+                fprintf(stderr, "gsr warning: .webm files only support opus audio codec, changing audio codec from aac to opus\n");
+            }
+            break;
+        }
+        case GSR_AUDIO_CODEC_OPUS: {
+            // TODO: Also check mpegts?
+            if(file_extension != "mp4" && file_extension != "mkv" && file_extension != "webm") {
+                //audio_codec_to_use = "aac";
+                audio_codec = GSR_AUDIO_CODEC_AAC;
+                fprintf(stderr, "gsr warning: opus audio codec is only supported by .mp4, .mkv and .webm files, falling back to aac instead\n");
+            }
+            break;
+        }
+        case GSR_AUDIO_CODEC_FLAC: { // The checks are ordered: webm first, then other non-mp4/mkv containers, then amix.
+            // TODO: Also check mpegts?
+            if(file_extension == "webm") {
+                //audio_codec_to_use = "opus";
+                audio_codec = GSR_AUDIO_CODEC_OPUS;
+                fprintf(stderr, "gsr warning: .webm files only support opus audio codec, changing audio codec from flac to opus\n");
+            } else if(file_extension != "mp4" && file_extension != "mkv") {
+                //audio_codec_to_use = "aac";
+                audio_codec = GSR_AUDIO_CODEC_AAC;
+                fprintf(stderr, "gsr warning: flac audio codec is only supported by .mp4 and .mkv files, falling back to aac instead\n");
+            } else if(uses_amix) { // uses_amix only influences the FLAC case.
+                // TODO: remove this? is it true anymore?
+                //audio_codec_to_use = "opus";
+                audio_codec = GSR_AUDIO_CODEC_OPUS;
+                fprintf(stderr, "gsr warning: flac audio codec is not supported when mixing audio sources, falling back to opus instead\n");
+            }
+            break;
         }
+    }
+    return audio_codec;
+}
 
-        window_width = attr.width;
-        window_height = attr.height;
+static bool video_codec_only_supports_low_power_mode(const gsr_supported_video_codecs &supported_video_codecs, gsr_video_codec video_codec) { // Returns the low_power flag recorded for video_codec in supported_video_codecs.
+    switch(video_codec) {
+        case GSR_VIDEO_CODEC_H264:        return supported_video_codecs.h264.low_power;
+        case GSR_VIDEO_CODEC_HEVC:        return supported_video_codecs.hevc.low_power;
+        case GSR_VIDEO_CODEC_HEVC_HDR:    return supported_video_codecs.hevc_hdr.low_power;
+        case GSR_VIDEO_CODEC_HEVC_10BIT:  return supported_video_codecs.hevc_10bit.low_power;
+        case GSR_VIDEO_CODEC_AV1:         return supported_video_codecs.av1.low_power;
+        case GSR_VIDEO_CODEC_AV1_HDR:     return supported_video_codecs.av1_hdr.low_power;
+        case GSR_VIDEO_CODEC_AV1_10BIT:   return supported_video_codecs.av1_10bit.low_power;
+        case GSR_VIDEO_CODEC_VP8:         return supported_video_codecs.vp8.low_power;
+        case GSR_VIDEO_CODEC_VP9:         return supported_video_codecs.vp9.low_power;
+        case GSR_VIDEO_CODEC_H264_VULKAN: return supported_video_codecs.h264.low_power; // The vulkan variants read the plain h264/hevc entries.
+        case GSR_VIDEO_CODEC_HEVC_VULKAN: return supported_video_codecs.hevc.low_power; // TODO: hdr, 10 bit
+    }
+    return false; // Value outside the enum cases above.
+}
 
-        XCompositeRedirectWindow(dpy, src_window_id, CompositeRedirectAutomatic);
+static const AVCodec* pick_video_codec(gsr_video_codec *video_codec, gsr_egl *egl, bool use_software_video_encoder, bool video_codec_auto, bool is_flv, bool *low_power) { // Resolves *video_codec to an encoder; may rewrite *video_codec to a fallback, sets *low_power, and exits the process when nothing is usable.
+    // TODO: software encoder for hevc, av1, vp8 and vp9
+    *low_power = false;
 
-        // glXMakeContextCurrent(Display *dpy, GLXDrawable draw, GLXDrawable read,
-        // GLXContext ctx)
-        if (!glfwInit()) {
-            fprintf(stderr, "Error: Failed to initialize glfw\n");
-            return 1;
+    gsr_supported_video_codecs supported_video_codecs;
+    if(!get_supported_video_codecs(egl, *video_codec, use_software_video_encoder, true, &supported_video_codecs)) {
+        fprintf(stderr, "gsr error: failed to query for supported video codecs\n");
+        _exit(11);
+    }
+
+    const AVCodec *video_codec_f = nullptr; // Stays null when the requested codec is not reported as supported.
+
+    switch(*video_codec) {
+        case GSR_VIDEO_CODEC_H264: {
+            if(use_software_video_encoder)
+                video_codec_f = avcodec_find_encoder_by_name("libx264"); // The software path does not consult supported_video_codecs.
+            else if(supported_video_codecs.h264.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_HEVC: {
+            if(supported_video_codecs.hevc.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_HEVC_HDR: {
+            if(supported_video_codecs.hevc_hdr.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_HEVC_10BIT: {
+            if(supported_video_codecs.hevc_10bit.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_AV1: {
+            if(supported_video_codecs.av1.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_AV1_HDR: {
+            if(supported_video_codecs.av1_hdr.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_AV1_10BIT: {
+            if(supported_video_codecs.av1_10bit.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_VP8: {
+            if(supported_video_codecs.vp8.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_VP9: {
+            if(supported_video_codecs.vp9.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_H264_VULKAN: {
+            if(supported_video_codecs.h264.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+        case GSR_VIDEO_CODEC_HEVC_VULKAN: {
+            // TODO: hdr, 10 bit
+            if(supported_video_codecs.hevc.supported)
+                video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+            break;
+        }
+    }
+
+    if(!video_codec_auto && !video_codec_f && !is_flv) { // Fallback is attempted only for an explicitly chosen codec and a non-flv output.
+        switch(*video_codec) {
+            case GSR_VIDEO_CODEC_H264: {
+                fprintf(stderr, "gsr warning: selected video codec h264 is not supported, trying hevc instead\n");
+                *video_codec = GSR_VIDEO_CODEC_HEVC;
+                if(supported_video_codecs.hevc.supported)
+                    video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+                break;
+            }
+            case GSR_VIDEO_CODEC_HEVC:
+            case GSR_VIDEO_CODEC_HEVC_HDR:
+            case GSR_VIDEO_CODEC_HEVC_10BIT: {
+                fprintf(stderr, "gsr warning: selected video codec hevc is not supported, trying h264 instead\n");
+                *video_codec = GSR_VIDEO_CODEC_H264;
+                if(supported_video_codecs.h264.supported)
+                    video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+                break;
+            }
+            case GSR_VIDEO_CODEC_AV1:
+            case GSR_VIDEO_CODEC_AV1_HDR:
+            case GSR_VIDEO_CODEC_AV1_10BIT: {
+                fprintf(stderr, "gsr warning: selected video codec av1 is not supported, trying h264 instead\n");
+                *video_codec = GSR_VIDEO_CODEC_H264;
+                if(supported_video_codecs.h264.supported)
+                    video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+                break;
+            }
+            case GSR_VIDEO_CODEC_VP8:
+            case GSR_VIDEO_CODEC_VP9:
+                // TODO: Cant fallback to other codec because webm only supports vp8/vp9
+                break;
+            case GSR_VIDEO_CODEC_H264_VULKAN: {
+                fprintf(stderr, "gsr warning: selected video codec h264_vulkan is not supported, trying h264 instead\n");
+                *video_codec = GSR_VIDEO_CODEC_H264;
+                // Need to do a query again because this time it's without vulkan
+                if(!get_supported_video_codecs(egl, *video_codec, use_software_video_encoder, true, &supported_video_codecs)) {
+                    fprintf(stderr, "gsr error: failed to query for supported video codecs\n");
+                    _exit(11);
+                }
+                if(supported_video_codecs.h264.supported)
+                    video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+                break;
+            }
+            case GSR_VIDEO_CODEC_HEVC_VULKAN: {
+                fprintf(stderr, "gsr warning: selected video codec hevc_vulkan is not supported, trying hevc instead\n");
+                *video_codec = GSR_VIDEO_CODEC_HEVC;
+                // Need to do a query again because this time it's without vulkan
+                if(!get_supported_video_codecs(egl, *video_codec, use_software_video_encoder, true, &supported_video_codecs)) {
+                    fprintf(stderr, "gsr error: failed to query for supported video codecs\n");
+                    _exit(11);
+                }
+                if(supported_video_codecs.hevc.supported)
+                    video_codec_f = get_ffmpeg_video_codec(*video_codec, egl->gpu_info.vendor);
+                break;
+            }
         }
+    }
+
+    if(!video_codec_f) { // Neither the requested codec nor its fallback produced an encoder: explain and exit with status 2.
+        const char *video_codec_name = video_codec_to_string(*video_codec);
+        fprintf(stderr, "gsr error: your gpu does not support '%s' video codec. If you are sure that your gpu does support '%s' video encoding and you are using an AMD/Intel GPU,\n"
+            "  then make sure you have installed the GPU specific vaapi packages (intel-media-driver, libva-intel-driver, libva-mesa-driver and linux-firmware).\n"
+            "  It's also possible that your distro has disabled hardware accelerated video encoding for '%s' video codec.\n"
+            "  This may be the case on corporate distros such as Manjaro, Fedora or OpenSUSE.\n"
+            "  You can test this by running 'vainfo | grep VAEntrypointEncSlice' to see if it matches any H264/HEVC/AV1/VP8/VP9 profile.\n"
+            "  On such distros, you need to manually install mesa from source to enable H264/HEVC hardware acceleration, or use a more user friendly distro. Alternatively record with AV1 if supported by your GPU.\n"
+            "  You can alternatively use the flatpak version of GPU Screen Recorder (https://flathub.org/apps/com.dec05eba.gpu_screen_recorder) which bypasses system issues with patented H264/HEVC codecs.\n"
+            "  Make sure you have mesa-extra freedesktop runtime installed when using the flatpak (this should be the default), which can be installed with this command:\n"
+            "  flatpak install --system org.freedesktop.Platform.GL.default//23.08-extra\n"
+            "  If your GPU doesn't support hardware accelerated video encoding then you can use '-encoder cpu' option to encode with your cpu instead.\n", video_codec_name, video_codec_name, video_codec_name);
+        _exit(2);
+    }
+
+    *low_power = video_codec_only_supports_low_power_mode(supported_video_codecs, *video_codec); // Uses the final (possibly fallback) codec and the most recent query result.
 
-        glfwWindowHint(GLFW_CONTEXT_VERSION_MAJOR, 4);
-        glfwWindowHint(GLFW_CONTEXT_VERSION_MINOR, 2);
-        glfwWindowHint(GLFW_OPENGL_FORWARD_COMPAT, GL_TRUE);
-        glfwWindowHint(GLFW_OPENGL_PROFILE, GLFW_OPENGL_CORE_PROFILE);
-        glfwWindowHint(GLFW_RESIZABLE, GL_FALSE);
-        glfwWindowHint(GLFW_VISIBLE, GL_FALSE);
+    return video_codec_f;
+}
 
-        window = glfwCreateWindow(1, 1, "gpu-screen-recorder", nullptr, nullptr);
-        if (!window) {
-            fprintf(stderr, "Error: Failed to create glfw window\n");
-            glfwTerminate();
-            return 1;
+static const AVCodec* select_video_codec_with_fallback(gsr_video_codec *video_codec, const char *file_extension, bool use_software_video_encoder, gsr_egl *egl, bool *low_power) { // Applies container-based codec rules to *video_codec, then resolves the encoder via pick_video_codec().
+    const bool video_codec_auto = *video_codec == (gsr_video_codec)GSR_VIDEO_CODEC_AUTO;
+    if(video_codec_auto) { // No explicit codec: vp8 for .webm, h264 for everything else.
+        if(strcmp(file_extension, "webm") == 0) {
+            fprintf(stderr, "gsr info: using vp8 encoder because a codec was not specified and the file extension is .webm\n");
+            *video_codec = GSR_VIDEO_CODEC_VP8;
+        } else {
+            fprintf(stderr, "gsr info: using h264 encoder because a codec was not specified\n");
+            *video_codec = GSR_VIDEO_CODEC_H264;
         }
+    }
 
-        glfwMakeContextCurrent(window);
-        glfwSwapInterval(0);
+    // TODO: Allow hevc, vp9 and av1 in (enhanced) flv (supported since ffmpeg 6.1)
+    const bool is_flv = strcmp(file_extension, "flv") == 0;
+    if(is_flv) {
+        if(*video_codec != GSR_VIDEO_CODEC_H264) { // NOTE(review): any non-h264 codec is replaced here, but the warning text only mentions hevc/av1.
+            *video_codec = GSR_VIDEO_CODEC_H264;
+            fprintf(stderr, "gsr warning: hevc/av1 is not compatible with flv, falling back to h264 instead.\n");
+        }
 
-    //#if defined(DEBUG)
-        XSetErrorHandler(x11_error_handler);
-        XSetIOErrorHandler(x11_io_error_handler);
-    //#endif
+        // if(audio_codec != GSR_AUDIO_CODEC_AAC) {
+        //     audio_codec_to_use = "aac";
+        //     audio_codec = GSR_AUDIO_CODEC_AAC;
+        //     fprintf(stderr, "gsr warning: flv only supports aac, falling back to aac instead.\n");
+        // }
+    }
 
-        glewExperimental = GL_TRUE;
-        GLenum nGlewError = glewInit();
-        if (nGlewError != GLEW_OK) {
-            fprintf(stderr, "%s - Error initializing GLEW! %s\n", __FUNCTION__,
-                    glewGetErrorString(nGlewError));
-            return 1;
+    const bool is_hls = strcmp(file_extension, "m3u8") == 0;
+    if(is_hls) {
+        if(video_codec_is_av1(*video_codec)) {
+            *video_codec = GSR_VIDEO_CODEC_HEVC;
+            fprintf(stderr, "gsr warning: av1 is not compatible with hls (m3u8), falling back to hevc instead.\n");
         }
-        glGetError(); // to clear the error caused deep in GLEW
 
-        if (!recreate_window_pixmap(dpy, src_window_id, window_pixmap)) {
-            fprintf(stderr, "Error: Failed to create glx pixmap for window: %lu\n",
-                    src_window_id);
-            return 1;
+        // if(audio_codec != GSR_AUDIO_CODEC_AAC) {
+        //     audio_codec_to_use = "aac";
+        //     audio_codec = GSR_AUDIO_CODEC_AAC;
+        //     fprintf(stderr, "gsr warning: hls (m3u8) only supports aac, falling back to aac instead.\n");
+        // }
+    }
+
+    if(use_software_video_encoder && *video_codec != GSR_VIDEO_CODEC_H264) { // Checked after the container rules above, so it sees the adjusted codec.
+        fprintf(stderr, "gsr error: \"-encoder cpu\" option is currently only available when using h264 codec option (-k)\n");
+        args_parser_print_usage();
+        _exit(1);
+    }
+
+    return pick_video_codec(video_codec, egl, use_software_video_encoder, video_codec_auto, is_flv, low_power);
+}
+
+static std::vector<AudioDeviceData> create_device_audio_inputs(const std::vector<AudioInput> &audio_inputs, AVCodecContext *audio_codec_context, int num_channels, double num_audio_frames_shift, std::vector<AVFilterContext*> &src_filter_ctx, bool use_amix) { // Builds one AudioDeviceData per entry in audio_inputs; exits the process when a named device can't be opened.
+    std::vector<AudioDeviceData> audio_track_audio_devices;
+    for(size_t i = 0; i < audio_inputs.size(); ++i) {
+        const auto &audio_input = audio_inputs[i];
+        AVFilterContext *src_ctx = nullptr;
+        if(use_amix)
+            src_ctx = src_filter_ctx[i]; // src_filter_ctx is only indexed when use_amix is set; assumes one entry per audio input - TODO confirm with caller.
+
+        AudioDeviceData audio_device;
+        audio_device.audio_input = audio_input;
+        audio_device.src_filter_ctx = src_ctx;
+
+        if(audio_input.name.empty()) { // An unnamed input gets no sound device (null handle, zero frames).
+            audio_device.sound_device.handle = NULL;
+            audio_device.sound_device.frames = 0;
+        } else {
+            const std::string description = "gsr-" + audio_input.name;
+            if(sound_device_get_by_name(&audio_device.sound_device, audio_input.name.c_str(), description.c_str(), num_channels, audio_codec_context->frame_size, audio_codec_context_get_audio_format(audio_codec_context)) != 0) {
+                fprintf(stderr, "gsr error: failed to get \"%s\" audio device\n", audio_input.name.c_str());
+                _exit(1);
+            }
         }
 
-        if(!record_area) {
-            record_width = window_pixmap.texture_width;
-            record_height = window_pixmap.texture_height;
-            fprintf(stderr, "Record size: %dx%d\n", record_width, record_height);
+        audio_device.frame = create_audio_frame(audio_codec_context);
+        audio_device.frame->pts = -audio_codec_context->frame_size * num_audio_frames_shift; // Initial pts is num_audio_frames_shift frames before zero.
+
+        audio_track_audio_devices.push_back(std::move(audio_device));
+    }
+    return audio_track_audio_devices;
+}
+
+#ifdef GSR_APP_AUDIO
+static AudioDeviceData create_application_audio_audio_input(const MergedAudioInputs &merged_audio_inputs, AVCodecContext *audio_codec_context, int num_channels, double num_audio_frames_shift, gsr_pipewire_audio *pipewire_audio) { // Creates a virtual sink, records from its monitor and links the requested devices/apps to it; exits the process on any failure.
+    AudioDeviceData audio_device;
+    audio_device.frame = create_audio_frame(audio_codec_context);
+    audio_device.frame->pts = -audio_codec_context->frame_size * num_audio_frames_shift; // Initial pts is num_audio_frames_shift frames before zero.
+
+    char random_str[8]; // Appended below with an explicit length, so no NUL terminator is needed.
+    if(!generate_random_characters_standard_alphabet(random_str, sizeof(random_str))) {
+        fprintf(stderr, "gsr error: failed to generate random string\n");
+        _exit(1);
+    }
+    std::string combined_sink_name = "gsr-combined-";
+    combined_sink_name.append(random_str, sizeof(random_str));
+
+    if(!gsr_pipewire_audio_create_virtual_sink(pipewire_audio, combined_sink_name.c_str())) {
+        fprintf(stderr, "gsr error: failed to create virtual sink for application audio\n");
+        _exit(1);
+    }
+
+    combined_sink_name += ".monitor"; // From here on the name refers to the sink's ".monitor" source, also in the link calls below.
+
+    if(sound_device_get_by_name(&audio_device.sound_device, combined_sink_name.c_str(), "gpu-screen-recorder", num_channels, audio_codec_context->frame_size, audio_codec_context_get_audio_format(audio_codec_context)) != 0) {
+        fprintf(stderr, "gsr error: failed to setup audio recording to combined sink\n");
+        _exit(1);
+    }
+
+    std::vector<const char*> audio_devices_sources; // Borrowed c_str() pointers into merged_audio_inputs.
+    for(const auto &audio_input : merged_audio_inputs.audio_inputs) {
+        if(audio_input.type == AudioInputType::DEVICE)
+            audio_devices_sources.push_back(audio_input.name.c_str());
+    }
+
+    bool app_audio_inverted = false;
+    std::vector<const char*> app_names; // Borrowed c_str() pointers into merged_audio_inputs.
+    for(const auto &audio_input : merged_audio_inputs.audio_inputs) {
+        if(audio_input.type == AudioInputType::APPLICATION) {
+            app_names.push_back(audio_input.name.c_str());
+            app_audio_inverted = audio_input.inverted; // Takes the value of the last application input in the list.
+        }
+    }
+
+    if(!audio_devices_sources.empty()) {
+        if(!gsr_pipewire_audio_add_link_from_sources_to_sink(pipewire_audio, audio_devices_sources.data(), audio_devices_sources.size(), combined_sink_name.c_str())) {
+            fprintf(stderr, "gsr error: failed to add application audio link\n");
+            _exit(1);
+        }
+    }
+
+    if(app_audio_inverted) {
+        if(!gsr_pipewire_audio_add_link_from_apps_to_sink_inverted(pipewire_audio, app_names.data(), app_names.size(), combined_sink_name.c_str())) {
+            fprintf(stderr, "gsr error: failed to add application audio link\n");
+            _exit(1);
         }
     } else {
-        window_pixmap.texture_id = 0;
-        window_pixmap.target_texture_id = 0;
-        window_pixmap.texture_width = window_width;
-        window_pixmap.texture_height = window_height;
+        if(!gsr_pipewire_audio_add_link_from_apps_to_sink(pipewire_audio, app_names.data(), app_names.size(), combined_sink_name.c_str())) { // Called even when app_names is empty.
+            fprintf(stderr, "gsr error: failed to add application audio link\n");
+            _exit(1);
+        }
+    }
+
+    return audio_device;
+}
+#endif
+
+static bool get_image_format_from_filename(const char *filename, gsr_image_format *image_format) { // Derives the image format from the filename suffix; returns false (leaving *image_format untouched) for any other suffix.
+    if(string_ends_with(filename, ".jpg") || string_ends_with(filename, ".jpeg")) {
+        *image_format = GSR_IMAGE_FORMAT_JPEG;
+        return true;
+    } else if(string_ends_with(filename, ".png")) {
+        *image_format = GSR_IMAGE_FORMAT_PNG;
+        return true;
+    } else {
+        return false;
+    }
+}
+
+// TODO: replace this with start_recording_create_steams
+static bool av_open_file_write_header(AVFormatContext *av_format_context, const char *filename) { // Opens filename for writing on av_format_context->pb and writes the container header; returns true on success.
+    int ret = avio_open(&av_format_context->pb, filename, AVIO_FLAG_WRITE);
+    if(ret < 0) {
+        fprintf(stderr, "gsr error: Could not open '%s': %s\n", filename, av_error_to_string(ret));
+        return false;
+    }
+
+    AVDictionary *options = nullptr;
+    av_dict_set(&options, "strict", "experimental", 0);
+    //av_dict_set_int(&av_format_context->metadata, "video_full_range_flag", 1, 0);
 
-        if (!glfwInit()) {
-            fprintf(stderr, "Error: Failed to initialize glfw\n");
-            return 1;
+    ret = avformat_write_header(av_format_context, &options);
+    if(ret < 0)
+        fprintf(stderr, "Error occurred when writing header to output file: %s\n", av_error_to_string(ret));
+
+    const bool success = ret >= 0;
+    if(!success)
+        avio_closep(&av_format_context->pb); // Close and reset pb to NULL so the context doesn't keep a dangling AVIOContext pointer.
+
+    av_dict_free(&options); // Freed on both the success and the failure path.
+    return success;
+}
+
+// Number of samples in one encoded audio frame for |audio_codec| (AAC: 1024, Opus: 960).
+// FLAC or any other value trips the assert in debug builds and yields 1024 when asserts are compiled out.
+static int audio_codec_get_frame_size(gsr_audio_codec audio_codec) {
+    if(audio_codec == GSR_AUDIO_CODEC_AAC)
+        return 1024;
+    if(audio_codec == GSR_AUDIO_CODEC_OPUS)
+        return 960;
+
+    assert(false);
+    return 1024;
+}
+
+// Estimates how many packets (video frames plus audio frames of every entry in |audio_inputs|) fit in
+// |replay_buffer_size_secs| seconds. Returns 0 when |replay_buffer_size_secs| is -1.
+static size_t calculate_estimated_replay_buffer_packets(int64_t replay_buffer_size_secs, int fps, gsr_audio_codec audio_codec, const std::vector<MergedAudioInputs> &audio_inputs) {
+    if(replay_buffer_size_secs == -1)
+        return 0;
+
+    // Audio frames per second for a single entry; the codec frame size is only queried when there is audio
+    const int audio_frames_per_sec = audio_inputs.empty() ? 0 : AUDIO_SAMPLE_RATE / audio_codec_get_frame_size(audio_codec);
+    return replay_buffer_size_secs * (fps + audio_frames_per_sec * audio_inputs.size());
+}
+
+// Supplies fallback values for DISPLAY (":0") and WAYLAND_DISPLAY ("wayland-1") when they are not set.
+// Variables that already exist in the environment are left as they are.
+static void set_display_server_environment_variables() {
+    // Some users dont have properly setup environments (no display manager that does systemctl --user import-environment DISPLAY WAYLAND_DISPLAY)
+    static const char *const fallbacks[][2] = {
+        { "DISPLAY", ":0" },
+        { "WAYLAND_DISPLAY", "wayland-1" },
+    };
+
+    for(const auto &fallback : fallbacks) {
+        if(!getenv(fallback[0]))
+            setenv(fallback[0], fallback[1], true);
+    }
+}
+
+int main(int argc, char **argv) {
+    setlocale(LC_ALL, "C"); // Sigh... stupid C
+    mallopt(M_MMAP_THRESHOLD, 65536);
+
+    signal(SIGINT, stop_handler);
+    signal(SIGTERM, stop_handler);
+    signal(SIGUSR1, save_replay_handler);
+    signal(SIGUSR2, toggle_pause_handler);
+    signal(SIGRTMIN, toggle_replay_recording_handler);
+    signal(SIGRTMIN+1, save_replay_10_seconds_handler);
+    signal(SIGRTMIN+2, save_replay_30_seconds_handler);
+    signal(SIGRTMIN+3, save_replay_1_minute_handler);
+    signal(SIGRTMIN+4, save_replay_5_minutes_handler);
+    signal(SIGRTMIN+5, save_replay_10_minutes_handler);
+    signal(SIGRTMIN+6, save_replay_30_minutes_handler);
+
+    set_display_server_environment_variables();
+
+    // Stop nvidia driver from buffering frames
+    setenv("__GL_MaxFramesAllowed", "1", true);
+    // If this is set to 1 then cuGraphicsGLRegisterImage will fail for egl context with error: invalid OpenGL or DirectX context,
+    // so we overwrite it
+    setenv("__GL_THREADED_OPTIMIZATIONS", "0", true);
+    // Forces low latency encoding mode. Use this environment variable until vaapi supports setting this as a parameter.
+    // The downside of this is that it always uses maximum power, which is not ideal for replay mode that runs on system startup.
+    // This option was added in mesa 24.1.4, released in july 17, 2024.
+    // TODO: Add an option to enable/disable this?
+    // Seems like the performance issue is not in encoding, but rendering the frame.
+    // Some frames end up taking 10 times longer. Seems to be an issue with amd gpu power management when letting the application sleep on the cpu side?
+    setenv("AMD_DEBUG", "lowlatencyenc", true);
+    // Some people set this to nvidia (for nvdec) or vdpau (for nvidia vdpau), which breaks gpu screen recorder since
+    // nvidia doesn't support vaapi and nvidia-vaapi-driver doesn't support encoding yet.
+    // Let vaapi find the match vaapi driver instead of forcing a specific one.
+    unsetenv("LIBVA_DRIVER_NAME");
+    // Some people set this to force all applications to vsync on nvidia, but this makes eglSwapBuffers never return.
+    unsetenv("__GL_SYNC_TO_VBLANK");
+    // Same as above, but for amd/intel
+    unsetenv("vblank_mode");
+
+    if(geteuid() == 0) {
+        fprintf(stderr, "gsr error: don't run gpu-screen-recorder as the root user\n");
+        _exit(1);
+    }
+
+    args_handlers arg_handlers;
+    arg_handlers.version = version_command;
+    arg_handlers.info = info_command;
+    arg_handlers.list_audio_devices = list_audio_devices_command;
+    arg_handlers.list_application_audio = list_application_audio_command;
+    arg_handlers.list_capture_options = list_capture_options_command;
+
+    args_parser arg_parser;
+    if(!args_parser_parse(&arg_parser, argc, argv, &arg_handlers, NULL))
+        _exit(1);
+
+    //av_log_set_level(AV_LOG_TRACE);
+
+    const Arg *audio_input_arg = args_parser_get_arg(&arg_parser, "-a");
+    assert(audio_input_arg);
+
+    AudioDevices audio_devices;
+    if(audio_input_arg->num_values > 0)
+        audio_devices = get_pulseaudio_inputs();
+
+    std::vector<MergedAudioInputs> requested_audio_inputs = parse_audio_inputs(audio_devices, audio_input_arg);
+
+    const bool uses_app_audio = merged_audio_inputs_has_app_audio(requested_audio_inputs);
+    std::vector<std::string> app_audio_names;
+#ifdef GSR_APP_AUDIO
+    gsr_pipewire_audio pipewire_audio;
+    memset(&pipewire_audio, 0, sizeof(pipewire_audio));
+    if(uses_app_audio) {
+        if(!pulseaudio_server_is_pipewire()) {
+            fprintf(stderr, "gsr error: your sound server is not PipeWire. Application audio is only available when running PipeWire audio server\n");
+            _exit(2);
+        }
+
+        if(!gsr_pipewire_audio_init(&pipewire_audio)) {
+            fprintf(stderr, "gsr error: failed to setup PipeWire audio for application audio capture\n");
+            _exit(2);
         }
+
+        gsr_pipewire_audio_for_each_app(&pipewire_audio, [](const char *app_name, void *userdata) {
+            std::vector<std::string> *app_audio_names = (std::vector<std::string>*)userdata;
+            app_audio_names->push_back(app_name);
+            return true;
+        }, &app_audio_names);
+    }
+#endif
+
+    validate_merged_audio_inputs_app_audio(requested_audio_inputs, app_audio_names);
+
+    const bool is_replaying = arg_parser.replay_buffer_size_secs != -1;
+    const bool is_portal_capture = strcmp(arg_parser.window, "portal") == 0;
+
+    bool wayland = false;
+    Display *dpy = XOpenDisplay(nullptr);
+    if (!dpy) {
+        wayland = true;
+        fprintf(stderr, "gsr warning: failed to connect to the X server. Assuming wayland is running without Xwayland\n");
+    }
+
+    XSetErrorHandler(x11_error_handler);
+    XSetIOErrorHandler(x11_io_error_handler);
+
+    if(!wayland)
+        wayland = is_xwayland(dpy);
+
+    if(!wayland && is_using_prime_run()) {
+        // Disable prime-run and similar options as it doesn't work, the monitor to capture has to be run on the same device.
+        // This is fine on wayland since nvidia uses drm interface there and the monitor query checks the monitors connected
+        // to the drm device.
+        fprintf(stderr, "gsr warning: use of prime-run on X11 is not supported. Disabling prime-run\n");
+        disable_prime_run();
+    }
+
+    gsr_window *window = gsr_window_create(dpy, wayland);
+    if(!window) {
+        fprintf(stderr, "gsr error: failed to create window\n");
+        _exit(1);
+    }
+
+    if(is_portal_capture && is_using_prime_run()) {
+        fprintf(stderr, "gsr warning: use of prime-run with -w portal option is currently not supported. Disabling prime-run\n");
+        disable_prime_run();
+    }
+
+    const bool is_monitor_capture = strcmp(arg_parser.window, "focused") != 0 && strcmp(arg_parser.window, "region") != 0 && !is_portal_capture && contains_non_hex_number(arg_parser.window);
+    gsr_egl egl;
+    if(!gsr_egl_load(&egl, window, is_monitor_capture, arg_parser.gl_debug)) {
+        fprintf(stderr, "gsr error: failed to load opengl\n");
+        _exit(1);
+    }
+
+    gsr_shader_enable_debug_output(arg_parser.gl_debug);
+#ifndef NDEBUG
+    gsr_shader_enable_debug_output(true);
+#endif
+
+    if(!args_parser_validate_with_gl_info(&arg_parser, &egl))
+        _exit(1);
+
+    egl.card_path[0] = '\0';
+    if(monitor_capture_use_drm(window, egl.gpu_info.vendor)) {
+        // TODO: Allow specifying another card, and in other places
+        if(!gsr_get_valid_card_path(&egl, egl.card_path, is_monitor_capture)) {
+            fprintf(stderr, "gsr error: no /dev/dri/cardX device found. Make sure that you have at least one monitor connected or record a single window instead on X11 or record with the -w portal option\n");
+            _exit(2);
+        }
+    }
+
+    // if(wayland && is_monitor_capture) {
+    //     fprintf(stderr, "gsr warning: it's not possible to sync video to recorded monitor exactly on wayland when recording a monitor."
+    //         " If you experience stutter in the video then record with portal capture option instead (-w portal) or use X11 instead\n");
+    // }
+
+    gsr_image_format image_format;
+    if(get_image_format_from_filename(arg_parser.filename, &image_format)) {
+        if(audio_input_arg->num_values > 0) {
+            fprintf(stderr, "gsr error: can't record audio (-a) when taking a screenshot\n");
+            _exit(1);
+        }
+
+        capture_image_to_file(arg_parser, &egl, image_format);
+        _exit(0);
     }
 
-    // Video start
     AVFormatContext *av_format_context;
     // The output format is automatically guessed by the file extension
-    avformat_alloc_output_context2(&av_format_context, nullptr, container_format,
-                                   nullptr);
+    avformat_alloc_output_context2(&av_format_context, nullptr, arg_parser.container_format, arg_parser.filename);
     if (!av_format_context) {
-        fprintf(
-            stderr,
-            "Error: Failed to deduce output format from file extension\n");
-        return 1;
+        if(arg_parser.container_format) {
+            fprintf(stderr, "gsr error: Container format '%s' (argument -c) is not valid\n", arg_parser.container_format);
+        } else {
+            fprintf(stderr, "gsr error: Failed to deduce container format from file extension. Use the '-c' option to specify container format\n");
+            args_parser_print_usage();
+            _exit(1);
+        }
+        _exit(1);
     }
 
-    av_format_context->flags |= AVFMT_FLAG_GENPTS;
     const AVOutputFormat *output_format = av_format_context->oformat;
 
-    //bool use_hevc = strcmp(window_str, "screen") == 0 || strcmp(window_str, "screen-direct") == 0;
-    bool use_hevc = true;
-    if(use_hevc && strcmp(container_format, "flv") == 0) {
-        use_hevc = false;
-        fprintf(stderr, "Warning: hevc is not compatible with flv, falling back to h264 instead.\n");
+    std::string file_extension = output_format->extensions ? output_format->extensions : "";
+    {
+        size_t comma_index = file_extension.find(',');
+        if(comma_index != std::string::npos)
+            file_extension = file_extension.substr(0, comma_index);
+    }
+
+    const bool force_no_audio_offset = arg_parser.is_livestream || arg_parser.is_output_piped || (file_extension != "mp4" && file_extension != "mkv" && file_extension != "webm");
+    const double target_fps = 1.0 / (double)arg_parser.fps;
+
+    const bool uses_amix = merged_audio_inputs_should_use_amix(requested_audio_inputs);
+    arg_parser.audio_codec = select_audio_codec_with_fallback(arg_parser.audio_codec, file_extension, uses_amix);
+    bool low_power = false;
+    const AVCodec *video_codec_f = select_video_codec_with_fallback(&arg_parser.video_codec, file_extension.c_str(), arg_parser.video_encoder == GSR_VIDEO_ENCODER_HW_CPU, &egl, &low_power);
+
+    gsr_capture *capture = create_capture_impl(arg_parser, &egl, false);
+
+    // (Some?) livestreaming services require at least one audio track to work.
+    // If not audio is provided then create one silent audio track.
+    if(arg_parser.is_livestream && requested_audio_inputs.empty()) {
+        fprintf(stderr, "gsr info: live streaming but no audio track was added. Adding a silent audio track\n");
+        MergedAudioInputs mai;
+        mai.audio_inputs.push_back({""});
+        requested_audio_inputs.push_back(std::move(mai));
     }
 
     AVStream *video_stream = nullptr;
-    AVStream *audio_stream = nullptr;
+    std::vector<AudioTrack> audio_tracks;
 
-    AVCodecContext *video_codec_context = create_video_codec_context(av_format_context, quality, record_width, record_height, fps, use_hevc);
-    if(replay_buffer_size_secs == -1)
+    const enum AVPixelFormat video_pix_fmt = get_pixel_format(arg_parser.video_codec, egl.gpu_info.vendor, arg_parser.video_encoder == GSR_VIDEO_ENCODER_HW_CPU);
+    AVCodecContext *video_codec_context = create_video_codec_context(video_pix_fmt, video_codec_f, egl, arg_parser);
+    if(!is_replaying)
         video_stream = create_stream(av_format_context, video_codec_context);
 
-    AVBufferRef *device_ctx;
-    CUgraphicsResource cuda_graphics_resource;
-    open_video(video_codec_context, window_pixmap, &device_ctx, &cuda_graphics_resource, cu_ctx);
-    if(video_stream)
-        avcodec_parameters_from_context(video_stream->codecpar, video_codec_context);
+    if(arg_parser.tune == GSR_TUNE_QUALITY)
+        video_codec_context->max_b_frames = 2;
 
-    AVCodecContext *audio_codec_context = nullptr;
-    AVFrame *audio_frame = nullptr;
-    if(audio_input_arg.value) {
-        audio_codec_context = create_audio_codec_context(av_format_context, fps);
-        if(replay_buffer_size_secs == -1)
-            audio_stream = create_stream(av_format_context, audio_codec_context);
+    AVFrame *video_frame = av_frame_alloc();
+    if(!video_frame) {
+        fprintf(stderr, "gsr error: Failed to allocate video frame\n");
+        _exit(1);
+    }
+    video_frame->format = video_codec_context->pix_fmt;
+    video_frame->width = 0;
+    video_frame->height = 0;
+    video_frame->color_range = video_codec_context->color_range;
+    video_frame->color_primaries = video_codec_context->color_primaries;
+    video_frame->color_trc = video_codec_context->color_trc;
+    video_frame->colorspace = video_codec_context->colorspace;
+    video_frame->chroma_location = video_codec_context->chroma_sample_location;
+
+    gsr_capture_metadata capture_metadata;
+    capture_metadata.width = 0;
+    capture_metadata.height = 0;
+    capture_metadata.fps = arg_parser.fps;
+    capture_metadata.video_codec_context = video_codec_context;
+    capture_metadata.frame = video_frame;
+
+    int capture_result = gsr_capture_start(capture, &capture_metadata);
+    if(capture_result != 0) {
+        fprintf(stderr, "gsr error: gsr_capture_start failed\n");
+        _exit(capture_result);
+    }
 
-        audio_frame = open_audio(audio_codec_context);
-        if(audio_stream)
-            avcodec_parameters_from_context(audio_stream->codecpar, audio_codec_context);
+    video_codec_context->width = capture_metadata.width;
+    video_codec_context->height = capture_metadata.height;
+    video_frame->width = capture_metadata.width;
+    video_frame->height = capture_metadata.height;
+
+    const size_t estimated_replay_buffer_packets = calculate_estimated_replay_buffer_packets(arg_parser.replay_buffer_size_secs, arg_parser.fps, arg_parser.audio_codec, requested_audio_inputs);
+    gsr_encoder encoder;
+    if(!gsr_encoder_init(&encoder, arg_parser.replay_storage, estimated_replay_buffer_packets, arg_parser.replay_buffer_size_secs, arg_parser.filename)) {
+        fprintf(stderr, "gsr error: failed to create encoder\n");
+        _exit(1);
     }
 
-    //av_dump_format(av_format_context, 0, filename, 1);
+    gsr_video_encoder *video_encoder = create_video_encoder(&egl, arg_parser);
+    if(!video_encoder) {
+        fprintf(stderr, "gsr error: failed to create video encoder\n");
+        _exit(1);
+    }
 
-    if (replay_buffer_size_secs == -1 && !(output_format->flags & AVFMT_NOFILE)) {
-        int ret = avio_open(&av_format_context->pb, filename, AVIO_FLAG_WRITE);
-        if (ret < 0) {
-            fprintf(stderr, "Error: Could not open '%s': %s\n", filename, av_error_to_string(ret));
-            return 1;
-        }
+    if(!gsr_video_encoder_start(video_encoder, video_codec_context, video_frame)) {
+        fprintf(stderr, "gsr error: failed to start video encoder\n");
+        _exit(1);
     }
 
-    //video_stream->duration = AV_TIME_BASE * 15;
-    //audio_stream->duration = AV_TIME_BASE * 15;
-    //av_format_context->duration = AV_TIME_BASE * 15;
-    if(replay_buffer_size_secs == -1) {
-        int ret = avformat_write_header(av_format_context, nullptr);
-        if (ret < 0) {
-            fprintf(stderr, "Error occurred when writing header to output file: %s\n", av_error_to_string(ret));
-            return 1;
-        }
+    capture_metadata.width = video_codec_context->width;
+    capture_metadata.height = video_codec_context->height;
+
+    gsr_color_conversion_params color_conversion_params;
+    memset(&color_conversion_params, 0, sizeof(color_conversion_params));
+    color_conversion_params.color_range = arg_parser.color_range;
+    color_conversion_params.egl = &egl;
+    color_conversion_params.load_external_image_shader = gsr_capture_uses_external_image(capture);
+    gsr_video_encoder_get_textures(video_encoder, color_conversion_params.destination_textures, &color_conversion_params.num_destination_textures, &color_conversion_params.destination_color);
+
+    gsr_color_conversion color_conversion;
+    if(gsr_color_conversion_init(&color_conversion, &color_conversion_params) != 0) {
+        fprintf(stderr, "gsr error: main: failed to create color conversion\n");
+        _exit(1);
     }
 
-    // av_frame_free(&rgb_frame);
-    // avcodec_close(av_codec_context);
+    gsr_color_conversion_clear(&color_conversion);
 
-    if(dpy)
-        XSelectInput(dpy, src_window_id, StructureNotifyMask | VisibilityChangeMask);
+    if(arg_parser.video_encoder == GSR_VIDEO_ENCODER_HW_CPU) {
+        open_video_software(video_codec_context, arg_parser);
+    } else {
+        open_video_hardware(video_codec_context, low_power, egl, arg_parser);
+    }
 
-    /*
-    int damage_event;
-    int damage_error;
-    if (!XDamageQueryExtension(dpy, &damage_event, &damage_error)) {
-        fprintf(stderr, "Error: XDamage is not supported by your X11 server\n");
-        return 1;
+    if(video_stream) {
+        avcodec_parameters_from_context(video_stream->codecpar, video_codec_context);
+        gsr_encoder_add_recording_destination(&encoder, video_codec_context, av_format_context, video_stream, 0);
     }
 
-    Damage damage = XDamageCreate(dpy, src_window_id, XDamageReportNonEmpty);
-    XDamageSubtract(dpy, damage,None,None);
-    */
+    int audio_max_frame_size = 1024;
+    int audio_stream_index = VIDEO_STREAM_INDEX + 1;
+    for(const MergedAudioInputs &merged_audio_inputs : requested_audio_inputs) {
+        const bool use_amix = audio_inputs_should_use_amix(merged_audio_inputs.audio_inputs);
+        AVCodecContext *audio_codec_context = create_audio_codec_context(arg_parser.fps, arg_parser.audio_codec, use_amix, arg_parser.audio_bitrate);
 
-    const double start_time_pts = clock_get_monotonic_seconds();
+        AVStream *audio_stream = nullptr;
+        if(!is_replaying) {
+            audio_stream = create_stream(av_format_context, audio_codec_context);
+            if(gsr_encoder_add_recording_destination(&encoder, audio_codec_context, av_format_context, audio_stream, 0) == (size_t)-1)
+                fprintf(stderr, "gsr error: added too many audio sources\n");
+        }
 
-    CUcontext old_ctx;
-    CUarray mapped_array;
-    if(src_window_id) {
-        res = cuCtxPopCurrent(&old_ctx);
-        res = cuCtxPushCurrent(cu_ctx);
+        if(audio_stream && !merged_audio_inputs.track_name.empty())
+            av_dict_set(&audio_stream->metadata, "title", merged_audio_inputs.track_name.c_str(), 0);
 
-        // Get texture
-        res = cuGraphicsResourceSetMapFlags(
-            cuda_graphics_resource, CU_GRAPHICS_MAP_RESOURCE_FLAGS_READ_ONLY);
-        res = cuGraphicsMapResources(1, &cuda_graphics_resource, 0);
+        open_audio(audio_codec_context);
+        if(audio_stream)
+            avcodec_parameters_from_context(audio_stream->codecpar, audio_codec_context);
 
-        // Map texture to cuda array
-        res = cuGraphicsSubResourceGetMappedArray(&mapped_array,
-                                                cuda_graphics_resource, 0, 0);
-    }
+        #if LIBAVCODEC_VERSION_MAJOR < 60
+        const int num_channels = audio_codec_context->channels;
+        #else
+        const int num_channels = audio_codec_context->ch_layout.nb_channels;
+        #endif
+
+        //audio_frame->sample_rate = audio_codec_context->sample_rate;
+
+        std::vector<AVFilterContext*> src_filter_ctx;
+        AVFilterGraph *graph = nullptr;
+        AVFilterContext *sink = nullptr;
+        if(use_amix) {
+            int err = init_filter_graph(audio_codec_context, &graph, &sink, src_filter_ctx, merged_audio_inputs.audio_inputs.size());
+            if(err < 0) {
+                fprintf(stderr, "gsr error: failed to create audio filter\n");
+                _exit(1);
+            }
+        }
 
-    // Release texture
-    // res = cuGraphicsUnmapResources(1, &cuda_graphics_resource, 0);
+        // TODO: Cleanup above
 
-    double start_time = glfwGetTime();
-    double frame_timer_start = start_time;
-    double window_resize_timer = start_time;
-    bool window_resized = false;
-    int fps_counter = 0;
-    int current_fps = 30;
+        const double audio_fps = (double)audio_codec_context->sample_rate / (double)audio_codec_context->frame_size;
+        const double timeout_sec = 1000.0 / audio_fps / 1000.0;
 
-    AVFrame *frame = av_frame_alloc();
-    if (!frame) {
-        fprintf(stderr, "Error: Failed to allocate frame\n");
-        exit(1);
+        const double audio_startup_time_seconds = force_no_audio_offset ? 0 : audio_codec_get_desired_delay(arg_parser.audio_codec, arg_parser.fps);// * ((double)audio_codec_context->frame_size / 1024.0);
+        const double num_audio_frames_shift = audio_startup_time_seconds / timeout_sec;
+
+        std::vector<AudioDeviceData> audio_track_audio_devices;
+        if(audio_inputs_has_app_audio(merged_audio_inputs.audio_inputs)) {
+            assert(!use_amix);
+#ifdef GSR_APP_AUDIO
+            audio_track_audio_devices.push_back(create_application_audio_audio_input(merged_audio_inputs, audio_codec_context, num_channels, num_audio_frames_shift, &pipewire_audio));
+#endif
+        } else {
+            audio_track_audio_devices = create_device_audio_inputs(merged_audio_inputs.audio_inputs, audio_codec_context, num_channels, num_audio_frames_shift, src_filter_ctx, use_amix);
+        }
+
+        AudioTrack audio_track;
+        audio_track.name = merged_audio_inputs.track_name;
+        audio_track.codec_context = audio_codec_context;
+        audio_track.audio_devices = std::move(audio_track_audio_devices);
+        audio_track.graph = graph;
+        audio_track.sink = sink;
+        audio_track.stream_index = audio_stream_index;
+        audio_track.pts = -audio_codec_context->frame_size * num_audio_frames_shift;
+        audio_tracks.push_back(std::move(audio_track));
+        ++audio_stream_index;
+
+        audio_max_frame_size = std::max(audio_max_frame_size, audio_codec_context->frame_size);
     }
-    frame->format = video_codec_context->pix_fmt;
-    frame->width = video_codec_context->width;
-    frame->height = video_codec_context->height;
 
-    if (av_hwframe_get_buffer(video_codec_context->hw_frames_ctx, frame, 0) < 0) {
-        fprintf(stderr, "Error: av_hwframe_get_buffer failed\n");
-        exit(1);
+    //av_dump_format(av_format_context, 0, filename, 1);
+
+    if(!is_replaying) {
+        if(!av_open_file_write_header(av_format_context, arg_parser.filename))
+            _exit(1);
     }
 
-    if(window_pixmap.texture_width < record_width)
-        frame->width = window_pixmap.texture_width & ~1;
-    else
-        frame->width = record_width & ~1;
+    double fps_start_time = clock_get_monotonic_seconds();
+    //double frame_timer_start = fps_start_time;
+    int fps_counter = 0;
+    int damage_fps_counter = 0;
+
+    bool paused = false;
+    std::atomic<double> paused_time_offset(0.0);
+    double paused_time_start = 0.0;
+    bool replay_recording = false;
+    RecordingStartResult replay_recording_start_result;
+    std::vector<size_t> replay_recording_items;
+    std::string replay_recording_filepath;
+    bool force_iframe_frame = false; // Only needed for video since audio frames are always iframes
+
+    std::mutex audio_filter_mutex;
+
+    const double record_start_time = clock_get_monotonic_seconds();
+
+    const size_t audio_buffer_size = audio_max_frame_size * 4 * 2; // max 4 bytes/sample, 2 channels
+    uint8_t *empty_audio = (uint8_t*)malloc(audio_buffer_size);
+    if(!empty_audio) {
+        fprintf(stderr, "gsr error: failed to create empty audio\n");
+        _exit(1);
+    }
+    memset(empty_audio, 0, audio_buffer_size);
+
+    for(AudioTrack &audio_track : audio_tracks) {
+        for(AudioDeviceData &audio_device : audio_track.audio_devices) {
+            audio_device.thread = std::thread([&]() mutable {
+                const AVSampleFormat sound_device_sample_format = audio_format_to_sample_format(audio_codec_context_get_audio_format(audio_track.codec_context));
+                // TODO: Always do conversion for now. This fixes issue with stuttering audio on pulseaudio with opus + multiple audio sources merged
+                const bool needs_audio_conversion = true;//audio_track.codec_context->sample_fmt != sound_device_sample_format;
+                SwrContext *swr = nullptr;
+                if(needs_audio_conversion) {
+                    swr = swr_alloc();
+                    if(!swr) {
+                        fprintf(stderr, "Failed to create SwrContext\n");
+                        _exit(1);
+                    }
+                    #if LIBAVUTIL_VERSION_MAJOR <= 56
+                    av_opt_set_channel_layout(swr, "in_channel_layout", AV_CH_LAYOUT_STEREO, 0);
+                    av_opt_set_channel_layout(swr, "out_channel_layout", AV_CH_LAYOUT_STEREO, 0);
+                    #elif LIBAVUTIL_VERSION_MAJOR >= 59
+                    av_opt_set_chlayout(swr, "in_chlayout", &audio_track.codec_context->ch_layout, 0);
+                    av_opt_set_chlayout(swr, "out_chlayout", &audio_track.codec_context->ch_layout, 0);
+                    #else
+                    av_opt_set_chlayout(swr, "in_channel_layout", &audio_track.codec_context->ch_layout, 0);
+                    av_opt_set_chlayout(swr, "out_channel_layout", &audio_track.codec_context->ch_layout, 0);
+                    #endif
+                    av_opt_set_int(swr, "in_sample_rate", audio_track.codec_context->sample_rate, 0);
+                    av_opt_set_int(swr, "out_sample_rate", audio_track.codec_context->sample_rate, 0);
+                    av_opt_set_sample_fmt(swr, "in_sample_fmt", sound_device_sample_format, 0);
+                    av_opt_set_sample_fmt(swr, "out_sample_fmt", audio_track.codec_context->sample_fmt, 0);
+                    swr_init(swr);
+                }
 
-    if(window_pixmap.texture_height < record_height)
-        frame->height = window_pixmap.texture_height & ~1;
-    else
-        frame->height = record_height & ~1;
+                const double audio_fps = (double)audio_track.codec_context->sample_rate / (double)audio_track.codec_context->frame_size;
+                const int64_t timeout_ms = std::round(1000.0 / audio_fps);
+                const double timeout_sec = 1000.0 / audio_fps / 1000.0;
+                bool first_frame = true;
+                int64_t num_received_frames = 0;
+
+                while(running) {
+                    void *sound_buffer;
+                    int sound_buffer_size = -1;
+                    //const double time_before_read_seconds = clock_get_monotonic_seconds();
+                    if(audio_device.sound_device.handle) {
+                        // TODO: use this instead of calculating time to read. But this can fluctuate and we dont want to go back in time,
+                        // also it's 0.0 for some users???
+                        double latency_seconds = 0.0;
+                        sound_buffer_size = sound_device_read_next_chunk(&audio_device.sound_device, &sound_buffer, timeout_sec * 2.0, &latency_seconds);
+                    }
 
-    std::mutex write_output_mutex;
-    std::thread audio_thread;
+                    const bool got_audio_data = sound_buffer_size >= 0;
+                    //fprintf(stderr, "got audio data: %s\n", got_audio_data ? "yes" : "no");
+                    //const double time_after_read_seconds = clock_get_monotonic_seconds();
+                    //const double time_to_read_seconds = time_after_read_seconds - time_before_read_seconds;
+                    //fprintf(stderr, "time to read: %f, %s, %f\n", time_to_read_seconds, got_audio_data ? "yes" : "no", timeout_sec);
+                    const double this_audio_frame_time = clock_get_monotonic_seconds() - paused_time_offset;
 
-    double record_start_time = glfwGetTime();
-    std::deque<AVPacket> frame_data_queue;
-    bool frames_erased = false;
+                    if(paused) {
+                        if(!audio_device.sound_device.handle)
+                            av_usleep(timeout_ms * 1000);
 
-    SoundDevice sound_device;
-    uint8_t *audio_frame_buf;
-    if(audio_input_arg.value) {
-        if(sound_device_get_by_name(&sound_device, audio_input_arg.value, audio_codec_context->channels, audio_codec_context->frame_size) != 0) {
-            fprintf(stderr, "failed to get 'pulse' sound device\n");
-            exit(1);
-        }
-
-        int audio_buffer_size = av_samples_get_buffer_size(NULL, audio_codec_context->channels, audio_codec_context->frame_size, audio_codec_context->sample_fmt, 1);
-        audio_frame_buf = (uint8_t *)av_malloc(audio_buffer_size);
-        avcodec_fill_audio_frame(audio_frame, audio_codec_context->channels, audio_codec_context->sample_fmt, (const uint8_t*)audio_frame_buf, audio_buffer_size, 1);
-
-        audio_thread = std::thread([record_start_time, replay_buffer_size_secs, &frame_data_queue, &frames_erased, audio_codec_context, start_time_pts, fps](AVFormatContext *av_format_context, AVStream *audio_stream, uint8_t *audio_frame_buf, SoundDevice *sound_device, AVFrame *audio_frame, std::mutex *write_output_mutex) mutable {
-            
-            SwrContext *swr = swr_alloc();
-            if(!swr) {
-                fprintf(stderr, "Failed to create SwrContext\n");
-                exit(1);
-            }
-            av_opt_set_int(swr, "in_channel_layout", audio_codec_context->channel_layout, 0);
-            av_opt_set_int(swr, "out_channel_layout", audio_codec_context->channel_layout, 0);
-            av_opt_set_int(swr, "in_sample_rate", audio_codec_context->sample_rate, 0);
-            av_opt_set_int(swr, "out_sample_rate", audio_codec_context->sample_rate, 0);
-            av_opt_set_sample_fmt(swr, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
-            av_opt_set_sample_fmt(swr, "out_sample_fmt", AV_SAMPLE_FMT_FLTP, 0);
-            swr_init(swr);
+                        continue;
+                    }
 
-            while(running) {
-                void *sound_buffer;
-                int sound_buffer_size = sound_device_read_next_chunk(sound_device, &sound_buffer);
-                if(sound_buffer_size >= 0) {
-                    // TODO: Instead of converting audio, get float audio from alsa. Or does alsa do conversion internally to get this format?
-                    swr_convert(swr, &audio_frame_buf, audio_frame->nb_samples, (const uint8_t**)&sound_buffer, sound_buffer_size);
-                    audio_frame->extended_data = &audio_frame_buf;
-                    audio_frame->pts = (clock_get_monotonic_seconds() - start_time_pts) * AV_TIME_BASE;
-
-                    int ret = avcodec_send_frame(audio_codec_context, audio_frame);
-                    if(ret < 0){
-                        fprintf(stderr, "Failed to encode!\n");
+                    int ret = av_frame_make_writable(audio_device.frame);
+                    if (ret < 0) {
+                        fprintf(stderr, "Failed to make audio frame writable\n");
                         break;
                     }
-                    if(ret >= 0)
-                        receive_frames(audio_codec_context, AUDIO_STREAM_INDEX, audio_stream, audio_frame, av_format_context, record_start_time, frame_data_queue, replay_buffer_size_secs, frames_erased, *write_output_mutex);
-                } else {
-                    fprintf(stderr, "failed to read sound from device, error: %d\n", sound_buffer_size);
-                }
-            }
 
-            swr_free(&swr);
-        }, av_format_context, audio_stream, audio_frame_buf, &sound_device, audio_frame, &write_output_mutex);
-    }
+                    // TODO: Is this |received_audio_time| really correct?
+                    const int64_t num_expected_frames = std::floor((this_audio_frame_time - record_start_time) / timeout_sec);
+                    int64_t num_missing_frames = std::max((int64_t)0LL, num_expected_frames - num_received_frames);
+
+                    if(got_audio_data)
+                        num_missing_frames = std::max((int64_t)0LL, num_missing_frames - 1);
+
+                    if(!audio_device.sound_device.handle)
+                        num_missing_frames = std::max((int64_t)1, num_missing_frames);
+
+                    // Fucking hell is there a better way to do this? I JUST WANT TO KEEP VIDEO AND AUDIO SYNCED HOLY FUCK I WANT TO KILL MYSELF NOW.
+                    // THIS PIECE OF SHIT WANTS EMPTY FRAMES OTHERWISE VIDEO PLAYS TOO FAST TO KEEP UP WITH AUDIO OR THE AUDIO PLAYS TOO EARLY.
+                    // BUT WE CANT USE DELAYS TO GIVE DUMMY DATA BECAUSE PULSEAUDIO MIGHT GIVE AUDIO A BIT DELAYED!!!
+                    // This garbage is needed because we want to produce constant frame rate videos instead of variable frame rate
+                    // videos because bad software such as video editing software and VLC do not support variable frame rate videos,
+                    // despite nvidia shadowplay and xbox game bar producing variable frame rate videos.
+                    // So we have to make sure we produce frames at the same relative rate as the video.
+                    if((num_missing_frames >= 1 && got_audio_data) || num_missing_frames >= 5 || !audio_device.sound_device.handle) {
+                        // TODO:
+                        //audio_track.frame->data[0] = empty_audio;
+                        if(first_frame || num_missing_frames >= 5) {
+                            if(needs_audio_conversion)
+                                swr_convert(swr, &audio_device.frame->data[0], audio_track.codec_context->frame_size, (const uint8_t**)&empty_audio, audio_track.codec_context->frame_size);
+                            else
+                                audio_device.frame->data[0] = empty_audio;
+                        }
+                        first_frame = false;
+
+                        // TODO: Check if duplicate frame can be saved just by writing it with a different pts instead of sending it again
+                        std::lock_guard<std::mutex> lock(audio_filter_mutex);
+                        for(int i = 0; i < num_missing_frames; ++i) {
+                            if(audio_track.graph) {
+                                // TODO: av_buffersrc_add_frame
+                                if(av_buffersrc_write_frame(audio_device.src_filter_ctx, audio_device.frame) < 0) {
+                                    fprintf(stderr, "gsr error: failed to add audio frame to filter\n");
+                                }
+                            } else {
+                                ret = avcodec_send_frame(audio_track.codec_context, audio_device.frame);
+                                if(ret >= 0) {
+                                    // TODO: Move to separate thread because this could write to network (for example when livestreaming)
+                                    gsr_encoder_receive_packets(&encoder, audio_track.codec_context, audio_device.frame->pts, audio_track.stream_index);
+                                } else {
+                                    fprintf(stderr, "Failed to encode audio!\n");
+                                }
+                                audio_track.pts += audio_track.codec_context->frame_size;
+                            }
+
+                            audio_device.frame->pts += audio_track.codec_context->frame_size;
+                            num_received_frames++;
+                        }
+                    }
 
-    handle_new_pid_file(replay_buffer_size_secs == -1 ? "record" : "replay");
-    started = 1;
+                    if(!audio_device.sound_device.handle)
+                        av_usleep(timeout_ms * 1000);
+
+                    if(got_audio_data) {
+                        // TODO: Instead of converting audio, get float audio from alsa. Or does alsa do conversion internally to get this format?
+                        if(needs_audio_conversion)
+                            swr_convert(swr, &audio_device.frame->data[0], audio_track.codec_context->frame_size, (const uint8_t**)&sound_buffer, audio_track.codec_context->frame_size);
+                        else
+                            audio_device.frame->data[0] = (uint8_t*)sound_buffer;
+                        first_frame = false;
+
+                        std::lock_guard<std::mutex> lock(audio_filter_mutex);
+
+                        if(audio_track.graph) {
+                            // TODO: av_buffersrc_add_frame
+                            if(av_buffersrc_write_frame(audio_device.src_filter_ctx, audio_device.frame) < 0) {
+                                fprintf(stderr, "gsr error: failed to add audio frame to filter\n");
+                            }
+                        } else {
+                            ret = avcodec_send_frame(audio_track.codec_context, audio_device.frame);
+                            if(ret >= 0) {
+                                // TODO: Move to separate thread because this could write to network (for example when livestreaming)
+                                gsr_encoder_receive_packets(&encoder, audio_track.codec_context, audio_device.frame->pts, audio_track.stream_index);
+                            } else {
+                                fprintf(stderr, "Failed to encode audio!\n");
+                            }
+                            audio_track.pts += audio_track.codec_context->frame_size;
+                        }
 
-    bool redraw = true;
-    XEvent e;
-    while (running) {
-        double frame_start = glfwGetTime();
-        glfwPollEvents();
-        if(window)
-            glClear(GL_COLOR_BUFFER_BIT);
+                        audio_device.frame->pts += audio_track.codec_context->frame_size;
+                        num_received_frames++;
+                    }
+                }
 
-        redraw = true;
+                if(swr)
+                    swr_free(&swr);
+            });
+        }
+    }
 
-        if(src_window_id) {
-            if (XCheckTypedWindowEvent(dpy, src_window_id, DestroyNotify, &e)) {
-                running = 0;
+    std::thread amix_thread;
+    if(uses_amix) {
+        amix_thread = std::thread([&]() {
+            AVFrame *aframe = av_frame_alloc();
+            while(running) {
+                {
+                    std::lock_guard<std::mutex> lock(audio_filter_mutex);
+                    for(AudioTrack &audio_track : audio_tracks) {
+                        if(!audio_track.sink)
+                            continue;
+
+                        int err = 0;
+                        while ((err = av_buffersink_get_frame(audio_track.sink, aframe)) >= 0) {
+                            aframe->pts = audio_track.pts;
+                            err = avcodec_send_frame(audio_track.codec_context, aframe);
+                            if(err >= 0){
+                                // TODO: Move to separate thread because this could write to network (for example when livestreaming)
+                                gsr_encoder_receive_packets(&encoder, audio_track.codec_context, aframe->pts, audio_track.stream_index);
+                            } else {
+                                fprintf(stderr, "Failed to encode audio!\n");
+                            }
+                            av_frame_unref(aframe);
+                            audio_track.pts += audio_track.codec_context->frame_size;
+                        }
+                    }
+                }
+                av_usleep(5 * 1000); // 5 milliseconds
             }
+            av_frame_free(&aframe);
+        });
+    }
 
-            if (XCheckTypedWindowEvent(dpy, src_window_id, VisibilityNotify, &e)) {
-                window_resize_timer = glfwGetTime();
-                window_resized = true;
-            }
+    // Set update_fps to 24 to test if duplicate/delayed frames cause video/audio desync or too fast/slow video.
+    //const double update_fps = fps + 190;
+    bool should_stop_error = false;
 
-            if (XCheckTypedWindowEvent(dpy, src_window_id, ConfigureNotify, &e) && e.xconfigure.window == src_window_id) {
-                // Window resize
-                if(e.xconfigure.width != window_width || e.xconfigure.height != window_height) {
-                    window_width = e.xconfigure.width;
-                    window_height = e.xconfigure.height;
-                    window_resize_timer = glfwGetTime();
-                    window_resized = true;
-                }
-            }
+    int64_t video_pts_counter = 0;
+    int64_t video_prev_pts = 0;
 
-            const double window_resize_timeout = 1.0; // 1 second
-            if(window_resized && glfwGetTime() - window_resize_timer >= window_resize_timeout) {
-                window_resized = false;
-                fprintf(stderr, "Resize window!\n");
-                recreate_window_pixmap(dpy, src_window_id, window_pixmap);
-                // Resolution must be a multiple of two
-                //video_stream->codec->width = window_pixmap.texture_width & ~1;
-                //video_stream->codec->height = window_pixmap.texture_height & ~1;
-
-                cuGraphicsUnregisterResource(cuda_graphics_resource);
-                res = cuGraphicsGLRegisterImage(
-                    &cuda_graphics_resource, window_pixmap.target_texture_id, GL_TEXTURE_2D,
-                    CU_GRAPHICS_REGISTER_FLAGS_READ_ONLY);
-                if (res != CUDA_SUCCESS) {
-                    const char *err_str;
-                    cuGetErrorString(res, &err_str);
-                    fprintf(stderr,
-                            "Error: cuGraphicsGLRegisterImage failed, error %s, texture "
-                            "id: %u\n",
-                            err_str, window_pixmap.target_texture_id);
-                    running = false;
-                    break;
-                }
+    bool hdr_metadata_set = false;
+    const bool hdr = video_codec_is_hdr(arg_parser.video_codec);
 
-                res = cuGraphicsResourceSetMapFlags(
-                    cuda_graphics_resource, CU_GRAPHICS_MAP_RESOURCE_FLAGS_READ_ONLY);
-                res = cuGraphicsMapResources(1, &cuda_graphics_resource, 0);
-                res = cuGraphicsSubResourceGetMappedArray(&mapped_array, cuda_graphics_resource, 0, 0);
+    double damage_timeout_seconds = arg_parser.framerate_mode == GSR_FRAMERATE_MODE_CONTENT ? 0.5 : 0.1;
+    damage_timeout_seconds = std::max(damage_timeout_seconds, target_fps);
 
-                av_frame_free(&frame);
-                frame = av_frame_alloc();
-                if (!frame) {
-                    fprintf(stderr, "Error: Failed to allocate frame\n");
-                    running = false;
-                    break;
-                }
-                frame->format = video_codec_context->pix_fmt;
-                frame->width = video_codec_context->width;
-                frame->height = video_codec_context->height;
+    bool use_damage_tracking = false;
+    gsr_damage damage;
+    memset(&damage, 0, sizeof(damage));
+    if(gsr_window_get_display_server(window) == GSR_DISPLAY_SERVER_X11) {
+        gsr_damage_init(&damage, &egl, arg_parser.record_cursor);
+        use_damage_tracking = true;
+    }
 
-                if (av_hwframe_get_buffer(video_codec_context->hw_frames_ctx, frame, 0) < 0) {
-                    fprintf(stderr, "Error: av_hwframe_get_buffer failed\n");
-                    running = false;
-                    break;
-                }
+    if(is_monitor_capture)
+        gsr_damage_set_target_monitor(&damage, arg_parser.window);
 
-                if(window_pixmap.texture_width < record_width)
-                    frame->width = window_pixmap.texture_width & ~1;
-                else
-                    frame->width = record_width & ~1;
+    while(running) {
+        while(gsr_window_process_event(window)) {
+            gsr_damage_on_event(&damage, gsr_window_get_event_data(window));
+            gsr_capture_on_event(capture, &egl);
+        }
+        gsr_damage_tick(&damage);
+        gsr_capture_tick(capture);
 
-                if(window_pixmap.texture_height < record_height)
-                    frame->height = window_pixmap.texture_height & ~1;
-                else
-                    frame->height = record_height & ~1;
+        if(!is_monitor_capture) {
+            Window damage_target_window = 0;
+            if(capture->get_window_id)
+                damage_target_window = capture->get_window_id(capture);
 
-                cuMemsetD8((CUdeviceptr)frame->data[0], 0, record_width * record_height * 4);
-            }
+            if(damage_target_window != 0)
+                gsr_damage_set_target_window(&damage, damage_target_window);
         }
 
-        ++fps_counter;
+        should_stop_error = false;
+        if(gsr_capture_should_stop(capture, &should_stop_error)) {
+            running = 0;
+            break;
+        }
+
+        bool damaged = false;
+        if(use_damage_tracking)
+            damaged = gsr_damage_is_damaged(&damage);
+        else if(capture->is_damaged)
+            damaged = capture->is_damaged(capture);
+        else
+            damaged = true;
+
+        // TODO: Readd wayland sync warning when removing this
+        if(arg_parser.framerate_mode != GSR_FRAMERATE_MODE_CONTENT)
+            damaged = true;
+
+        if(damaged)
+            ++damage_fps_counter;
 
-        double time_now = glfwGetTime();
-        double frame_timer_elapsed = time_now - frame_timer_start;
-        double elapsed = time_now - start_time;
+        ++fps_counter;
+        const double time_now = clock_get_monotonic_seconds();
+        //const double frame_timer_elapsed = time_now - frame_timer_start;
+        const double elapsed = time_now - fps_start_time;
         if (elapsed >= 1.0) {
-            fprintf(stderr, "update fps: %d\n", fps_counter);
-            start_time = time_now;
-            current_fps = fps_counter;
+            if(arg_parser.verbose) {
+                fprintf(stderr, "update fps: %d, damage fps: %d\n", fps_counter, damage_fps_counter);
+            }
+            fps_start_time = time_now;
             fps_counter = 0;
+            damage_fps_counter = 0;
         }
 
-        double frame_time_overflow = frame_timer_elapsed - target_fps;
-        if (frame_time_overflow >= 0.0) {
-            frame_timer_start = time_now - frame_time_overflow;
-
-            bool frame_captured = true;
-            if(redraw) {
-                redraw = false;
-                if(src_window_id) {
-                    // TODO: Use a framebuffer instead. glCopyImageSubData requires
-                    // opengl 4.2
-                    glCopyImageSubData(
-                        window_pixmap.texture_id, GL_TEXTURE_2D, 0, 0, 0, 0,
-                        window_pixmap.target_texture_id, GL_TEXTURE_2D, 0, 0, 0, 0,
-                        window_pixmap.texture_width, window_pixmap.texture_height, 1);
-                    int err = glGetError();
-                    if(err != 0) {
-                        static bool error_shown = false;
-                        if(!error_shown) {
-                            error_shown = true;
-                            fprintf(stderr, "Error: glCopyImageSubData failed, gl error: %d\n", err);
-                        }
-                    }
-                    glfwSwapBuffers(window);
-                    // int err = glGetError();
-                    // fprintf(stderr, "error: %d\n", err);
+        const double this_video_frame_time = clock_get_monotonic_seconds() - paused_time_offset;
+        const int64_t expected_frames = std::floor((this_video_frame_time - record_start_time) / target_fps);
+        const int64_t num_missed_frames = expected_frames - video_pts_counter;
+
+        if(damaged && num_missed_frames >= 1 && !paused) {
+            gsr_damage_clear(&damage);
+            if(capture->clear_damage)
+                capture->clear_damage(capture);
+
+            // TODO: Dont do this if no damage?
+            egl.glClear(0);
+
+            bool capture_has_synchronous_task = false;
+            if(capture->capture_has_synchronous_task) {
+                capture_has_synchronous_task = capture->capture_has_synchronous_task(capture);
+                if(capture_has_synchronous_task) {
+                    paused_time_start = clock_get_monotonic_seconds();
+                    paused = true;
+                }
+            }
 
-                    // TODO: Remove this copy, which is only possible by using nvenc directly and encoding window_pixmap.target_texture_id
+            gsr_capture_capture(capture, &capture_metadata, &color_conversion);
+
+            if(capture_has_synchronous_task) {
+                paused_time_offset = paused_time_offset + (clock_get_monotonic_seconds() - paused_time_start);
+                paused = false;
+            }
 
-                    CUDA_MEMCPY2D memcpy_struct;
-                    memcpy_struct.srcXInBytes = 0;
-                    memcpy_struct.srcY = 0;
-                    memcpy_struct.srcMemoryType = CUmemorytype::CU_MEMORYTYPE_ARRAY;
+            gsr_egl_swap_buffers(&egl);
+            gsr_video_encoder_copy_textures_to_frame(video_encoder, video_frame, &color_conversion);
 
-                    memcpy_struct.dstXInBytes = 0;
-                    memcpy_struct.dstY = 0;
-                    memcpy_struct.dstMemoryType = CUmemorytype::CU_MEMORYTYPE_DEVICE;
+            if(hdr && !hdr_metadata_set && !is_replaying && add_hdr_metadata_to_video_stream(capture, video_stream))
+                hdr_metadata_set = true;
+
+            // TODO: Check if duplicate frame can be saved just by writing it with a different pts instead of sending it again
+            const int num_frames_to_encode = arg_parser.framerate_mode == GSR_FRAMERATE_MODE_CONSTANT ? num_missed_frames : 1;
+            for(int i = 0; i < num_frames_to_encode; ++i) {
+                if(arg_parser.framerate_mode == GSR_FRAMERATE_MODE_CONSTANT) {
+                    video_frame->pts = video_pts_counter + i;
+                } else {
+                    video_frame->pts = (this_video_frame_time - record_start_time) * (double)AV_TIME_BASE;
+                    const bool same_pts = video_frame->pts == video_prev_pts;
+                    video_prev_pts = video_frame->pts;
+                    if(same_pts)
+                        continue;
+                }
 
-                    memcpy_struct.srcArray = mapped_array;
-                    memcpy_struct.dstDevice = (CUdeviceptr)frame->data[0];
-                    memcpy_struct.dstPitch = frame->linesize[0];
-                    memcpy_struct.WidthInBytes = frame->width * 4;
-                    memcpy_struct.Height = frame->height;
-                    cuMemcpy2D(&memcpy_struct);
+                if(force_iframe_frame) {
+                    video_frame->pict_type = AV_PICTURE_TYPE_I;
+                }
 
-                    frame_captured = true;
+                int ret = avcodec_send_frame(video_codec_context, video_frame);
+                if(ret == 0) {
+                    // TODO: Move to separate thread because this could write to network (for example when livestreaming)
+                    gsr_encoder_receive_packets(&encoder, video_codec_context, video_frame->pts, VIDEO_STREAM_INDEX);
                 } else {
-                    // TODO: Check when src_cu_device_ptr changes and re-register resource
-                    uint32_t byte_size = 0;
-                    CUdeviceptr src_cu_device_ptr = 0;
-                    frame_captured = nv_fbc_library.capture(&src_cu_device_ptr, &byte_size);
-                    frame->data[0] = (uint8_t*)src_cu_device_ptr;
+                    fprintf(stderr, "gsr error: avcodec_send_frame failed, error: %s\n", av_error_to_string(ret));
+                }
+
+                if(force_iframe_frame) {
+                    force_iframe_frame = false;
+                    video_frame->pict_type = AV_PICTURE_TYPE_NONE;
                 }
-                // res = cuCtxPopCurrent(&old_ctx);
             }
 
-            frame->pts = (clock_get_monotonic_seconds() - start_time_pts) * AV_TIME_BASE;
-            if (avcodec_send_frame(video_codec_context, frame) >= 0) {
-                receive_frames(video_codec_context, VIDEO_STREAM_INDEX, video_stream, frame, av_format_context,
-                               record_start_time, frame_data_queue, replay_buffer_size_secs, frames_erased, write_output_mutex);
+            video_pts_counter += num_missed_frames;
+        }
+
+        if(toggle_pause == 1 && !is_replaying) {
+            const bool new_paused_state = !paused;
+            if(new_paused_state) {
+                paused_time_start = clock_get_monotonic_seconds();
+                fprintf(stderr, "Paused\n");
             } else {
-                fprintf(stderr, "Error: avcodec_send_frame failed\n");
+                paused_time_offset = paused_time_offset + (clock_get_monotonic_seconds() - paused_time_start);
+                fprintf(stderr, "Unpaused\n");
+            }
+
+            toggle_pause = 0;
+            paused = !paused;
+        }
+
+        if(toggle_replay_recording && !arg_parser.replay_recording_directory) {
+            toggle_replay_recording = 0;
+            printf("gsr error: Unable to start recording since the -ro option was not specified\n");
+            fflush(stdout);
+        }
+
+        if(toggle_replay_recording && arg_parser.replay_recording_directory) {
+            toggle_replay_recording = 0;
+            const bool new_replay_recording_state = !replay_recording;
+            if(new_replay_recording_state) {
+                std::lock_guard<std::mutex> lock(audio_filter_mutex);
+                replay_recording_items.clear();
+                replay_recording_filepath = create_new_recording_filepath_from_timestamp(arg_parser.replay_recording_directory, "Video", file_extension, arg_parser.date_folders);
+                replay_recording_start_result = start_recording_create_streams(replay_recording_filepath.c_str(), arg_parser.container_format, video_codec_context, audio_tracks, hdr, capture);
+                if(replay_recording_start_result.av_format_context) {
+                    const size_t video_recording_destination_id = gsr_encoder_add_recording_destination(&encoder, video_codec_context, replay_recording_start_result.av_format_context, replay_recording_start_result.video_stream, video_frame->pts);
+                    if(video_recording_destination_id != (size_t)-1)
+                        replay_recording_items.push_back(video_recording_destination_id);
+
+                    for(const auto &audio_input : replay_recording_start_result.audio_inputs) {
+                        const size_t audio_recording_destination_id = gsr_encoder_add_recording_destination(&encoder, audio_input.audio_track->codec_context, replay_recording_start_result.av_format_context, audio_input.stream, audio_input.audio_track->pts);
+                        if(audio_recording_destination_id != (size_t)-1)
+                            replay_recording_items.push_back(audio_recording_destination_id);
+                    }
+
+                    replay_recording = true;
+                    force_iframe_frame = true;
+                    fprintf(stderr, "Started recording\n");
+                } else {
+                    printf("gsr error: Failed to start recording\n");
+                    fflush(stdout);
+                }
+            } else if(replay_recording_start_result.av_format_context) {
+                for(size_t id : replay_recording_items) {
+                    gsr_encoder_remove_recording_destination(&encoder, id);
+                }
+                replay_recording_items.clear();
+
+                if(stop_recording_close_streams(replay_recording_start_result.av_format_context)) {
+                    fprintf(stderr, "Stopped recording\n");
+                    puts(replay_recording_filepath.c_str());
+                    fflush(stdout);
+                    if(arg_parser.recording_saved_script)
+                        run_recording_saved_script_async(arg_parser.recording_saved_script, replay_recording_filepath.c_str(), "regular");
+                } else {
+                    printf("gsr error: Failed to save recording\n");
+                    fflush(stdout);
+                }
+
+                replay_recording_start_result = RecordingStartResult{};
+                replay_recording = false;
+                replay_recording_filepath.clear();
             }
         }
 
         if(save_replay_thread.valid() && save_replay_thread.wait_for(std::chrono::seconds(0)) == std::future_status::ready) {
             save_replay_thread.get();
-            puts(save_replay_output_filepath.c_str());
-            for(size_t i = 0; i < save_replay_packets.size(); ++i) {
-                av_packet_unref(&save_replay_packets[i]);
+            if(save_replay_output_filepath.empty()) {
+                printf("gsr error: Failed to save replay\n");
+                fflush(stdout);
+            } else {
+                puts(save_replay_output_filepath.c_str());
+                fflush(stdout);
+                if(arg_parser.recording_saved_script)
+                    run_recording_saved_script_async(arg_parser.recording_saved_script, save_replay_output_filepath.c_str(), "replay");
             }
-            save_replay_packets.clear();
         }
 
-        if(save_replay == 1 && !save_replay_thread.valid() && replay_buffer_size_secs != -1) {
-            save_replay = 0;
-            save_replay_async(video_codec_context, audio_codec_context, VIDEO_STREAM_INDEX, AUDIO_STREAM_INDEX, frame_data_queue, frames_erased, filename, container_format);
+        if(save_replay_seconds != 0 && !save_replay_thread.valid() && is_replaying) {
+            int current_save_replay_seconds = save_replay_seconds;
+            if(current_save_replay_seconds > 0)
+                current_save_replay_seconds += arg_parser.keyint;
+
+            save_replay_seconds = 0;
+            save_replay_output_filepath.clear();
+            save_replay_async(video_codec_context, VIDEO_STREAM_INDEX, audio_tracks, encoder.replay_buffer, arg_parser.filename, arg_parser.container_format, file_extension, arg_parser.date_folders, hdr, capture, current_save_replay_seconds);
+
+            if(arg_parser.restart_replay_on_save && current_save_replay_seconds == save_replay_seconds_full)
+                gsr_replay_buffer_clear(encoder.replay_buffer);
         }
 
-        // av_frame_free(&frame);
-        double frame_end = glfwGetTime();
-        double frame_sleep_fps = 1.0 / 250.0;
-        double sleep_time = frame_sleep_fps - (frame_end - frame_start);
-        if(sleep_time > 0.0)
-            usleep(sleep_time * 1000.0 * 1000.0);
+        const double time_at_frame_end = clock_get_monotonic_seconds() - paused_time_offset;
+        const double time_elapsed_total = time_at_frame_end - record_start_time;
+        const int64_t frames_elapsed = std::floor(time_elapsed_total / target_fps);
+        const double time_at_next_frame = (frames_elapsed + 1) * target_fps;
+        double time_to_next_frame = time_at_next_frame - time_elapsed_total;
+        if(time_to_next_frame > target_fps)
+            time_to_next_frame = target_fps;
+        const int64_t end_num_missed_frames = frames_elapsed - video_pts_counter;
+
+        if(time_to_next_frame > 0.0 && end_num_missed_frames <= 0)
+            av_usleep(time_to_next_frame * 1000.0 * 1000.0);
+        else {
+            if(paused)
+                av_usleep(20.0 * 1000.0); // 20 milliseconds
+            else if(arg_parser.framerate_mode == GSR_FRAMERATE_MODE_CONTENT)
+                av_usleep(2.8 * 1000.0); // 2.8 milliseconds
+        }
     }
 
-	running = 0;
+    running = 0;
 
-    if(save_replay_thread.valid())
+    if(save_replay_thread.valid()) {
         save_replay_thread.get();
+        if(save_replay_output_filepath.empty()) {
+            // TODO: Output failed to save
+        } else {
+            puts(save_replay_output_filepath.c_str());
+            fflush(stdout);
+            if(arg_parser.recording_saved_script)
+                run_recording_saved_script_async(arg_parser.recording_saved_script, save_replay_output_filepath.c_str(), "replay");
+        }
+    }
+
+    if(replay_recording_start_result.av_format_context) {
+        for(size_t id : replay_recording_items) {
+            gsr_encoder_remove_recording_destination(&encoder, id);
+        }
+        replay_recording_items.clear();
+
+        if(stop_recording_close_streams(replay_recording_start_result.av_format_context)) {
+            fprintf(stderr, "Stopped recording\n");
+            puts(replay_recording_filepath.c_str());
+            fflush(stdout);
+            if(arg_parser.recording_saved_script)
+                run_recording_saved_script_async(arg_parser.recording_saved_script, replay_recording_filepath.c_str(), "regular");
+        } else {
+            printf("gsr error: Failed to save recording\n");
+            fflush(stdout);
+        }
+    }
 
-    if(audio_input_arg.value) {
-        audio_thread.join();
-        sound_device_close(&sound_device);
+    for(AudioTrack &audio_track : audio_tracks) {
+        for(auto &audio_device : audio_track.audio_devices) {
+            audio_device.thread.join();
+            sound_device_close(&audio_device.sound_device);
+        }
     }
 
-    if (replay_buffer_size_secs == -1 && av_write_trailer(av_format_context) != 0) {
+    if(amix_thread.joinable())
+        amix_thread.join();
+
+    // TODO: Replace this with start_recording_create_streams
+    if(!is_replaying && av_write_trailer(av_format_context) != 0) {
         fprintf(stderr, "Failed to write trailer\n");
     }
 
-    if(replay_buffer_size_secs == -1 && !(output_format->flags & AVFMT_NOFILE))
+    if(!is_replaying) {
         avio_close(av_format_context->pb);
+        avformat_free_context(av_format_context);
+    }
+
+    gsr_damage_deinit(&damage);
+    gsr_color_conversion_deinit(&color_conversion);
+    gsr_video_encoder_destroy(video_encoder, video_codec_context);
+    gsr_encoder_deinit(&encoder);
+    gsr_capture_destroy(capture);
+#ifdef GSR_APP_AUDIO
+    gsr_pipewire_audio_deinit(&pipewire_audio);
+#endif
+
+    if(!is_replaying && arg_parser.recording_saved_script)
+        run_recording_saved_script_async(arg_parser.recording_saved_script, arg_parser.filename, "regular");
 
     if(dpy) {
-        XCompositeUnredirectWindow(dpy, src_window_id, CompositeRedirectAutomatic);
-        XCloseDisplay(dpy);
+        // TODO: This causes a crash, why? maybe some other library dlclose xlib and that also happened to unload this???
+        //XCloseDisplay(dpy);
     }
 
-    unlink(pid_file);
+    //gsr_egl_unload(&egl);
+    //gsr_window_destroy(&window);
+
+    //av_frame_free(&video_frame);
+    free(empty_audio);
+    args_parser_deinit(&arg_parser);
+    // We do an _exit here because cuda uses at_exit to do _something_ that causes the program to freeze,
+    // but only on some nvidia driver versions on some gpus (RTX?), and _exit exits the program without calling
+    // the at_exit registered functions.
+    // Cuda (cuvid library in this case) seems to be waiting for a thread that never finishes execution.
+    // Maybe this happens because we dont clean up all ffmpeg resources?
+    // TODO: Investigate this.
+    _exit(should_stop_error ? 3 : 0);
 }