diff --git a/.github/ISSUE_TEMPLATE/bug_report.md b/.github/ISSUE_TEMPLATE/bug_report.md new file mode 100644 index 00000000..dd84ea78 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/bug_report.md @@ -0,0 +1,38 @@ +--- +name: Bug report +about: Create a report to help us improve +title: '' +labels: '' +assignees: '' + +--- + +**Describe the bug** +A clear and concise description of what the bug is. + +**To Reproduce** +Steps to reproduce the behavior: +1. Go to '...' +2. Click on '....' +3. Scroll down to '....' +4. See error + +**Expected behavior** +A clear and concise description of what you expected to happen. + +**Screenshots** +If applicable, add screenshots to help explain your problem. + +**Desktop (please complete the following information):** + - OS: [e.g. iOS] + - Browser [e.g. chrome, safari] + - Version [e.g. 22] + +**Smartphone (please complete the following information):** + - Device: [e.g. iPhone6] + - OS: [e.g. iOS8.1] + - Browser [e.g. stock browser, safari] + - Version [e.g. 22] + +**Additional context** +Add any other context about the problem here. diff --git a/.github/ISSUE_TEMPLATE/feature_request.md b/.github/ISSUE_TEMPLATE/feature_request.md new file mode 100644 index 00000000..bbcbbe7d --- /dev/null +++ b/.github/ISSUE_TEMPLATE/feature_request.md @@ -0,0 +1,20 @@ +--- +name: Feature request +about: Suggest an idea for this project +title: '' +labels: '' +assignees: '' + +--- + +**Is your feature request related to a problem? Please describe.** +A clear and concise description of what the problem is. Ex. I'm always frustrated when [...] + +**Describe the solution you'd like** +A clear and concise description of what you want to happen. + +**Describe alternatives you've considered** +A clear and concise description of any alternative solutions or features you've considered. + +**Additional context** +Add any other context or screenshots about the feature request here. 
diff --git a/.gitignore b/.gitignore index 1a84c28c..49708f47 100644 --- a/.gitignore +++ b/.gitignore @@ -171,4 +171,9 @@ cython_debug/ .vscode *.bin -.DS_Store \ No newline at end of file +.DS_Store + +# gpt4all-chat +CMakeLists.txt.user +gpt4all-chat/meta/* +gpt4all-chat/models/* diff --git a/.gitmodules b/.gitmodules index 371af62e..eb06ee48 100644 --- a/.gitmodules +++ b/.gitmodules @@ -1,3 +1,3 @@ -[submodule "peft"] - path = peft - url = https://github.com/huggingface/peft.git +[submodule "llama.cpp"] + path = gpt4all-chat/llmodel/llama.cpp + url = https://github.com/manyoso/llama.cpp.git diff --git a/gpt4all-chat/CMakeLists.txt b/gpt4all-chat/CMakeLists.txt new file mode 100644 index 00000000..fbe018b9 --- /dev/null +++ b/gpt4all-chat/CMakeLists.txt @@ -0,0 +1,225 @@ +cmake_minimum_required(VERSION 3.16) + +if(APPLE) + option(BUILD_UNIVERSAL "Build a Universal binary on macOS" OFF) + if(BUILD_UNIVERSAL) + # Build a Universal binary on macOS + # This requires that the found Qt library is compiled as Universal binaries. 
+ set(CMAKE_OSX_ARCHITECTURES "arm64;x86_64" CACHE STRING "" FORCE) + else() + # Build for the host architecture on macOS + set(CMAKE_OSX_ARCHITECTURES "${CMAKE_HOST_SYSTEM_PROCESSOR}" CACHE STRING "" FORCE) + endif() +endif() + +set(APP_VERSION_MAJOR 2) +set(APP_VERSION_MINOR 4) +set(APP_VERSION_PATCH 2) +set(APP_VERSION "${APP_VERSION_MAJOR}.${APP_VERSION_MINOR}.${APP_VERSION_PATCH}") + +# Include the binary directory for the generated header file +include_directories("${CMAKE_CURRENT_BINARY_DIR}") + +project(gpt4all VERSION ${APP_VERSION} LANGUAGES CXX C) + +set(CMAKE_AUTOMOC ON) +set(CMAKE_AUTORCC ON) +set(CMAKE_CXX_STANDARD_REQUIRED ON) + +option(GPT4ALL_LOCALHOST OFF "Build installer for localhost repo") +option(GPT4ALL_AVX_ONLY OFF "Build for avx only") +option(GPT4ALL_OFFLINE_INSTALLER "Build an offline installer" OFF) + +# Generate a header file with the version number +configure_file( + "${CMAKE_CURRENT_SOURCE_DIR}/cmake/config.h.in" + "${CMAKE_CURRENT_BINARY_DIR}/config.h" +) + +find_package(Qt6 6.2 COMPONENTS Core Quick QuickDialogs2 Svg REQUIRED) + +# Get the Qt6Core target properties +get_target_property(Qt6Core_INCLUDE_DIRS Qt6::Core INTERFACE_INCLUDE_DIRECTORIES) +get_target_property(Qt6Core_LIBRARY_RELEASE Qt6::Core LOCATION_RELEASE) + +# Find the qmake binary +find_program(QMAKE_EXECUTABLE NAMES qmake qmake6 PATHS ${Qt6Core_INCLUDE_DIRS}/../.. NO_DEFAULT_PATH) + +# Get the Qt 6 root directory +get_filename_component(Qt6_ROOT_DIR "${Qt6Core_LIBRARY_RELEASE}" DIRECTORY) +get_filename_component(Qt6_ROOT_DIR "${Qt6_ROOT_DIR}/.." 
ABSOLUTE) + +message(STATUS "qmake binary: ${QMAKE_EXECUTABLE}") +message(STATUS "Qt 6 root directory: ${Qt6_ROOT_DIR}") + +add_subdirectory(llmodel) + +set (CMAKE_RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/bin) + +qt_add_executable(chat + main.cpp + chat.h chat.cpp + chatllm.h chatllm.cpp + chatmodel.h chatlistmodel.h chatlistmodel.cpp + download.h download.cpp + network.h network.cpp + llm.h llm.cpp + sysinfo.h +) + +qt_add_qml_module(chat + URI gpt4all + VERSION 1.0 + QML_FILES + main.qml + qml/ChatDrawer.qml + qml/ModelDownloaderDialog.qml + qml/NetworkDialog.qml + qml/NewVersionDialog.qml + qml/ThumbsDownDialog.qml + qml/SettingsDialog.qml + qml/StartupDialog.qml + qml/PopupDialog.qml + qml/AboutDialog.qml + qml/Theme.qml + RESOURCES + icons/send_message.svg + icons/stop_generating.svg + icons/regenerate.svg + icons/copy.svg + icons/settings.svg + icons/edit.svg + icons/trash.svg + icons/network.svg + icons/thumbs_up.svg + icons/thumbs_down.svg + icons/logo.svg + icons/logo-32.png + icons/logo-48.png + icons/favicon.ico + icons/favicon.icns +) + +set_target_properties(chat PROPERTIES + MACOSX_BUNDLE_GUI_IDENTIFIER gpt4all + MACOSX_BUNDLE_BUNDLE_VERSION ${PROJECT_VERSION} + MACOSX_BUNDLE_SHORT_VERSION_STRING ${PROJECT_VERSION_MAJOR}.${PROJECT_VERSION_MINOR} + MACOSX_BUNDLE TRUE + WIN32_EXECUTABLE TRUE + MACOSX_BUNDLE_ICON_FILE "favicon.icns" +) + +if(${CMAKE_SYSTEM_NAME} MATCHES Darwin) + set_target_properties(chat PROPERTIES + OUTPUT_NAME gpt4all + ) +endif() + +target_compile_definitions(chat + PRIVATE $<$,$>:QT_QML_DEBUG>) +target_link_libraries(chat + PRIVATE Qt6::Quick Qt6::Svg) +target_link_libraries(chat + PRIVATE llmodel) + +set(COMPONENT_NAME_MAIN ${PROJECT_NAME}) +set(CMAKE_INSTALL_PREFIX ${CMAKE_BINARY_DIR}/install) + +if(NOT (CMAKE_HOST_SYSTEM_NAME STREQUAL "Darwin" AND CMAKE_HOST_SYSTEM_PROCESSOR STREQUAL "arm64")) + add_executable(test_hw test_hw.cpp) + install(TARGETS test_hw DESTINATION bin COMPONENT ${COMPONENT_NAME_MAIN}) +endif() + 
+install(TARGETS chat DESTINATION bin COMPONENT ${COMPONENT_NAME_MAIN}) +install(TARGETS llmodel DESTINATION lib COMPONENT ${COMPONENT_NAME_MAIN}) +install(TARGETS llama DESTINATION lib COMPONENT ${COMPONENT_NAME_MAIN}) + +set(CPACK_GENERATOR "IFW") +set(CPACK_VERBATIM_VARIABLES YES) +set(CPACK_IFW_VERBOSE ON) + +if(${CMAKE_SYSTEM_NAME} MATCHES Linux) + set(LINUXDEPLOYQT "$ENV{HOME}/dev/linuxdeployqt/build/tools/linuxdeployqt/linuxdeployqt") + configure_file("${CMAKE_CURRENT_SOURCE_DIR}/cmake/deploy-qt-linux.cmake.in" + "${CMAKE_BINARY_DIR}/cmake/deploy-qt-linux.cmake" @ONLY) + set(CPACK_PRE_BUILD_SCRIPTS ${CMAKE_BINARY_DIR}/cmake/deploy-qt-linux.cmake) + set(CPACK_IFW_ROOT "~/Qt/Tools/QtInstallerFramework/4.5") + set(CPACK_PACKAGE_FILE_NAME "${COMPONENT_NAME_MAIN}-installer-linux") + set(CPACK_IFW_TARGET_DIRECTORY "@HomeDir@/${COMPONENT_NAME_MAIN}") +elseif(${CMAKE_SYSTEM_NAME} MATCHES Windows) + find_program(WINDEPLOYQT windeployqt HINTS ${_qt_bin_dir}) + configure_file("${CMAKE_CURRENT_SOURCE_DIR}/cmake/deploy-qt-windows.cmake.in" + "${CMAKE_BINARY_DIR}/cmake/deploy-qt-windows.cmake" @ONLY) + set(CPACK_PRE_BUILD_SCRIPTS ${CMAKE_BINARY_DIR}/cmake/deploy-qt-windows.cmake) + set(CPACK_IFW_ROOT "C:/Qt/Tools/QtInstallerFramework/4.5") + set(CPACK_IFW_PACKAGE_ICON "${CMAKE_CURRENT_SOURCE_DIR}/icons/favicon.ico") + set(CPACK_PACKAGE_FILE_NAME "${COMPONENT_NAME_MAIN}-installer-win64") + set(CPACK_IFW_TARGET_DIRECTORY "@HomeDir@\\${COMPONENT_NAME_MAIN}") +elseif(${CMAKE_SYSTEM_NAME} MATCHES Darwin) + find_program(MACDEPLOYQT macdeployqt HINTS ${_qt_bin_dir}) + configure_file("${CMAKE_CURRENT_SOURCE_DIR}/cmake/deploy-qt-mac.cmake.in" + "${CMAKE_BINARY_DIR}/cmake/deploy-qt-mac.cmake" @ONLY) + set(CPACK_PRE_BUILD_SCRIPTS ${CMAKE_BINARY_DIR}/cmake/deploy-qt-mac.cmake) + set(CPACK_IFW_ROOT "~/Qt/Tools/QtInstallerFramework/4.5") + set(CPACK_IFW_PACKAGE_ICON "${CMAKE_CURRENT_SOURCE_DIR}/icons/favicon.icns") + set(CPACK_PACKAGE_FILE_NAME 
"${COMPONENT_NAME_MAIN}-installer-darwin") + set(CPACK_IFW_TARGET_DIRECTORY "@ApplicationsDir@/${COMPONENT_NAME_MAIN}") + set(CPACK_BUNDLE_NAME ${COMPONENT_NAME_MAIN}) + set(CPACK_BUNDLE_ICON "${CMAKE_CURRENT_SOURCE_DIR}/icons/favicon.icns") +endif() + +set(CPACK_PACKAGE_INSTALL_DIRECTORY ${COMPONENT_NAME_MAIN}) +set(CPACK_PACKAGE_VERSION_MAJOR ${PROJECT_VERSION_MAJOR}) +set(CPACK_PACKAGE_VERSION_MINOR ${PROJECT_VERSION_MINOR}) +SET(CPACK_PACKAGE_VERSION_PATCH ${PROJECT_VERSION_PATCH}) +set(CPACK_PACKAGE_HOMEPAGE_URL "https://gpt4all.io") +set(CPACK_PACKAGE_ICON "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-48.png") +set(CPACK_RESOURCE_FILE_LICENSE ${CMAKE_CURRENT_SOURCE_DIR}/LICENSE) +set(CPACK_RESOURCE_FILE_README ${CMAKE_CURRENT_SOURCE_DIR}/README.md) +set(CPACK_PACKAGE_EXECUTABLES "GPT4All") +set(CPACK_CREATE_DESKTOP_LINKS "GPT4All") +set(CPACK_IFW_PACKAGE_NAME "GPT4All") +set(CPACK_IFW_PACKAGE_TITLE "GPT4All Installer") +set(CPACK_IFW_PACKAGE_PUBLISHER "Nomic, Inc.") +set(CPACK_IFW_PRODUCT_URL "https://gpt4all.io") +set(CPACK_IFW_PACKAGE_WIZARD_STYLE "Aero") +set(CPACK_IFW_PACKAGE_LOGO "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-48.png") +set(CPACK_IFW_PACKAGE_WINDOW_ICON "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-32.png") +set(CPACK_IFW_PACKAGE_WIZARD_SHOW_PAGE_LIST OFF) + +include(InstallRequiredSystemLibraries) +include(CPack) +include(CPackIFW) +cpack_add_component(${COMPONENT_NAME_MAIN} DOWNLOADED) +cpack_ifw_configure_component(${COMPONENT_NAME_MAIN} ESSENTIAL FORCED_INSTALLATION) +cpack_ifw_configure_component(${COMPONENT_NAME_MAIN} VERSION ${APP_VERSION}) +cpack_ifw_configure_component(${COMPONENT_NAME_MAIN} LICENSES "MIT LICENSE" ${CPACK_RESOURCE_FILE_LICENSE}) +cpack_ifw_configure_component(${COMPONENT_NAME_MAIN} SCRIPT "${CMAKE_CURRENT_SOURCE_DIR}/cmake/installerscript.qs") +cpack_ifw_configure_component(${COMPONENT_NAME_MAIN} REPLACES "gpt4all-chat") #Was used in very earliest prototypes + +if (GPT4ALL_LOCALHOST) + cpack_ifw_add_repository("GPT4AllRepository" 
URL "http://localhost/repository") +elseif(GPT4ALL_OFFLINE_INSTALLER) + cpack_ifw_add_repository("GPT4AllRepository" URL "file://${CMAKE_BINARY_DIR}/packages") +else() + if(${CMAKE_SYSTEM_NAME} MATCHES Linux) + if (GPT4ALL_AVX_ONLY) + cpack_ifw_add_repository("GPT4AllRepository" URL "https://gpt4all.io/installer_repos/avx_only/linux/repository") + else() + cpack_ifw_add_repository("GPT4AllRepository" URL "https://gpt4all.io/installer_repos/linux/repository") + endif() + elseif(${CMAKE_SYSTEM_NAME} MATCHES Windows) + #To sign the target on windows have to create a batch script add use it as a custom target and then use CPACK_IFW_EXTRA_TARGETS to set this extra target + if (GPT4ALL_AVX_ONLY) + cpack_ifw_add_repository("GPT4AllRepository" URL "https://gpt4all.io/installer_repos/avx_only/windows/repository") + else() + cpack_ifw_add_repository("GPT4AllRepository" URL "https://gpt4all.io/installer_repos/windows/repository") + endif() + elseif(${CMAKE_SYSTEM_NAME} MATCHES Darwin) + if (GPT4ALL_AVX_ONLY) + cpack_ifw_add_repository("GPT4AllRepository" URL "https://gpt4all.io/installer_repos/avx_only/mac/repository") + else() + cpack_ifw_add_repository("GPT4AllRepository" URL "https://gpt4all.io/installer_repos/mac/repository") + endif() + endif() +endif() diff --git a/gpt4all-chat/LICENSE b/gpt4all-chat/LICENSE new file mode 100644 index 00000000..09ca4546 --- /dev/null +++ b/gpt4all-chat/LICENSE @@ -0,0 +1,15 @@ +Copyright 2023 Nomic, Inc., Aaron Miller + +Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all copies or 
substantial portions of the Software. + +THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. + +ADDENDUM: + +Any LLM models that are loaded and used by the application are not themselves +subject to this license if indeed they are even copyrightable. The terms of +this license apply only to the application software and its accompanying +documentation and do not extend to any LLM models, whether created by the +author of the application or obtained from third-party sources. diff --git a/gpt4all-chat/README.md b/gpt4all-chat/README.md index d78f4611..4bbe6016 100644 --- a/gpt4all-chat/README.md +++ b/gpt4all-chat/README.md @@ -1,2 +1,78 @@ -# GPT4All Chat -This directory will contain the code to build out the QT chat GUI. +# gpt4all-chat + +Cross platform Qt based GUI for GPT4All versions with GPT-J as the base +model. NOTE: The model seen in the screenshot is actually a preview of a +new training run for GPT4All based on GPT-J. The GPT4All project is busy +at work getting ready to release this model including installers for all +three major OS's. In the meantime, you can try this UI out with the original +GPT-J model by following build instructions below. 
+ +![image](https://user-images.githubusercontent.com/50458173/231464085-da9edff6-a593-410e-8f38-7513f75c8aab.png) + +## Install + +One click installers for macOS, Linux, and Windows at https://gpt4all.io + +## Features + +* Cross-platform (Linux, Windows, MacOSX) +* Fast CPU based inference using ggml for GPT-J based models +* The UI is made to look and feel like you've come to expect from a chatty gpt +* Check for updates so you can always stay fresh with latest models +* Easy to install with precompiled binaries available for all three major desktop platforms +* Multi-modal - Ability to load more than one model and switch between them +* Supports both llama.cpp and gptj.cpp style models +* Model downloader in GUI featuring many popular open source models +* Settings dialog to change temp, top_p, top_k, threads, etc +* Copy your conversation to clipboard +* Check for updates to get the very latest GUI + +## Feature wishlist + +* Multi-chat - a list of current and past chats and the ability to save/delete/export and switch between +* Text to speech - have the AI respond with voice +* Speech to text - give the prompt with your voice +* Python bindings +* Typescript bindings +* Plugin support for langchain and other developer tools +* Save your prompt/responses to disk +* Upload prompt/responses manually/automatically to nomic.ai to aid future training runs +* Syntax highlighting support for programming languages, etc. +* REST API with a built-in webserver in the chat gui itself with a headless operation mode as well +* Advanced settings for changing temperature, topk, etc. (DONE) +* YOUR IDEA HERE + +## Building and running + +* Follow the visual instructions on the [build_and_run](build_and_run.md) page + +## Getting the latest + +If you've already checked out the source code and/or built the program make sure when you do a git fetch to get the latest changes and that you also do ```git submodule update --init --recursive``` to update the submodules. 
+ +## Manual download of models +* https://gpt4all.io/models/ggml-mpt-7b-chat.bin (default) (md5sum 756249d3d6abe23bde3b1ae272628640) Current best non-commercially licensable chat model based on MPT and trained by Mosaic ML. +* https://gpt4all.io/models/ggml-gpt4all-j-v1.3-groovy.bin (default) (md5sum 81a09a0ddf89690372fc296ff7f625af) Current best commercially licensable model based on GPT-J and trained by Nomic AI on the latest curated GPT4All dataset. +* https://gpt4all.io/models/ggml-gpt4all-l13b-snoozy.bin (md5sum 91f886b68fbce697e9a3cd501951e455) Current best non-commercially licensable model based on Llama 13b and trained by Nomic AI on the latest curated GPT4All dataset. +* https://gpt4all.io/models/ggml-gpt4all-j-v1.2-jazzy.bin (md5sum 879344aaa9d62fdccbda0be7a09e7976) A commercially licensable model based on GPT-J and trained by Nomic AI on the v2 GPT4All dataset. +* https://gpt4all.io/models/ggml-gpt4all-j-v1.1-breezy.bin (md5sum 61d48a82cb188cceb14ebb8082bfec37) A commercially licensable model based on GPT-J and trained by Nomic AI on the v1 GPT4All dataset. +* https://gpt4all.io/models/ggml-gpt4all-j.bin (md5sum 5b5a3f9b858d33b29b52b89692415595) A commercially licensable model based on GPT-J and trained by Nomic AI on the v0 GPT4All dataset. +* https://gpt4all.io/models/ggml-vicuna-7b-1.1-q4_2.bin (md5sum 29119f8fa11712704c6b22ac5ab792ea) A non-commercially licensable model based on Llama 7b and trained by teams from UC Berkeley, CMU, Stanford, MBZUAI, and UC San Diego. +* https://gpt4all.io/models/ggml-vicuna-13b-1.1-q4_2.bin (md5sum 95999b7b0699e2070af63bf5d34101a8) A non-commercially licensable model based on Llama 13b and trained by teams from UC Berkeley, CMU, Stanford, MBZUAI, and UC San Diego. +* https://gpt4all.io/models/ggml-wizardLM-7B.q4_2.bin (md5sum 99e6d129745a3f1fb1121abed747b05a) A non-commercially licensable model based on Llama 7b and trained by Microsoft and Peking University. 
+* https://gpt4all.io/models/ggml-stable-vicuna-13B.q4_2.bin (md5sum 6cb4ee297537c9133bddab9692879de0) An non-commercially licensable model based on Llama 13b and RLHF trained by Stable AI. +* https://gpt4all.io/models/ggml-mpt-7b-base.bin (md5sum 120c32a51d020066288df045ef5d52b9) A commercially licensable model base pre-trained by Mosaic ML. + +## Terminal Only Interface with no Qt dependency + +Check out https://github.com/kuvaus/LlamaGPTJ-chat which is using the llmodel backend so it is compliant with our ecosystem and all models downloaded above should work with it. + +## Contributing + +* Pull requests welcome. See the feature wish list for ideas :) + + +## License +The source code of this chat interface is currently under a MIT license. The underlying GPT4All-j model is released under non-restrictive open-source Apache 2 License. + +The GPT4All-J license allows for users to use generated outputs as they see fit. Users take responsibility for ensuring their content meets applicable requirements for publication in a given context or region. diff --git a/gpt4all-chat/build_and_run.md b/gpt4all-chat/build_and_run.md new file mode 100644 index 00000000..e111d0b4 --- /dev/null +++ b/gpt4all-chat/build_and_run.md @@ -0,0 +1,57 @@ +# Install Qt 6.x and setup/build gpt4all-chat from source + +Depending upon your operating system, there are many ways that Qt is distributed. +Here is the recommended method for getting the Qt dependency installed to setup and build +gpt4all-chat from source. 
+ +## Create a [Qt account](https://login.qt.io/register) + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/d1e44cab-4245-4144-a91c-7b02267df2b2) + +## Go to the Qt open source [download page](https://www.qt.io/download-qt-installer-oss) + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/d68f5f45-cca3-4fe9-acf4-cabdcb95f669) + +## Start the installer and sign in + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/899b1422-51ae-4bb5-acc9-b9027a8e9b19) + +## After some screens about license, select custom + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/2290031a-fdb0-4f47-a7f1-d77ad5451068) + +## Select the following + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/c6e999e5-cc8a-4dfc-8065-b59139e8c7ae) + +NOTE: This is for macOS. For Linux it is similar, but you need ming64 for Windows, not the MSVC install + +## Open up QtCreator + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/a34978f4-a220-459c-af66-e901d7ccd7bb) + +## Clone the git repo for gpt4all-chat + +``` +git clone --recurse-submodules https://github.com/nomic-ai/gpt4all-chat +``` + +## Open the gpt4all-chat project in QtCreator + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/3d3e2743-2a1d-43d6-9e55-62f7f4306de7) + +NOTE: File->Open File or Project and navigate to the gpt4all-chat repo and choose the CMakeLists.txt + +## Configure project + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/44d5aafb-a95d-434b-ba2a-a3138c0e49a0) + +## Build project + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/43cd7b42-32f0-4efa-9612-d51f85637103) + +## Run project + +![image](https://github.com/nomic-ai/gpt4all-chat/assets/10168/611ea795-bdcd-4feb-a466-eb1c2e936e7e) + + diff --git a/gpt4all-chat/chat.cpp b/gpt4all-chat/chat.cpp new file mode 100644 index 00000000..2a6b941f --- /dev/null +++ b/gpt4all-chat/chat.cpp @@ -0,0 +1,274 @@ +#include "chat.h" +#include "llm.h" +#include 
"network.h" +#include "download.h" + +Chat::Chat(QObject *parent) + : QObject(parent) + , m_id(Network::globalInstance()->generateUniqueId()) + , m_name(tr("New Chat")) + , m_chatModel(new ChatModel(this)) + , m_responseInProgress(false) + , m_creationDate(QDateTime::currentSecsSinceEpoch()) + , m_llmodel(new ChatLLM(this)) +{ + // Should be in same thread + connect(Download::globalInstance(), &Download::modelListChanged, this, &Chat::modelListChanged, Qt::DirectConnection); + connect(this, &Chat::modelNameChanged, this, &Chat::modelListChanged, Qt::DirectConnection); + + // Should be in different threads + connect(m_llmodel, &ChatLLM::isModelLoadedChanged, this, &Chat::isModelLoadedChanged, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::responseChanged, this, &Chat::handleResponseChanged, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::responseStarted, this, &Chat::responseStarted, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::responseStopped, this, &Chat::responseStopped, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::modelNameChanged, this, &Chat::handleModelNameChanged, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::modelLoadingError, this, &Chat::modelLoadingError, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::recalcChanged, this, &Chat::handleRecalculating, Qt::QueuedConnection); + connect(m_llmodel, &ChatLLM::generatedNameChanged, this, &Chat::generatedNameChanged, Qt::QueuedConnection); + + connect(this, &Chat::promptRequested, m_llmodel, &ChatLLM::prompt, Qt::QueuedConnection); + connect(this, &Chat::modelNameChangeRequested, m_llmodel, &ChatLLM::modelNameChangeRequested, Qt::QueuedConnection); + connect(this, &Chat::loadDefaultModelRequested, m_llmodel, &ChatLLM::loadDefaultModel, Qt::QueuedConnection); + connect(this, &Chat::loadModelRequested, m_llmodel, &ChatLLM::loadModel, Qt::QueuedConnection); + connect(this, &Chat::unloadModelRequested, m_llmodel, &ChatLLM::unloadModel, Qt::QueuedConnection); + 
connect(this, &Chat::reloadModelRequested, m_llmodel, &ChatLLM::reloadModel, Qt::QueuedConnection); + connect(this, &Chat::generateNameRequested, m_llmodel, &ChatLLM::generateName, Qt::QueuedConnection); + + // The following are blocking operations and will block the gui thread, therefore must be fast + // to respond to + connect(this, &Chat::regenerateResponseRequested, m_llmodel, &ChatLLM::regenerateResponse, Qt::BlockingQueuedConnection); + connect(this, &Chat::resetResponseRequested, m_llmodel, &ChatLLM::resetResponse, Qt::BlockingQueuedConnection); + connect(this, &Chat::resetContextRequested, m_llmodel, &ChatLLM::resetContext, Qt::BlockingQueuedConnection); +} + +void Chat::reset() +{ + stopGenerating(); + // Erase our current on disk representation as we're completely resetting the chat along with id + LLM::globalInstance()->chatListModel()->removeChatFile(this); + emit resetContextRequested(); // blocking queued connection + m_id = Network::globalInstance()->generateUniqueId(); + emit idChanged(); + // NOTE: We deliberately do no reset the name or creation date to indictate that this was originally + // an older chat that was reset for another purpose. Resetting this data will lead to the chat + // name label changing back to 'New Chat' and showing up in the chat model list as a 'New Chat' + // further down in the list. This might surprise the user. In the future, we me might get rid of + // the "reset context" button in the UI. Right now, by changing the model in the combobox dropdown + // we effectively do a reset context. We *have* to do this right now when switching between different + // types of models. The only way to get rid of that would be a very long recalculate where we rebuild + // the context if we switch between different types of models. Probably the right way to fix this + // is to allow switching models but throwing up a dialog warning users if we switch between types + // of models that a long recalculation will ensue. 
+ m_chatModel->clear(); +} + +bool Chat::isModelLoaded() const +{ + return m_llmodel->isModelLoaded(); +} + +void Chat::prompt(const QString &prompt, const QString &prompt_template, int32_t n_predict, + int32_t top_k, float top_p, float temp, int32_t n_batch, float repeat_penalty, + int32_t repeat_penalty_tokens) +{ + emit promptRequested(prompt, prompt_template, n_predict, top_k, top_p, temp, n_batch, + repeat_penalty, repeat_penalty_tokens, LLM::globalInstance()->threadCount()); +} + +void Chat::regenerateResponse() +{ + emit regenerateResponseRequested(); // blocking queued connection +} + +void Chat::stopGenerating() +{ + m_llmodel->stopGenerating(); +} + +QString Chat::response() const +{ + return m_llmodel->response(); +} + +void Chat::handleResponseChanged() +{ + const int index = m_chatModel->count() - 1; + m_chatModel->updateValue(index, response()); + emit responseChanged(); +} + +void Chat::responseStarted() +{ + m_responseInProgress = true; + emit responseInProgressChanged(); +} + +void Chat::responseStopped() +{ + m_responseInProgress = false; + emit responseInProgressChanged(); + if (m_llmodel->generatedName().isEmpty()) + emit generateNameRequested(); + if (chatModel()->count() < 3) + Network::globalInstance()->sendChatStarted(); +} + +QString Chat::modelName() const +{ + return m_llmodel->modelName(); +} + +void Chat::setModelName(const QString &modelName) +{ + // doesn't block but will unload old model and load new one which the gui can see through changes + // to the isModelLoaded property + emit modelNameChangeRequested(modelName); +} + +void Chat::newPromptResponsePair(const QString &prompt) +{ + m_chatModel->appendPrompt(tr("Prompt: "), prompt); + m_chatModel->appendResponse(tr("Response: "), prompt); + emit resetResponseRequested(); // blocking queued connection +} + +bool Chat::isRecalc() const +{ + return m_llmodel->isRecalc(); +} + +void Chat::loadDefaultModel() +{ + emit loadDefaultModelRequested(); +} + +void Chat::loadModel(const QString 
&modelName) +{ + emit loadModelRequested(modelName); +} + +void Chat::unloadModel() +{ + stopGenerating(); + emit unloadModelRequested(); +} + +void Chat::reloadModel() +{ + emit reloadModelRequested(m_savedModelName); +} + +void Chat::generatedNameChanged() +{ + // Only use the first three words maximum and remove newlines and extra spaces + QString gen = m_llmodel->generatedName().simplified(); + QStringList words = gen.split(' ', Qt::SkipEmptyParts); + int wordCount = qMin(3, words.size()); + m_name = words.mid(0, wordCount).join(' '); + emit nameChanged(); +} + +void Chat::handleRecalculating() +{ + Network::globalInstance()->sendRecalculatingContext(m_chatModel->count()); + emit recalcChanged(); +} + +void Chat::handleModelNameChanged() +{ + m_savedModelName = modelName(); + emit modelNameChanged(); +} + +bool Chat::serialize(QDataStream &stream, int version) const +{ + stream << m_creationDate; + stream << m_id; + stream << m_name; + stream << m_userName; + stream << m_savedModelName; + if (!m_llmodel->serialize(stream, version)) + return false; + if (!m_chatModel->serialize(stream, version)) + return false; + return stream.status() == QDataStream::Ok; +} + +bool Chat::deserialize(QDataStream &stream, int version) +{ + stream >> m_creationDate; + stream >> m_id; + emit idChanged(); + stream >> m_name; + stream >> m_userName; + emit nameChanged(); + stream >> m_savedModelName; + + // Prior to version 2 gptj models had a bug that fixed the kv_cache to F32 instead of F16 so + // unfortunately, we cannot deserialize these + if (version < 2 && m_savedModelName.contains("gpt4all-j")) + return false; + + if (!m_llmodel->deserialize(stream, version)) + return false; + if (!m_chatModel->deserialize(stream, version)) + return false; + emit chatModelChanged(); + return stream.status() == QDataStream::Ok; +} + +QList Chat::modelList() const +{ + // Build a model list from exepath and from the localpath + QList list; + + QString exePath = 
QCoreApplication::applicationDirPath() + QDir::separator(); + QString localPath = Download::globalInstance()->downloadLocalModelsPath(); + + { + QDir dir(exePath); + dir.setNameFilters(QStringList() << "ggml-*.bin"); + QStringList fileNames = dir.entryList(); + for (QString f : fileNames) { + QString filePath = exePath + f; + QFileInfo info(filePath); + QString name = info.completeBaseName().remove(0, 5); + if (info.exists()) { + if (name == modelName()) + list.prepend(name); + else + list.append(name); + } + } + } + + if (localPath != exePath) { + QDir dir(localPath); + dir.setNameFilters(QStringList() << "ggml-*.bin"); + QStringList fileNames = dir.entryList(); + for (QString f : fileNames) { + QString filePath = localPath + f; + QFileInfo info(filePath); + QString name = info.completeBaseName().remove(0, 5); + if (info.exists() && !list.contains(name)) { // don't allow duplicates + if (name == modelName()) + list.prepend(name); + else + list.append(name); + } + } + } + + if (list.isEmpty()) { + if (exePath != localPath) { + qWarning() << "ERROR: Could not find any applicable models in" + << exePath << "nor" << localPath; + } else { + qWarning() << "ERROR: Could not find any applicable models in" + << exePath; + } + return QList(); + } + + return list; +} diff --git a/gpt4all-chat/chat.h b/gpt4all-chat/chat.h new file mode 100644 index 00000000..4ec97ee6 --- /dev/null +++ b/gpt4all-chat/chat.h @@ -0,0 +1,106 @@ +#ifndef CHAT_H +#define CHAT_H + +#include +#include +#include + +#include "chatllm.h" +#include "chatmodel.h" + +class Chat : public QObject +{ + Q_OBJECT + Q_PROPERTY(QString id READ id NOTIFY idChanged) + Q_PROPERTY(QString name READ name WRITE setName NOTIFY nameChanged) + Q_PROPERTY(ChatModel *chatModel READ chatModel NOTIFY chatModelChanged) + Q_PROPERTY(bool isModelLoaded READ isModelLoaded NOTIFY isModelLoadedChanged) + Q_PROPERTY(QString response READ response NOTIFY responseChanged) + Q_PROPERTY(QString modelName READ modelName WRITE 
setModelName NOTIFY modelNameChanged) + Q_PROPERTY(bool responseInProgress READ responseInProgress NOTIFY responseInProgressChanged) + Q_PROPERTY(bool isRecalc READ isRecalc NOTIFY recalcChanged) + Q_PROPERTY(QList modelList READ modelList NOTIFY modelListChanged) + QML_ELEMENT + QML_UNCREATABLE("Only creatable from c++!") + +public: + explicit Chat(QObject *parent = nullptr); + + QString id() const { return m_id; } + QString name() const { return m_userName.isEmpty() ? m_name : m_userName; } + void setName(const QString &name) + { + m_userName = name; + emit nameChanged(); + } + ChatModel *chatModel() { return m_chatModel; } + + Q_INVOKABLE void reset(); + Q_INVOKABLE bool isModelLoaded() const; + Q_INVOKABLE void prompt(const QString &prompt, const QString &prompt_template, int32_t n_predict, + int32_t top_k, float top_p, float temp, int32_t n_batch, float repeat_penalty, int32_t repeat_penalty_tokens); + Q_INVOKABLE void regenerateResponse(); + Q_INVOKABLE void stopGenerating(); + Q_INVOKABLE void newPromptResponsePair(const QString &prompt); + + QString response() const; + bool responseInProgress() const { return m_responseInProgress; } + QString modelName() const; + void setModelName(const QString &modelName); + bool isRecalc() const; + + void loadDefaultModel(); + void loadModel(const QString &modelName); + void unloadModel(); + void reloadModel(); + + qint64 creationDate() const { return m_creationDate; } + bool serialize(QDataStream &stream, int version) const; + bool deserialize(QDataStream &stream, int version); + + QList modelList() const; + +Q_SIGNALS: + void idChanged(); + void nameChanged(); + void chatModelChanged(); + void isModelLoadedChanged(); + void responseChanged(); + void responseInProgressChanged(); + void promptRequested(const QString &prompt, const QString &prompt_template, int32_t n_predict, + int32_t top_k, float top_p, float temp, int32_t n_batch, float repeat_penalty, int32_t repeat_penalty_tokens, + int32_t n_threads); + void 
regenerateResponseRequested(); + void resetResponseRequested(); + void resetContextRequested(); + void modelNameChangeRequested(const QString &modelName); + void modelNameChanged(); + void recalcChanged(); + void loadDefaultModelRequested(); + void loadModelRequested(const QString &modelName); + void unloadModelRequested(); + void reloadModelRequested(const QString &modelName); + void generateNameRequested(); + void modelListChanged(); + void modelLoadingError(const QString &error); + +private Q_SLOTS: + void handleResponseChanged(); + void responseStarted(); + void responseStopped(); + void generatedNameChanged(); + void handleRecalculating(); + void handleModelNameChanged(); + +private: + QString m_id; + QString m_name; + QString m_userName; + QString m_savedModelName; + ChatModel *m_chatModel; + bool m_responseInProgress; + qint64 m_creationDate; + ChatLLM *m_llmodel; +}; + +#endif // CHAT_H diff --git a/gpt4all-chat/chatlistmodel.cpp b/gpt4all-chat/chatlistmodel.cpp new file mode 100644 index 00000000..3fd2246f --- /dev/null +++ b/gpt4all-chat/chatlistmodel.cpp @@ -0,0 +1,246 @@ +#include "chatlistmodel.h" +#include "download.h" + +#include +#include + +#define CHAT_FORMAT_MAGIC 0xF5D553CC +#define CHAT_FORMAT_VERSION 2 + +ChatListModel::ChatListModel(QObject *parent) + : QAbstractListModel(parent) + , m_newChat(nullptr) + , m_dummyChat(nullptr) + , m_currentChat(nullptr) + , m_shouldSaveChats(false) +{ + addDummyChat(); + + ChatsRestoreThread *thread = new ChatsRestoreThread; + connect(thread, &ChatsRestoreThread::chatRestored, this, &ChatListModel::restoreChat); + connect(thread, &ChatsRestoreThread::finished, this, &ChatListModel::chatsRestoredFinished); + connect(thread, &ChatsRestoreThread::finished, thread, &QObject::deleteLater); + thread->start(); +} + +bool ChatListModel::shouldSaveChats() const +{ + return m_shouldSaveChats; +} + +void ChatListModel::setShouldSaveChats(bool b) +{ + if (m_shouldSaveChats == b) + return; + m_shouldSaveChats = b; + emit 
shouldSaveChatsChanged(); +} + +void ChatListModel::removeChatFile(Chat *chat) const +{ + const QString savePath = Download::globalInstance()->downloadLocalModelsPath(); + QFile file(savePath + "/gpt4all-" + chat->id() + ".chat"); + if (!file.exists()) + return; + bool success = file.remove(); + if (!success) + qWarning() << "ERROR: Couldn't remove chat file:" << file.fileName(); +} + +void ChatListModel::saveChats() const +{ + if (!m_shouldSaveChats) + return; + + QElapsedTimer timer; + timer.start(); + const QString savePath = Download::globalInstance()->downloadLocalModelsPath(); + for (Chat *chat : m_chats) { + QString fileName = "gpt4all-" + chat->id() + ".chat"; + QFile file(savePath + "/" + fileName); + bool success = file.open(QIODevice::WriteOnly); + if (!success) { + qWarning() << "ERROR: Couldn't save chat to file:" << file.fileName(); + continue; + } + QDataStream out(&file); + + out << (quint32)CHAT_FORMAT_MAGIC; + out << (qint32)CHAT_FORMAT_VERSION; + out.setVersion(QDataStream::Qt_6_2); + + qDebug() << "serializing chat" << fileName; + if (!chat->serialize(out, CHAT_FORMAT_VERSION)) { + qWarning() << "ERROR: Couldn't serialize chat to file:" << file.fileName(); + file.remove(); + } + file.close(); + } + qint64 elapsedTime = timer.elapsed(); + qDebug() << "serializing chats took:" << elapsedTime << "ms"; +} + +void ChatsRestoreThread::run() +{ + QElapsedTimer timer; + timer.start(); + struct FileInfo { + bool oldFile; + qint64 creationDate; + QString file; + }; + QList files; + { + // Look for any files in the original spot which was the settings config directory + QSettings settings; + QFileInfo settingsInfo(settings.fileName()); + QString settingsPath = settingsInfo.absolutePath(); + QDir dir(settingsPath); + dir.setNameFilters(QStringList() << "gpt4all-*.chat"); + QStringList fileNames = dir.entryList(); + for (QString f : fileNames) { + QString filePath = settingsPath + "/" + f; + QFile file(filePath); + bool success = 
file.open(QIODevice::ReadOnly); + if (!success) { + qWarning() << "ERROR: Couldn't restore chat from file:" << file.fileName(); + continue; + } + QDataStream in(&file); + FileInfo info; + info.oldFile = true; + info.file = filePath; + in >> info.creationDate; + files.append(info); + file.close(); + } + } + { + const QString savePath = Download::globalInstance()->downloadLocalModelsPath(); + QDir dir(savePath); + dir.setNameFilters(QStringList() << "gpt4all-*.chat"); + QStringList fileNames = dir.entryList(); + for (QString f : fileNames) { + QString filePath = savePath + "/" + f; + QFile file(filePath); + bool success = file.open(QIODevice::ReadOnly); + if (!success) { + qWarning() << "ERROR: Couldn't restore chat from file:" << file.fileName(); + continue; + } + QDataStream in(&file); + // Read and check the header + quint32 magic; + in >> magic; + if (magic != CHAT_FORMAT_MAGIC) { + qWarning() << "ERROR: Chat file has bad magic:" << file.fileName(); + continue; + } + + // Read the version + qint32 version; + in >> version; + if (version < 1) { + qWarning() << "ERROR: Chat file has non supported version:" << file.fileName(); + continue; + } + + if (version <= 1) + in.setVersion(QDataStream::Qt_6_2); + + FileInfo info; + info.oldFile = false; + info.file = filePath; + in >> info.creationDate; + files.append(info); + file.close(); + } + } + std::sort(files.begin(), files.end(), [](const FileInfo &a, const FileInfo &b) { + return a.creationDate > b.creationDate; + }); + + for (FileInfo &f : files) { + QFile file(f.file); + bool success = file.open(QIODevice::ReadOnly); + if (!success) { + qWarning() << "ERROR: Couldn't restore chat from file:" << file.fileName(); + continue; + } + QDataStream in(&file); + + qint32 version = 0; + if (!f.oldFile) { + // Read and check the header + quint32 magic; + in >> magic; + if (magic != CHAT_FORMAT_MAGIC) { + qWarning() << "ERROR: Chat file has bad magic:" << file.fileName(); + continue; + } + + // Read the version + in >> 
version; + if (version < 1) { + qWarning() << "ERROR: Chat file has non supported version:" << file.fileName(); + continue; + } + + if (version <= 1) + in.setVersion(QDataStream::Qt_6_2); + } + + qDebug() << "deserializing chat" << f.file; + + Chat *chat = new Chat; + chat->moveToThread(qApp->thread()); + if (!chat->deserialize(in, version)) { + qWarning() << "ERROR: Couldn't deserialize chat from file:" << file.fileName(); + file.remove(); + } else { + emit chatRestored(chat); + } + if (f.oldFile) + file.remove(); // No longer storing in this directory + file.close(); + } + + qint64 elapsedTime = timer.elapsed(); + qDebug() << "deserializing chats took:" << elapsedTime << "ms"; +} + +void ChatListModel::restoreChat(Chat *chat) +{ + chat->setParent(this); + connect(chat, &Chat::nameChanged, this, &ChatListModel::nameChanged); + connect(chat, &Chat::modelLoadingError, this, &ChatListModel::handleModelLoadingError); + + if (m_dummyChat) { + beginResetModel(); + m_chats = QList({chat}); + setCurrentChat(chat); + delete m_dummyChat; + m_dummyChat = nullptr; + endResetModel(); + } else { + beginInsertRows(QModelIndex(), m_chats.size(), m_chats.size()); + m_chats.append(chat); + endInsertRows(); + } +} + +void ChatListModel::chatsRestoredFinished() +{ + if (m_dummyChat) { + beginResetModel(); + Chat *dummy = m_dummyChat; + m_dummyChat = nullptr; + m_chats.clear(); + addChat(); + delete dummy; + endResetModel(); + } + + if (m_chats.isEmpty()) + addChat(); +} diff --git a/gpt4all-chat/chatlistmodel.h b/gpt4all-chat/chatlistmodel.h new file mode 100644 index 00000000..c695e05d --- /dev/null +++ b/gpt4all-chat/chatlistmodel.h @@ -0,0 +1,233 @@ +#ifndef CHATLISTMODEL_H +#define CHATLISTMODEL_H + +#include +#include "chat.h" + +class ChatsRestoreThread : public QThread +{ + Q_OBJECT +public: + void run() override; + +Q_SIGNALS: + void chatRestored(Chat *chat); +}; + +class ChatListModel : public QAbstractListModel +{ + Q_OBJECT + Q_PROPERTY(int count READ count NOTIFY 
countChanged) + Q_PROPERTY(Chat *currentChat READ currentChat WRITE setCurrentChat NOTIFY currentChatChanged) + Q_PROPERTY(bool shouldSaveChats READ shouldSaveChats WRITE setShouldSaveChats NOTIFY shouldSaveChatsChanged) + +public: + explicit ChatListModel(QObject *parent = nullptr); + + enum Roles { + IdRole = Qt::UserRole + 1, + NameRole + }; + + int rowCount(const QModelIndex &parent = QModelIndex()) const override + { + Q_UNUSED(parent) + return m_chats.size(); + } + + QVariant data(const QModelIndex &index, int role = Qt::DisplayRole) const override + { + if (!index.isValid() || index.row() < 0 || index.row() >= m_chats.size()) + return QVariant(); + + const Chat *item = m_chats.at(index.row()); + switch (role) { + case IdRole: + return item->id(); + case NameRole: + return item->name(); + } + + return QVariant(); + } + + QHash roleNames() const override + { + QHash roles; + roles[IdRole] = "id"; + roles[NameRole] = "name"; + return roles; + } + + bool shouldSaveChats() const; + void setShouldSaveChats(bool b); + + Q_INVOKABLE void addChat() + { + // Don't add a new chat if we already have one + if (m_newChat || m_dummyChat) + return; + + // Create a new chat pointer and connect it to determine when it is populated + m_newChat = new Chat(this); + connect(m_newChat->chatModel(), &ChatModel::countChanged, + this, &ChatListModel::newChatCountChanged); + connect(m_newChat, &Chat::nameChanged, + this, &ChatListModel::nameChanged); + + beginInsertRows(QModelIndex(), 0, 0); + m_chats.prepend(m_newChat); + endInsertRows(); + emit countChanged(); + setCurrentChat(m_newChat); + } + + Q_INVOKABLE void addDummyChat() + { + // Create a new dummy chat pointer and don't connect it + m_dummyChat = new Chat(this); + beginInsertRows(QModelIndex(), 0, 0); + m_chats.prepend(m_dummyChat); + endInsertRows(); + emit countChanged(); + m_currentChat = m_dummyChat; + emit currentChatChanged(); + } + + void setNewChat(Chat* chat) + { + // Don't add a new chat if we already have one + if 
(m_newChat) + return; + + m_newChat = chat; + connect(m_newChat->chatModel(), &ChatModel::countChanged, + this, &ChatListModel::newChatCountChanged); + connect(m_newChat, &Chat::nameChanged, + this, &ChatListModel::nameChanged); + connect(m_newChat, &Chat::modelLoadingError, + this, &ChatListModel::handleModelLoadingError); + setCurrentChat(m_newChat); + } + + Q_INVOKABLE void removeChat(Chat* chat) + { + if (!m_chats.contains(chat)) { + qWarning() << "WARNING: Removing chat failed with id" << chat->id(); + return; + } + + removeChatFile(chat); + + if (chat == m_newChat) { + m_newChat->disconnect(this); + m_newChat = nullptr; + } + + const int index = m_chats.indexOf(chat); + if (m_chats.count() < 2) { + addChat(); + } else { + int nextIndex; + if (index == m_chats.count() - 1) + nextIndex = index - 1; + else + nextIndex = index + 1; + Chat *nextChat = get(nextIndex); + Q_ASSERT(nextChat); + setCurrentChat(nextChat); + } + + const int newIndex = m_chats.indexOf(chat); + beginRemoveRows(QModelIndex(), newIndex, newIndex); + m_chats.removeAll(chat); + endRemoveRows(); + delete chat; + } + + Chat *currentChat() const + { + return m_currentChat; + } + + void setCurrentChat(Chat *chat) + { + if (!m_chats.contains(chat)) { + qWarning() << "ERROR: Setting current chat failed with id" << chat->id(); + return; + } + + if (m_currentChat && m_currentChat->isModelLoaded()) + m_currentChat->unloadModel(); + + m_currentChat = chat; + if (!m_currentChat->isModelLoaded()) + m_currentChat->reloadModel(); + emit currentChatChanged(); + } + + Q_INVOKABLE Chat* get(int index) + { + if (index < 0 || index >= m_chats.size()) return nullptr; + return m_chats.at(index); + } + + int count() const { return m_chats.size(); } + + void removeChatFile(Chat *chat) const; + void saveChats() const; + void restoreChat(Chat *chat); + void chatsRestoredFinished(); + +Q_SIGNALS: + void countChanged(); + void currentChatChanged(); + void shouldSaveChatsChanged(); + +private Q_SLOTS: + void 
newChatCountChanged() + { + Q_ASSERT(m_newChat && m_newChat->chatModel()->count()); + m_newChat->chatModel()->disconnect(this); + m_newChat = nullptr; + } + + void nameChanged() + { + Chat *chat = qobject_cast(sender()); + if (!chat) + return; + + int row = m_chats.indexOf(chat); + if (row < 0 || row >= m_chats.size()) + return; + + QModelIndex index = createIndex(row, 0); + emit dataChanged(index, index, {NameRole}); + } + + void handleModelLoadingError(const QString &error) + { + Chat *chat = qobject_cast(sender()); + qWarning() << "ERROR:" << qPrintable(error) << "id" << chat->id(); + removeChat(chat); + } + + void printChats() + { + for (auto c : m_chats) { + qDebug() << c->name() + << (c == m_currentChat ? "currentChat: true" : "currentChat: false") + << (c == m_newChat ? "newChat: true" : "newChat: false"); + } + } + +private: + bool m_shouldSaveChats; + Chat* m_newChat; + Chat* m_dummyChat; + Chat* m_currentChat; + QList m_chats; +}; + +#endif // CHATITEMMODEL_H diff --git a/gpt4all-chat/chatllm.cpp b/gpt4all-chat/chatllm.cpp new file mode 100644 index 00000000..2ffbc3c7 --- /dev/null +++ b/gpt4all-chat/chatllm.cpp @@ -0,0 +1,483 @@ +#include "chatllm.h" +#include "chat.h" +#include "download.h" +#include "network.h" +#include "llmodel/gptj.h" +#include "llmodel/llamamodel.h" +#include "llmodel/mpt.h" + +#include +#include +#include +#include +#include +#include +#include + +//#define DEBUG + +#define MPT_INTERNAL_STATE_VERSION 0 +#define GPTJ_INTERNAL_STATE_VERSION 0 +#define LLAMA_INTERNAL_STATE_VERSION 0 + +static QString modelFilePath(const QString &modelName) +{ + QString appPath = QCoreApplication::applicationDirPath() + + "/ggml-" + modelName + ".bin"; + QFileInfo infoAppPath(appPath); + if (infoAppPath.exists()) + return appPath; + + QString downloadPath = Download::globalInstance()->downloadLocalModelsPath() + + "/ggml-" + modelName + ".bin"; + + QFileInfo infoLocalPath(downloadPath); + if (infoLocalPath.exists()) + return downloadPath; + return 
QString(); +} + +ChatLLM::ChatLLM(Chat *parent) + : QObject{nullptr} + , m_llmodel(nullptr) + , m_promptResponseTokens(0) + , m_responseLogits(0) + , m_isRecalc(false) + , m_chat(parent) +{ + moveToThread(&m_llmThread); + connect(this, &ChatLLM::sendStartup, Network::globalInstance(), &Network::sendStartup); + connect(this, &ChatLLM::sendModelLoaded, Network::globalInstance(), &Network::sendModelLoaded); + connect(m_chat, &Chat::idChanged, this, &ChatLLM::handleChatIdChanged); + m_llmThread.setObjectName(m_chat->id()); + m_llmThread.start(); +} + +bool ChatLLM::loadDefaultModel() +{ + const QList models = m_chat->modelList(); + if (models.isEmpty()) { + // try again when we get a list of models + connect(Download::globalInstance(), &Download::modelListChanged, this, + &ChatLLM::loadDefaultModel, Qt::SingleShotConnection); + return false; + } + + QSettings settings; + settings.sync(); + // The user default model can be set by the user in the settings dialog. The "default" user + // default model is "Application default" which signals we should use the default model that was + // specified by the models.json file. 
+ QString defaultModel = settings.value("userDefaultModel").toString(); + if (defaultModel.isEmpty() || !models.contains(defaultModel) || defaultModel == "Application default") + defaultModel = settings.value("defaultModel").toString(); + if (defaultModel.isEmpty() || !models.contains(defaultModel)) + defaultModel = models.first(); + return loadModel(defaultModel); +} + +bool ChatLLM::loadModel(const QString &modelName) +{ + if (isModelLoaded() && m_modelName == modelName) + return true; + + if (isModelLoaded()) { + resetContextPrivate(); + delete m_llmodel; + m_llmodel = nullptr; + emit isModelLoadedChanged(); + } + + bool isGPTJ = false; + bool isMPT = false; + QString filePath = modelFilePath(modelName); + QFileInfo info(filePath); + if (info.exists()) { + + auto fin = std::ifstream(filePath.toStdString(), std::ios::binary); + uint32_t magic; + fin.read((char *) &magic, sizeof(magic)); + fin.seekg(0); + fin.close(); + isGPTJ = magic == 0x67676d6c; + isMPT = magic == 0x67676d6d; + if (isGPTJ) { + m_modelType = ModelType::GPTJ_; + m_llmodel = new GPTJ; + m_llmodel->loadModel(filePath.toStdString()); + } else if (isMPT) { + m_modelType = ModelType::MPT_; + m_llmodel = new MPT; + m_llmodel->loadModel(filePath.toStdString()); + } else { + m_modelType = ModelType::LLAMA_; + m_llmodel = new LLamaModel; + m_llmodel->loadModel(filePath.toStdString()); + } + + restoreState(); + +#if defined(DEBUG) + qDebug() << "chatllm modelLoadedChanged" << m_chat->id(); + fflush(stdout); +#endif + + emit isModelLoadedChanged(); + + static bool isFirstLoad = true; + if (isFirstLoad) { + emit sendStartup(); + isFirstLoad = false; + } else + emit sendModelLoaded(); + } else { + const QString error = QString("Could not find model %1").arg(modelName); + emit modelLoadingError(error); + } + + if (m_llmodel) + setModelName(info.completeBaseName().remove(0, 5)); // remove the ggml- prefix + + return m_llmodel; +} + +bool ChatLLM::isModelLoaded() const +{ + return m_llmodel && 
m_llmodel->isModelLoaded(); +} + +void ChatLLM::regenerateResponse() +{ + m_ctx.n_past -= m_promptResponseTokens; + m_ctx.n_past = std::max(0, m_ctx.n_past); + // FIXME: This does not seem to be needed in my testing and llama models don't to it. Remove? + m_ctx.logits.erase(m_ctx.logits.end() -= m_responseLogits, m_ctx.logits.end()); + m_ctx.tokens.erase(m_ctx.tokens.end() -= m_promptResponseTokens, m_ctx.tokens.end()); + m_promptResponseTokens = 0; + m_responseLogits = 0; + m_response = std::string(); + emit responseChanged(); +} + +void ChatLLM::resetResponse() +{ + m_promptResponseTokens = 0; + m_responseLogits = 0; + m_response = std::string(); + emit responseChanged(); +} + +void ChatLLM::resetContext() +{ + resetContextPrivate(); + emit sendResetContext(); +} + +void ChatLLM::resetContextPrivate() +{ + regenerateResponse(); + m_ctx = LLModel::PromptContext(); +} + +std::string remove_leading_whitespace(const std::string& input) { + auto first_non_whitespace = std::find_if(input.begin(), input.end(), [](unsigned char c) { + return !std::isspace(c); + }); + + return std::string(first_non_whitespace, input.end()); +} + +std::string trim_whitespace(const std::string& input) { + auto first_non_whitespace = std::find_if(input.begin(), input.end(), [](unsigned char c) { + return !std::isspace(c); + }); + + auto last_non_whitespace = std::find_if(input.rbegin(), input.rend(), [](unsigned char c) { + return !std::isspace(c); + }).base(); + + return std::string(first_non_whitespace, last_non_whitespace); +} + +QString ChatLLM::response() const +{ + return QString::fromStdString(remove_leading_whitespace(m_response)); +} + +QString ChatLLM::modelName() const +{ + return m_modelName; +} + +void ChatLLM::setModelName(const QString &modelName) +{ + m_modelName = modelName; + emit modelNameChanged(); +} + +void ChatLLM::modelNameChangeRequested(const QString &modelName) +{ + if (!loadModel(modelName)) + qWarning() << "ERROR: Could not load model" << modelName; +} + +bool 
ChatLLM::handlePrompt(int32_t token) +{ + // m_promptResponseTokens and m_responseLogits are related to last prompt/response not + // the entire context window which we can reset on regenerate prompt +#if defined(DEBUG) + qDebug() << "chatllm prompt process" << m_chat->id() << token; +#endif + ++m_promptResponseTokens; + return !m_stopGenerating; +} + +bool ChatLLM::handleResponse(int32_t token, const std::string &response) +{ +#if defined(DEBUG) + printf("%s", response.c_str()); + fflush(stdout); +#endif + + // check for error + if (token < 0) { + m_response.append(response); + emit responseChanged(); + return false; + } + + // m_promptResponseTokens and m_responseLogits are related to last prompt/response not + // the entire context window which we can reset on regenerate prompt + ++m_promptResponseTokens; + Q_ASSERT(!response.empty()); + m_response.append(response); + emit responseChanged(); + return !m_stopGenerating; +} + +bool ChatLLM::handleRecalculate(bool isRecalc) +{ + if (m_isRecalc != isRecalc) { + m_isRecalc = isRecalc; + emit recalcChanged(); + } + return !m_stopGenerating; +} + +bool ChatLLM::prompt(const QString &prompt, const QString &prompt_template, int32_t n_predict, int32_t top_k, + float top_p, float temp, int32_t n_batch, float repeat_penalty, int32_t repeat_penalty_tokens, int n_threads) +{ + if (!isModelLoaded()) + return false; + + QString instructPrompt = prompt_template.arg(prompt); + + m_stopGenerating = false; + auto promptFunc = std::bind(&ChatLLM::handlePrompt, this, std::placeholders::_1); + auto responseFunc = std::bind(&ChatLLM::handleResponse, this, std::placeholders::_1, + std::placeholders::_2); + auto recalcFunc = std::bind(&ChatLLM::handleRecalculate, this, std::placeholders::_1); + emit responseStarted(); + qint32 logitsBefore = m_ctx.logits.size(); + m_ctx.n_predict = n_predict; + m_ctx.top_k = top_k; + m_ctx.top_p = top_p; + m_ctx.temp = temp; + m_ctx.n_batch = n_batch; + m_ctx.repeat_penalty = repeat_penalty; + 
m_ctx.repeat_last_n = repeat_penalty_tokens; + m_llmodel->setThreadCount(n_threads); +#if defined(DEBUG) + printf("%s", qPrintable(instructPrompt)); + fflush(stdout); +#endif + m_llmodel->prompt(instructPrompt.toStdString(), promptFunc, responseFunc, recalcFunc, m_ctx); +#if defined(DEBUG) + printf("\n"); + fflush(stdout); +#endif + m_responseLogits += m_ctx.logits.size() - logitsBefore; + std::string trimmed = trim_whitespace(m_response); + if (trimmed != m_response) { + m_response = trimmed; + emit responseChanged(); + } + emit responseStopped(); + return true; +} + +void ChatLLM::unloadModel() +{ +#if defined(DEBUG) + qDebug() << "chatllm unloadModel" << m_chat->id(); +#endif + saveState(); + delete m_llmodel; + m_llmodel = nullptr; + emit isModelLoadedChanged(); +} + +void ChatLLM::reloadModel(const QString &modelName) +{ +#if defined(DEBUG) + qDebug() << "chatllm reloadModel" << m_chat->id(); +#endif + if (modelName.isEmpty()) { + loadDefaultModel(); + } else { + loadModel(modelName); + } +} + +void ChatLLM::generateName() +{ + Q_ASSERT(isModelLoaded()); + if (!isModelLoaded()) + return; + + QString instructPrompt("### Instruction:\n" + "Describe response above in three words.\n" + "### Response:\n"); + auto promptFunc = std::bind(&ChatLLM::handleNamePrompt, this, std::placeholders::_1); + auto responseFunc = std::bind(&ChatLLM::handleNameResponse, this, std::placeholders::_1, + std::placeholders::_2); + auto recalcFunc = std::bind(&ChatLLM::handleNameRecalculate, this, std::placeholders::_1); + LLModel::PromptContext ctx = m_ctx; +#if defined(DEBUG) + printf("%s", qPrintable(instructPrompt)); + fflush(stdout); +#endif + m_llmodel->prompt(instructPrompt.toStdString(), promptFunc, responseFunc, recalcFunc, ctx); +#if defined(DEBUG) + printf("\n"); + fflush(stdout); +#endif + std::string trimmed = trim_whitespace(m_nameResponse); + if (trimmed != m_nameResponse) { + m_nameResponse = trimmed; + emit generatedNameChanged(); + } +} + +void 
ChatLLM::handleChatIdChanged() +{ + m_llmThread.setObjectName(m_chat->id()); +} + +bool ChatLLM::handleNamePrompt(int32_t token) +{ + Q_UNUSED(token); + qt_noop(); + return true; +} + +bool ChatLLM::handleNameResponse(int32_t token, const std::string &response) +{ + Q_UNUSED(token); + + m_nameResponse.append(response); + emit generatedNameChanged(); + QString gen = QString::fromStdString(m_nameResponse).simplified(); + QStringList words = gen.split(' ', Qt::SkipEmptyParts); + int wordCount = words.size(); + return words.size() <= 3; +} + +bool ChatLLM::handleNameRecalculate(bool isRecalc) +{ + Q_UNUSED(isRecalc); + Q_UNREACHABLE(); + return true; +} + +bool ChatLLM::serialize(QDataStream &stream, int version) +{ + if (version > 1) { + stream << m_modelType; + switch (m_modelType) { + case MPT_: stream << MPT_INTERNAL_STATE_VERSION; break; + case GPTJ_: stream << GPTJ_INTERNAL_STATE_VERSION; break; + case LLAMA_: stream << LLAMA_INTERNAL_STATE_VERSION; break; + default: Q_UNREACHABLE(); + } + } + stream << response(); + stream << generatedName(); + stream << m_promptResponseTokens; + stream << m_responseLogits; + stream << m_ctx.n_past; + stream << quint64(m_ctx.logits.size()); + stream.writeRawData(reinterpret_cast(m_ctx.logits.data()), m_ctx.logits.size() * sizeof(float)); + stream << quint64(m_ctx.tokens.size()); + stream.writeRawData(reinterpret_cast(m_ctx.tokens.data()), m_ctx.tokens.size() * sizeof(int)); + saveState(); + QByteArray compressed = qCompress(m_state); + stream << compressed; +#if defined(DEBUG) + qDebug() << "chatllm serialize" << m_chat->id() << m_state.size(); +#endif + return stream.status() == QDataStream::Ok; +} + +bool ChatLLM::deserialize(QDataStream &stream, int version) +{ + if (version > 1) { + int internalStateVersion; + stream >> m_modelType; + stream >> internalStateVersion; // for future use + } + QString response; + stream >> response; + m_response = response.toStdString(); + QString nameResponse; + stream >> nameResponse; + 
m_nameResponse = nameResponse.toStdString(); + stream >> m_promptResponseTokens; + stream >> m_responseLogits; + stream >> m_ctx.n_past; + quint64 logitsSize; + stream >> logitsSize; + m_ctx.logits.resize(logitsSize); + stream.readRawData(reinterpret_cast(m_ctx.logits.data()), logitsSize * sizeof(float)); + quint64 tokensSize; + stream >> tokensSize; + m_ctx.tokens.resize(tokensSize); + stream.readRawData(reinterpret_cast(m_ctx.tokens.data()), tokensSize * sizeof(int)); + if (version > 0) { + QByteArray compressed; + stream >> compressed; + m_state = qUncompress(compressed); + } else { + stream >> m_state; + } +#if defined(DEBUG) + qDebug() << "chatllm deserialize" << m_chat->id(); +#endif + return stream.status() == QDataStream::Ok; +} + +void ChatLLM::saveState() +{ + if (!isModelLoaded()) + return; + + const size_t stateSize = m_llmodel->stateSize(); + m_state.resize(stateSize); +#if defined(DEBUG) + qDebug() << "chatllm saveState" << m_chat->id() << "size:" << m_state.size(); +#endif + m_llmodel->saveState(static_cast(reinterpret_cast(m_state.data()))); +} + +void ChatLLM::restoreState() +{ + if (!isModelLoaded() || m_state.isEmpty()) + return; + +#if defined(DEBUG) + qDebug() << "chatllm restoreState" << m_chat->id() << "size:" << m_state.size(); +#endif + m_llmodel->restoreState(static_cast(reinterpret_cast(m_state.data()))); + m_state.clear(); + m_state.resize(0); +} diff --git a/gpt4all-chat/chatllm.h b/gpt4all-chat/chatllm.h new file mode 100644 index 00000000..bb488b16 --- /dev/null +++ b/gpt4all-chat/chatllm.h @@ -0,0 +1,100 @@ +#ifndef CHATLLM_H +#define CHATLLM_H + +#include +#include + +#include "llmodel/llmodel.h" + +class Chat; +class ChatLLM : public QObject +{ + Q_OBJECT + Q_PROPERTY(bool isModelLoaded READ isModelLoaded NOTIFY isModelLoadedChanged) + Q_PROPERTY(QString response READ response NOTIFY responseChanged) + Q_PROPERTY(QString modelName READ modelName WRITE setModelName NOTIFY modelNameChanged) + Q_PROPERTY(bool isRecalc READ isRecalc 
NOTIFY recalcChanged) + Q_PROPERTY(QString generatedName READ generatedName NOTIFY generatedNameChanged) + +public: + enum ModelType { + MPT_, + GPTJ_, + LLAMA_ + }; + + ChatLLM(Chat *parent); + + bool isModelLoaded() const; + void regenerateResponse(); + void resetResponse(); + void resetContext(); + + void stopGenerating() { m_stopGenerating = true; } + + QString response() const; + QString modelName() const; + + void setModelName(const QString &modelName); + + bool isRecalc() const { return m_isRecalc; } + + QString generatedName() const { return QString::fromStdString(m_nameResponse); } + + bool serialize(QDataStream &stream, int version); + bool deserialize(QDataStream &stream, int version); + +public Q_SLOTS: + bool prompt(const QString &prompt, const QString &prompt_template, int32_t n_predict, + int32_t top_k, float top_p, float temp, int32_t n_batch, float repeat_penalty, int32_t repeat_penalty_tokens, + int32_t n_threads); + bool loadDefaultModel(); + bool loadModel(const QString &modelName); + void modelNameChangeRequested(const QString &modelName); + void unloadModel(); + void reloadModel(const QString &modelName); + void generateName(); + void handleChatIdChanged(); + +Q_SIGNALS: + void isModelLoadedChanged(); + void modelLoadingError(const QString &error); + void responseChanged(); + void responseStarted(); + void responseStopped(); + void modelNameChanged(); + void recalcChanged(); + void sendStartup(); + void sendModelLoaded(); + void sendResetContext(); + void generatedNameChanged(); + void stateChanged(); + +private: + void resetContextPrivate(); + bool handlePrompt(int32_t token); + bool handleResponse(int32_t token, const std::string &response); + bool handleRecalculate(bool isRecalc); + bool handleNamePrompt(int32_t token); + bool handleNameResponse(int32_t token, const std::string &response); + bool handleNameRecalculate(bool isRecalc); + void saveState(); + void restoreState(); + +private: + LLModel::PromptContext m_ctx; + LLModel *m_llmodel; 
+ std::string m_response; + std::string m_nameResponse; + quint32 m_promptResponseTokens; + quint32 m_responseLogits; + QString m_modelName; + ModelType m_modelType; + Chat *m_chat; + QByteArray m_state; + QThread m_llmThread; + std::atomic m_stopGenerating; + bool m_isRecalc; +}; + +#endif // CHATLLM_H diff --git a/gpt4all-chat/chatmodel.h b/gpt4all-chat/chatmodel.h new file mode 100644 index 00000000..e3c01a9a --- /dev/null +++ b/gpt4all-chat/chatmodel.h @@ -0,0 +1,261 @@ +#ifndef CHATMODEL_H +#define CHATMODEL_H + +#include +#include +#include + +struct ChatItem +{ + Q_GADGET + Q_PROPERTY(int id MEMBER id) + Q_PROPERTY(QString name MEMBER name) + Q_PROPERTY(QString value MEMBER value) + Q_PROPERTY(QString prompt MEMBER prompt) + Q_PROPERTY(QString newResponse MEMBER newResponse) + Q_PROPERTY(bool currentResponse MEMBER currentResponse) + Q_PROPERTY(bool stopped MEMBER stopped) + Q_PROPERTY(bool thumbsUpState MEMBER thumbsUpState) + Q_PROPERTY(bool thumbsDownState MEMBER thumbsDownState) + +public: + int id = 0; + QString name; + QString value; + QString prompt; + QString newResponse; + bool currentResponse = false; + bool stopped = false; + bool thumbsUpState = false; + bool thumbsDownState = false; +}; +Q_DECLARE_METATYPE(ChatItem) + +class ChatModel : public QAbstractListModel +{ + Q_OBJECT + Q_PROPERTY(int count READ count NOTIFY countChanged) + +public: + explicit ChatModel(QObject *parent = nullptr) : QAbstractListModel(parent) {} + + enum Roles { + IdRole = Qt::UserRole + 1, + NameRole, + ValueRole, + PromptRole, + NewResponseRole, + CurrentResponseRole, + StoppedRole, + ThumbsUpStateRole, + ThumbsDownStateRole + }; + + int rowCount(const QModelIndex &parent = QModelIndex()) const override + { + Q_UNUSED(parent) + return m_chatItems.size(); + } + + QVariant data(const QModelIndex &index, int role = Qt::DisplayRole) const override + { + if (!index.isValid() || index.row() < 0 || index.row() >= m_chatItems.size()) + return QVariant(); + + const ChatItem 
&item = m_chatItems.at(index.row()); + switch (role) { + case IdRole: + return item.id; + case NameRole: + return item.name; + case ValueRole: + return item.value; + case PromptRole: + return item.prompt; + case NewResponseRole: + return item.newResponse; + case CurrentResponseRole: + return item.currentResponse; + case StoppedRole: + return item.stopped; + case ThumbsUpStateRole: + return item.thumbsUpState; + case ThumbsDownStateRole: + return item.thumbsDownState; + } + + return QVariant(); + } + + QHash roleNames() const override + { + QHash roles; + roles[IdRole] = "id"; + roles[NameRole] = "name"; + roles[ValueRole] = "value"; + roles[PromptRole] = "prompt"; + roles[NewResponseRole] = "newResponse"; + roles[CurrentResponseRole] = "currentResponse"; + roles[StoppedRole] = "stopped"; + roles[ThumbsUpStateRole] = "thumbsUpState"; + roles[ThumbsDownStateRole] = "thumbsDownState"; + return roles; + } + + void appendPrompt(const QString &name, const QString &value) + { + ChatItem item; + item.name = name; + item.value = value; + beginInsertRows(QModelIndex(), m_chatItems.size(), m_chatItems.size()); + m_chatItems.append(item); + endInsertRows(); + emit countChanged(); + } + + void appendResponse(const QString &name, const QString &prompt) + { + ChatItem item; + item.id = m_chatItems.count(); // This is only relevant for responses + item.name = name; + item.prompt = prompt; + item.currentResponse = true; + beginInsertRows(QModelIndex(), m_chatItems.size(), m_chatItems.size()); + m_chatItems.append(item); + endInsertRows(); + emit countChanged(); + } + + Q_INVOKABLE void clear() + { + if (m_chatItems.isEmpty()) return; + + beginResetModel(); + m_chatItems.clear(); + endResetModel(); + emit countChanged(); + } + + Q_INVOKABLE ChatItem get(int index) + { + if (index < 0 || index >= m_chatItems.size()) return ChatItem(); + return m_chatItems.at(index); + } + + Q_INVOKABLE void updateCurrentResponse(int index, bool b) + { + if (index < 0 || index >= m_chatItems.size()) 
return; + + ChatItem &item = m_chatItems[index]; + if (item.currentResponse != b) { + item.currentResponse = b; + emit dataChanged(createIndex(index, 0), createIndex(index, 0), {CurrentResponseRole}); + } + } + + Q_INVOKABLE void updateStopped(int index, bool b) + { + if (index < 0 || index >= m_chatItems.size()) return; + + ChatItem &item = m_chatItems[index]; + if (item.stopped != b) { + item.stopped = b; + emit dataChanged(createIndex(index, 0), createIndex(index, 0), {StoppedRole}); + } + } + + Q_INVOKABLE void updateValue(int index, const QString &value) + { + if (index < 0 || index >= m_chatItems.size()) return; + + ChatItem &item = m_chatItems[index]; + if (item.value != value) { + item.value = value; + emit dataChanged(createIndex(index, 0), createIndex(index, 0), {ValueRole}); + } + } + + Q_INVOKABLE void updateThumbsUpState(int index, bool b) + { + if (index < 0 || index >= m_chatItems.size()) return; + + ChatItem &item = m_chatItems[index]; + if (item.thumbsUpState != b) { + item.thumbsUpState = b; + emit dataChanged(createIndex(index, 0), createIndex(index, 0), {ThumbsUpStateRole}); + } + } + + Q_INVOKABLE void updateThumbsDownState(int index, bool b) + { + if (index < 0 || index >= m_chatItems.size()) return; + + ChatItem &item = m_chatItems[index]; + if (item.thumbsDownState != b) { + item.thumbsDownState = b; + emit dataChanged(createIndex(index, 0), createIndex(index, 0), {ThumbsDownStateRole}); + } + } + + Q_INVOKABLE void updateNewResponse(int index, const QString &newResponse) + { + if (index < 0 || index >= m_chatItems.size()) return; + + ChatItem &item = m_chatItems[index]; + if (item.newResponse != newResponse) { + item.newResponse = newResponse; + emit dataChanged(createIndex(index, 0), createIndex(index, 0), {NewResponseRole}); + } + } + + int count() const { return m_chatItems.size(); } + + bool serialize(QDataStream &stream, int version) const + { + stream << count(); + for (auto c : m_chatItems) { + stream << c.id; + stream << c.name; + 
stream << c.value; + stream << c.prompt; + stream << c.newResponse; + stream << c.currentResponse; + stream << c.stopped; + stream << c.thumbsUpState; + stream << c.thumbsDownState; + } + return stream.status() == QDataStream::Ok; + } + + bool deserialize(QDataStream &stream, int version) + { + int size; + stream >> size; + for (int i = 0; i < size; ++i) { + ChatItem c; + stream >> c.id; + stream >> c.name; + stream >> c.value; + stream >> c.prompt; + stream >> c.newResponse; + stream >> c.currentResponse; + stream >> c.stopped; + stream >> c.thumbsUpState; + stream >> c.thumbsDownState; + beginInsertRows(QModelIndex(), m_chatItems.size(), m_chatItems.size()); + m_chatItems.append(c); + endInsertRows(); + } + emit countChanged(); + return stream.status() == QDataStream::Ok; + } + +Q_SIGNALS: + void countChanged(); + +private: + + QList m_chatItems; +}; + +#endif // CHATMODEL_H diff --git a/gpt4all-chat/cmake/config.h.in b/gpt4all-chat/cmake/config.h.in new file mode 100644 index 00000000..e578a82d --- /dev/null +++ b/gpt4all-chat/cmake/config.h.in @@ -0,0 +1,7 @@ +#ifndef CONFIG_H +#define CONFIG_H + +#define APP_VERSION "@APP_VERSION@" +#define GPT4ALL_AVX_ONLY "@GPT4ALL_AVX_ONLY@" + +#endif // CONFIG_H diff --git a/gpt4all-chat/cmake/deploy-qt-linux.cmake.in b/gpt4all-chat/cmake/deploy-qt-linux.cmake.in new file mode 100644 index 00000000..8c4240f1 --- /dev/null +++ b/gpt4all-chat/cmake/deploy-qt-linux.cmake.in @@ -0,0 +1,12 @@ +set(LINUXDEPLOYQT "@LINUXDEPLOYQT@") +set(COMPONENT_NAME_MAIN "@COMPONENT_NAME_MAIN@") +set(CMAKE_CURRENT_SOURCE_DIR "@CMAKE_CURRENT_SOURCE_DIR@") +set(DATA_DIR ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) +set(BIN_DIR ${DATA_DIR}/bin) +set(Qt6_ROOT_DIR "@Qt6_ROOT_DIR@") +set(ENV{LD_LIBRARY_PATH} "${BIN_DIR}:${Qt6_ROOT_DIR}/../lib/") +execute_process(COMMAND ${LINUXDEPLOYQT} ${BIN_DIR}/chat -qmldir=${CMAKE_CURRENT_SOURCE_DIR} -bundle-non-qt-libs -qmake=${Qt6_ROOT_DIR}/bin/qmake -verbose=2) +file(COPY 
"${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-32.png" + DESTINATION ${DATA_DIR}) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-48.png" + DESTINATION ${DATA_DIR}) diff --git a/gpt4all-chat/cmake/deploy-qt-mac.cmake.in b/gpt4all-chat/cmake/deploy-qt-mac.cmake.in new file mode 100644 index 00000000..f6ceb718 --- /dev/null +++ b/gpt4all-chat/cmake/deploy-qt-mac.cmake.in @@ -0,0 +1,16 @@ +set(MACDEPLOYQT "@MACDEPLOYQT@") +set(COMPONENT_NAME_MAIN "@COMPONENT_NAME_MAIN@") +set(CMAKE_CURRENT_SOURCE_DIR "@CMAKE_CURRENT_SOURCE_DIR@") +execute_process(COMMAND ${MACDEPLOYQT} ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin/gpt4all.app -qmldir=${CMAKE_CURRENT_SOURCE_DIR} -verbose=2) +file(COPY ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/lib/libllama.dylib + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin/gpt4all.app/Contents/Frameworks) +file(COPY ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/lib/libllmodel.dylib + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin/gpt4all.app/Contents/Frameworks) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/favicon.icns" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin/gpt4all.app/Contents/Resources) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-32.png" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-48.png" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/favicon.icns" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) diff --git a/gpt4all-chat/cmake/deploy-qt-windows.cmake.in b/gpt4all-chat/cmake/deploy-qt-windows.cmake.in new file mode 100644 index 00000000..80493951 --- /dev/null +++ 
b/gpt4all-chat/cmake/deploy-qt-windows.cmake.in @@ -0,0 +1,14 @@ +set(WINDEPLOYQT "@WINDEPLOYQT@") +set(COMPONENT_NAME_MAIN "@COMPONENT_NAME_MAIN@") +set(CMAKE_CURRENT_SOURCE_DIR "@CMAKE_CURRENT_SOURCE_DIR@") +execute_process(COMMAND ${WINDEPLOYQT} --qmldir ${CMAKE_CURRENT_SOURCE_DIR} ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin) +file(COPY ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/lib/libllama.dll + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin) +file(COPY ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/lib/libllmodel.dll + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data/bin) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-32.png" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/logo-48.png" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) +file(COPY "${CMAKE_CURRENT_SOURCE_DIR}/icons/favicon.ico" + DESTINATION ${CPACK_TEMPORARY_INSTALL_DIRECTORY}/packages/${COMPONENT_NAME_MAIN}/data) diff --git a/gpt4all-chat/cmake/installerscript.qs b/gpt4all-chat/cmake/installerscript.qs new file mode 100644 index 00000000..841e1e52 --- /dev/null +++ b/gpt4all-chat/cmake/installerscript.qs @@ -0,0 +1,68 @@ +function Component() { +} + +var targetDirectory; +Component.prototype.beginInstallation = function() { + targetDirectory = installer.value("TargetDir"); +}; + +Component.prototype.createOperations = function() +{ + try { + // call the base create operations function + component.createOperations(); + if (systemInfo.productType === "windows") { + try { + var userProfile = installer.environmentVariable("USERPROFILE"); + installer.setValue("UserProfile", userProfile); + component.addOperation("CreateShortcut", + targetDirectory + "/bin/chat.exe", + 
"@UserProfile@/Desktop/GPT4All.lnk", + "workingDirectory=" + targetDirectory + "/bin", + "iconPath=" + targetDirectory + "/favicon.ico", + "iconId=0", "description=Open GPT4All"); + } catch (e) { + print("ERROR: creating desktop shortcut" + e); + } + component.addOperation("CreateShortcut", + targetDirectory + "/bin/chat.exe", + "@StartMenuDir@/GPT4All.lnk", + "workingDirectory=" + targetDirectory + "/bin", + "iconPath=" + targetDirectory + "/favicon.ico", + "iconId=0", "description=Open GPT4All"); + } else if (systemInfo.productType === "osx") { + var gpt4allAppPath = targetDirectory + "/bin/gpt4all.app"; + var symlinkPath = targetDirectory + "/../GPT4All.app"; + // Remove the symlink if it already exists + component.addOperation("Execute", "rm", "-f", symlinkPath); + // Create the symlink + component.addOperation("Execute", "ln", "-s", gpt4allAppPath, symlinkPath); + } else { // linux + var homeDir = installer.environmentVariable("HOME"); + if (!installer.fileExists(homeDir + "/Desktop/GPT4All.desktop")) { + component.addOperation("CreateDesktopEntry", + homeDir + "/Desktop/GPT4All.desktop", + "Type=Application\nTerminal=false\nExec=\"" + targetDirectory + + "/bin/chat\"\nName=GPT4All\nIcon=" + targetDirectory + + "/logo-48.png\nName[en_US]=GPT4All"); + } + } + } catch (e) { + print("ERROR: running post installscript.qs" + e); + } +} + +Component.prototype.createOperationsForArchive = function(archive) +{ + component.createOperationsForArchive(archive); + + if (systemInfo.productType === "osx") { + var uninstallTargetDirectory = installer.value("TargetDir"); + var symlinkPath = uninstallTargetDirectory + "/../GPT4All.app"; + + // Remove the symlink during uninstallation + if (installer.isUninstaller()) { + component.addOperation("Execute", "rm", "-f", symlinkPath, "UNDOEXECUTE"); + } + } +} diff --git a/gpt4all-chat/cmake/sign_dmg.py b/gpt4all-chat/cmake/sign_dmg.py new file mode 100644 index 00000000..c448db36 --- /dev/null +++ b/gpt4all-chat/cmake/sign_dmg.py 
@@ -0,0 +1,81 @@ +import os +import subprocess +import tempfile +import shutil +import click +from typing import Optional + +# Requires click +# pip install click + +# Example usage +# python sign_dmg.py --input-dmg /path/to/your/input.dmg --output-dmg /path/to/your/output.dmg --signing-identity "Developer ID Application: YOUR_NAME (TEAM_ID)" + +# NOTE: This script assumes that you have the necessary Developer ID Application certificate in your +# Keychain Access and that the codesign and hdiutil command-line tools are available on your system. + +@click.command() +@click.option('--input-dmg', required=True, help='Path to the input DMG file.') +@click.option('--output-dmg', required=True, help='Path to the output signed DMG file.') +@click.option('--sha1-hash', help='SHA-1 hash of the Developer ID Application certificate') +@click.option('--signing-identity', default=None, help='Common name of the Developer ID Application certificate') +def sign_dmg(input_dmg: str, output_dmg: str, signing_identity: Optional[str] = None, sha1_hash: Optional[str] = None) -> None: + if not signing_identity and not sha1_hash: + print("Error: Either --signing-identity or --sha1-hash must be provided.") + exit(1) + + # Mount the input DMG + mount_point = tempfile.mkdtemp() + subprocess.run(['hdiutil', 'attach', input_dmg, '-mountpoint', mount_point]) + + # Copy the contents of the DMG to a temporary folder + temp_dir = tempfile.mkdtemp() + shutil.copytree(mount_point, os.path.join(temp_dir, 'contents')) + subprocess.run(['hdiutil', 'detach', mount_point]) + + # Find the .app bundle in the temporary folder + app_bundle = None + for item in os.listdir(os.path.join(temp_dir, 'contents')): + if item.endswith('.app'): + app_bundle = os.path.join(temp_dir, 'contents', item) + break + + if not app_bundle: + print('No .app bundle found in the DMG.') + exit(1) + + # Sign the .app bundle + try: + subprocess.run([ + 'codesign', + '--deep', + '--force', + '--verbose', + '--options', 'runtime', + 
'--timestamp', + '--sign', sha1_hash or signing_identity, + app_bundle + ], check=True) + except subprocess.CalledProcessError as e: + print(f"Error during codesign: {e}") + # Clean up temporary directories + shutil.rmtree(temp_dir) + shutil.rmtree(mount_point) + exit(1) + + # Create a new DMG containing the signed .app bundle + subprocess.run([ + 'hdiutil', 'create', + '-volname', os.path.splitext(os.path.basename(input_dmg))[0], + '-srcfolder', os.path.join(temp_dir, 'contents'), + '-ov', + '-format', 'UDZO', + output_dmg + ]) + + # Clean up temporary directories + shutil.rmtree(temp_dir) + shutil.rmtree(mount_point) + +if __name__ == '__main__': + sign_dmg() diff --git a/gpt4all-chat/download.cpp b/gpt4all-chat/download.cpp new file mode 100644 index 00000000..736c8fa1 --- /dev/null +++ b/gpt4all-chat/download.cpp @@ -0,0 +1,600 @@ +#include "download.h" +#include "network.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +class MyDownload: public Download { }; +Q_GLOBAL_STATIC(MyDownload, downloadInstance) +Download *Download::globalInstance() +{ + return downloadInstance(); +} + +Download::Download() + : QObject(nullptr) + , m_hashAndSave(new HashAndSaveFile) +{ + connect(this, &Download::requestHashAndSave, m_hashAndSave, + &HashAndSaveFile::hashAndSave, Qt::QueuedConnection); + connect(m_hashAndSave, &HashAndSaveFile::hashAndSaveFinished, this, + &Download::handleHashAndSaveFinished, Qt::QueuedConnection); + connect(&m_networkManager, &QNetworkAccessManager::sslErrors, this, + &Download::handleSslErrors); + connect(this, &Download::downloadLocalModelsPathChanged, this, &Download::updateModelList); + updateModelList(); + updateReleaseNotes(); + QSettings settings; + settings.sync(); + m_downloadLocalModelsPath = settings.value("modelPath", + defaultLocalModelsPath()).toString(); + m_startTime = QDateTime::currentDateTime(); +} + +bool operator==(const ModelInfo& lhs, const ModelInfo& rhs) { + return 
lhs.filename == rhs.filename && lhs.md5sum == rhs.md5sum; +} + +bool operator==(const ReleaseInfo& lhs, const ReleaseInfo& rhs) { + return lhs.version == rhs.version; +} + +bool compareVersions(const QString &a, const QString &b) { + QStringList aParts = a.split('.'); + QStringList bParts = b.split('.'); + + for (int i = 0; i < std::min(aParts.size(), bParts.size()); ++i) { + int aInt = aParts[i].toInt(); + int bInt = bParts[i].toInt(); + + if (aInt > bInt) { + return true; + } else if (aInt < bInt) { + return false; + } + } + + return aParts.size() > bParts.size(); +} + +QList Download::modelList() const +{ + // We make sure the default model is listed first + QList values = m_modelMap.values(); + ModelInfo defaultInfo; + ModelInfo bestGPTJInfo; + ModelInfo bestLlamaInfo; + ModelInfo bestMPTInfo; + QList filtered; + for (ModelInfo v : values) { + if (v.isDefault) + defaultInfo = v; + if (v.bestGPTJ) + bestGPTJInfo = v; + if (v.bestLlama) + bestLlamaInfo = v; + if (v.bestMPT) + bestMPTInfo = v; + filtered.append(v); + } + + Q_ASSERT(defaultInfo == bestGPTJInfo || defaultInfo == bestLlamaInfo || defaultInfo == bestMPTInfo); + + if (bestLlamaInfo.bestLlama) { + filtered.removeAll(bestLlamaInfo); + filtered.prepend(bestLlamaInfo); + } + + if (bestGPTJInfo.bestGPTJ) { + filtered.removeAll(bestGPTJInfo); + filtered.prepend(bestGPTJInfo); + } + + if (bestMPTInfo.bestMPT) { + filtered.removeAll(bestMPTInfo); + filtered.prepend(bestMPTInfo); + } + + return filtered; +} + +ReleaseInfo Download::releaseInfo() const +{ + const QString currentVersion = QCoreApplication::applicationVersion(); + if (m_releaseMap.contains(currentVersion)) + return m_releaseMap.value(currentVersion); + return ReleaseInfo(); +} + +bool Download::hasNewerRelease() const +{ + const QString currentVersion = QCoreApplication::applicationVersion(); + QList versions = m_releaseMap.keys(); + std::sort(versions.begin(), versions.end(), compareVersions); + if (versions.isEmpty()) + return false; + return 
compareVersions(versions.first(), currentVersion); +} + +QString Download::downloadLocalModelsPath() const { + return m_downloadLocalModelsPath; +} + +void Download::setDownloadLocalModelsPath(const QString &modelPath) { + QString filePath = (modelPath.startsWith("file://") ? + QUrl(modelPath).toLocalFile() : modelPath); + QString canonical = QFileInfo(filePath).canonicalFilePath() + "/"; + if (m_downloadLocalModelsPath != canonical) { + m_downloadLocalModelsPath = canonical; + emit downloadLocalModelsPathChanged(); + } +} + +bool Download::isFirstStart() const +{ + QSettings settings; + settings.sync(); + QString lastVersionStarted = settings.value("download/lastVersionStarted").toString(); + bool first = lastVersionStarted != QCoreApplication::applicationVersion(); + settings.setValue("download/lastVersionStarted", QCoreApplication::applicationVersion()); + settings.sync(); + return first; +} + +QString Download::incompleteDownloadPath(const QString &modelFile) { + QString downloadPath = downloadLocalModelsPath() + "incomplete-" + + modelFile; + return downloadPath; +} + +QString Download::defaultLocalModelsPath() const +{ + QString localPath = QStandardPaths::writableLocation(QStandardPaths::AppLocalDataLocation) + + "/"; + QString testWritePath = localPath + QString("test_write.txt"); + QString canonicalLocalPath = QFileInfo(localPath).canonicalFilePath() + "/"; + QDir localDir(localPath); + if (!localDir.exists()) { + if (!localDir.mkpath(localPath)) { + qWarning() << "ERROR: Local download directory can't be created:" << canonicalLocalPath; + return canonicalLocalPath; + } + } + + if (QFileInfo::exists(testWritePath)) + return canonicalLocalPath; + + QFile testWriteFile(testWritePath); + if (testWriteFile.open(QIODeviceBase::ReadWrite)) { + testWriteFile.close(); + return canonicalLocalPath; + } + + qWarning() << "ERROR: Local download path appears not writeable:" << canonicalLocalPath; + return canonicalLocalPath; +} + +void Download::updateModelList() +{ + 
QUrl jsonUrl("http://gpt4all.io/models/models.json"); + QNetworkRequest request(jsonUrl); + QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + QNetworkReply *jsonReply = m_networkManager.get(request); + connect(jsonReply, &QNetworkReply::finished, this, &Download::handleModelsJsonDownloadFinished); +} + +void Download::updateReleaseNotes() +{ + QUrl jsonUrl("http://gpt4all.io/meta/release.json"); + QNetworkRequest request(jsonUrl); + QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + QNetworkReply *jsonReply = m_networkManager.get(request); + connect(jsonReply, &QNetworkReply::finished, this, &Download::handleReleaseJsonDownloadFinished); +} + +void Download::downloadModel(const QString &modelFile) +{ + QFile *tempFile = new QFile(incompleteDownloadPath(modelFile)); + QDateTime modTime = tempFile->fileTime(QFile::FileModificationTime); + bool success = tempFile->open(QIODevice::WriteOnly | QIODevice::Append); + qWarning() << "Opening temp file for writing:" << tempFile->fileName(); + if (!success) { + qWarning() << "ERROR: Could not open temp file:" + << tempFile->fileName() << modelFile; + return; + } + size_t incomplete_size = tempFile->size(); + if (incomplete_size > 0) { + if (modTime < m_startTime) { + qWarning() << "File last modified before app started, rewinding by 1MB"; + if (incomplete_size >= 1024 * 1024) { + incomplete_size -= 1024 * 1024; + } else { + incomplete_size = 0; + } + } + tempFile->seek(incomplete_size); + } + + Network::globalInstance()->sendDownloadStarted(modelFile); + QNetworkRequest request("http://gpt4all.io/models/" + modelFile); + request.setRawHeader("range", QString("bytes=%1-").arg(incomplete_size).toUtf8()); + QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + 
QNetworkReply *modelReply = m_networkManager.get(request); + connect(modelReply, &QNetworkReply::downloadProgress, this, &Download::handleDownloadProgress); + connect(modelReply, &QNetworkReply::finished, this, &Download::handleModelDownloadFinished); + connect(modelReply, &QNetworkReply::readyRead, this, &Download::handleReadyRead); + m_activeDownloads.insert(modelReply, tempFile); +} + +void Download::cancelDownload(const QString &modelFile) +{ + for (int i = 0; i < m_activeDownloads.size(); ++i) { + QNetworkReply *modelReply = m_activeDownloads.keys().at(i); + QUrl url = modelReply->request().url(); + if (url.toString().endsWith(modelFile)) { + Network::globalInstance()->sendDownloadCanceled(modelFile); + + // Disconnect the signals + disconnect(modelReply, &QNetworkReply::downloadProgress, this, &Download::handleDownloadProgress); + disconnect(modelReply, &QNetworkReply::finished, this, &Download::handleModelDownloadFinished); + + modelReply->abort(); // Abort the download + modelReply->deleteLater(); // Schedule the reply for deletion + + QFile *tempFile = m_activeDownloads.value(modelReply); + tempFile->deleteLater(); + m_activeDownloads.remove(modelReply); + + // Emit downloadFinished signal for cleanup + emit downloadFinished(modelFile); + break; + } + } +} + +void Download::handleSslErrors(QNetworkReply *reply, const QList &errors) +{ + QUrl url = reply->request().url(); + for (auto e : errors) + qWarning() << "ERROR: Received ssl error:" << e.errorString() << "for" << url; +} + +void Download::handleModelsJsonDownloadFinished() +{ +#if 0 + QByteArray jsonData = QString("" + "[" + " {" + " \"md5sum\": \"61d48a82cb188cceb14ebb8082bfec37\"," + " \"filename\": \"ggml-gpt4all-j-v1.1-breezy.bin\"," + " \"filesize\": \"3785248281\"" + " }," + " {" + " \"md5sum\": \"879344aaa9d62fdccbda0be7a09e7976\"," + " \"filename\": \"ggml-gpt4all-j-v1.2-jazzy.bin\"," + " \"filesize\": \"3785248281\"," + " \"isDefault\": \"true\"" + " }," + " {" + " \"md5sum\": 
\"5b5a3f9b858d33b29b52b89692415595\"," + " \"filesize\": \"3785248281\"," + " \"filename\": \"ggml-gpt4all-j.bin\"" + " }" + "]" + ).toUtf8(); + printf("%s\n", jsonData.toStdString().c_str()); + fflush(stdout); +#else + QNetworkReply *jsonReply = qobject_cast(sender()); + if (!jsonReply) + return; + + QByteArray jsonData = jsonReply->readAll(); + jsonReply->deleteLater(); +#endif + parseModelsJsonFile(jsonData); +} + +void Download::parseModelsJsonFile(const QByteArray &jsonData) +{ + QJsonParseError err; + QJsonDocument document = QJsonDocument::fromJson(jsonData, &err); + if (err.error != QJsonParseError::NoError) { + qDebug() << "ERROR: Couldn't parse: " << jsonData << err.errorString(); + return; + } + + QString defaultModel; + QJsonArray jsonArray = document.array(); + const QString currentVersion = QCoreApplication::applicationVersion(); + + m_modelMap.clear(); + for (const QJsonValue &value : jsonArray) { + QJsonObject obj = value.toObject(); + + QString modelFilename = obj["filename"].toString(); + QString modelFilesize = obj["filesize"].toString(); + QString requires = obj["requires"].toString(); + QByteArray modelMd5sum = obj["md5sum"].toString().toLatin1().constData(); + bool isDefault = obj.contains("isDefault") && obj["isDefault"] == QString("true"); + bool bestGPTJ = obj.contains("bestGPTJ") && obj["bestGPTJ"] == QString("true"); + bool bestLlama = obj.contains("bestLlama") && obj["bestLlama"] == QString("true"); + bool bestMPT = obj.contains("bestMPT") && obj["bestMPT"] == QString("true"); + QString description = obj["description"].toString(); + + if (!requires.isEmpty() + && requires != currentVersion + && compareVersions(requires, currentVersion)) { + continue; + } + + if (isDefault) + defaultModel = modelFilename; + quint64 sz = modelFilesize.toULongLong(); + if (sz < 1024) { + modelFilesize = QString("%1 bytes").arg(sz); + } else if (sz < 1024 * 1024) { + modelFilesize = QString("%1 KB").arg(qreal(sz) / 1024, 0, 'g', 3); + } else if (sz < 1024 * 
1024 * 1024) { + modelFilesize = QString("%1 MB").arg(qreal(sz) / (1024 * 1024), 0, 'g', 3); + } else { + modelFilesize = QString("%1 GB").arg(qreal(sz) / (1024 * 1024 * 1024), 0, 'g', 3); + } + + QString filePath = downloadLocalModelsPath() + modelFilename; + QFileInfo info(filePath); + ModelInfo modelInfo; + modelInfo.filename = modelFilename; + modelInfo.filesize = modelFilesize; + modelInfo.md5sum = modelMd5sum; + modelInfo.installed = info.exists(); + modelInfo.isDefault = isDefault; + modelInfo.bestGPTJ = bestGPTJ; + modelInfo.bestLlama = bestLlama; + modelInfo.bestMPT = bestMPT; + modelInfo.description = description; + modelInfo.requires = requires; + m_modelMap.insert(modelInfo.filename, modelInfo); + } + + // remove ggml- prefix and .bin suffix + Q_ASSERT(defaultModel.startsWith("ggml-")); + defaultModel = defaultModel.remove(0, 5); + Q_ASSERT(defaultModel.endsWith(".bin")); + defaultModel.chop(4); + + QSettings settings; + settings.sync(); + settings.setValue("defaultModel", defaultModel); + settings.sync(); + emit modelListChanged(); +} + +void Download::handleReleaseJsonDownloadFinished() +{ + QNetworkReply *jsonReply = qobject_cast(sender()); + if (!jsonReply) + return; + + QByteArray jsonData = jsonReply->readAll(); + jsonReply->deleteLater(); + parseReleaseJsonFile(jsonData); +} + +void Download::parseReleaseJsonFile(const QByteArray &jsonData) +{ + QJsonParseError err; + QJsonDocument document = QJsonDocument::fromJson(jsonData, &err); + if (err.error != QJsonParseError::NoError) { + qDebug() << "ERROR: Couldn't parse: " << jsonData << err.errorString(); + return; + } + + QJsonArray jsonArray = document.array(); + + m_releaseMap.clear(); + for (const QJsonValue &value : jsonArray) { + QJsonObject obj = value.toObject(); + + QString version = obj["version"].toString(); + QString notes = obj["notes"].toString(); + QString contributors = obj["contributors"].toString(); + ReleaseInfo releaseInfo; + releaseInfo.version = version; + releaseInfo.notes = 
notes; + releaseInfo.contributors = contributors; + m_releaseMap.insert(version, releaseInfo); + } + + emit hasNewerReleaseChanged(); + emit releaseInfoChanged(); +} + +void Download::handleErrorOccurred(QNetworkReply::NetworkError code) +{ + QNetworkReply *modelReply = qobject_cast(sender()); + if (!modelReply) + return; + + QString modelFilename = modelReply->url().fileName(); + qWarning() << "ERROR: Network error occurred attempting to download" + << modelFilename + << "code:" << code + << "errorString" << modelReply->errorString(); + Network::globalInstance()->sendDownloadError(modelFilename, (int)code, modelReply->errorString()); + cancelDownload(modelFilename); +} + +void Download::handleDownloadProgress(qint64 bytesReceived, qint64 bytesTotal) +{ + QNetworkReply *modelReply = qobject_cast(sender()); + if (!modelReply) + return; + QFile *tempFile = m_activeDownloads.value(modelReply); + if (!tempFile) + return; + QString contentRange = modelReply->rawHeader("content-range"); + if (contentRange.contains("/")) { + QString contentTotalSize = contentRange.split("/").last(); + bytesTotal = contentTotalSize.toLongLong(); + } + + QString modelFilename = modelReply->url().fileName(); + emit downloadProgress(tempFile->pos(), bytesTotal, modelFilename); +} + +HashAndSaveFile::HashAndSaveFile() + : QObject(nullptr) +{ + moveToThread(&m_hashAndSaveThread); + m_hashAndSaveThread.setObjectName("hashandsave thread"); + m_hashAndSaveThread.start(); +} + +void HashAndSaveFile::hashAndSave(const QString &expectedHash, const QString &saveFilePath, + QFile *tempFile, QNetworkReply *modelReply) +{ + Q_ASSERT(!tempFile->isOpen()); + QString modelFilename = modelReply->url().fileName(); + + // Reopen the tempFile for hashing + if (!tempFile->open(QIODevice::ReadOnly)) { + qWarning() << "ERROR: Could not open temp file for hashing:" + << tempFile->fileName() << modelFilename; + emit hashAndSaveFinished(false, tempFile, modelReply); + return; + } + + QCryptographicHash 
hash(QCryptographicHash::Md5); + while(!tempFile->atEnd()) + hash.addData(tempFile->read(16384)); + if (hash.result().toHex() != expectedHash) { + tempFile->close(); + qWarning() << "ERROR: Download error MD5SUM did not match:" + << hash.result().toHex() + << "!=" << expectedHash << "for" << modelFilename; + tempFile->remove(); + emit hashAndSaveFinished(false, tempFile, modelReply); + return; + } + + // The file save needs the tempFile closed + tempFile->close(); + + // Attempt to *move* the verified tempfile into place - this should be atomic + // but will only work if the destination is on the same filesystem + if (tempFile->rename(saveFilePath)) { + emit hashAndSaveFinished(true, tempFile, modelReply); + return; + } + + // Reopen the tempFile for copying + if (!tempFile->open(QIODevice::ReadOnly)) { + qWarning() << "ERROR: Could not open temp file at finish:" + << tempFile->fileName() << modelFilename; + emit hashAndSaveFinished(false, tempFile, modelReply); + return; + } + + // Save the model file to disk + QFile file(saveFilePath); + if (file.open(QIODevice::WriteOnly)) { + QByteArray buffer; + while (!tempFile->atEnd()) { + buffer = tempFile->read(16384); + file.write(buffer); + } + file.close(); + tempFile->close(); + emit hashAndSaveFinished(true, tempFile, modelReply); + } else { + QFile::FileError error = file.error(); + qWarning() << "ERROR: Could not save model to location:" + << saveFilePath + << "failed with code" << error; + tempFile->close(); + emit hashAndSaveFinished(false, tempFile, modelReply); + return; + } +} + +void Download::handleModelDownloadFinished() +{ + QNetworkReply *modelReply = qobject_cast(sender()); + if (!modelReply) + return; + + QString modelFilename = modelReply->url().fileName(); + QFile *tempFile = m_activeDownloads.value(modelReply); + m_activeDownloads.remove(modelReply); + + if (modelReply->error()) { + qWarning() << "ERROR: downloading:" << modelReply->errorString(); + modelReply->deleteLater(); + 
tempFile->deleteLater(); + emit downloadFinished(modelFilename); + return; + } + + // The hash and save needs the tempFile closed + tempFile->close(); + + // Notify that we are calculating hash + ModelInfo info = m_modelMap.value(modelFilename); + info.calcHash = true; + m_modelMap.insert(modelFilename, info); + emit modelListChanged(); + + const QString saveFilePath = downloadLocalModelsPath() + modelFilename; + emit requestHashAndSave(info.md5sum, saveFilePath, tempFile, modelReply); +} + +void Download::handleHashAndSaveFinished(bool success, + QFile *tempFile, QNetworkReply *modelReply) +{ + // The hash and save should send back with tempfile closed + Q_ASSERT(!tempFile->isOpen()); + QString modelFilename = modelReply->url().fileName(); + Network::globalInstance()->sendDownloadFinished(modelFilename, success); + + ModelInfo info = m_modelMap.value(modelFilename); + info.calcHash = false; + info.installed = success; + m_modelMap.insert(modelFilename, info); + emit modelListChanged(); + + modelReply->deleteLater(); + tempFile->deleteLater(); + emit downloadFinished(modelFilename); +} + +void Download::handleReadyRead() +{ + QNetworkReply *modelReply = qobject_cast(sender()); + if (!modelReply) + return; + + QString modelFilename = modelReply->url().fileName(); + QFile *tempFile = m_activeDownloads.value(modelReply); + QByteArray buffer; + while (!modelReply->atEnd()) { + buffer = modelReply->read(16384); + tempFile->write(buffer); + } + tempFile->flush(); +} diff --git a/gpt4all-chat/download.h b/gpt4all-chat/download.h new file mode 100644 index 00000000..638bae43 --- /dev/null +++ b/gpt4all-chat/download.h @@ -0,0 +1,136 @@ +#ifndef DOWNLOAD_H +#define DOWNLOAD_H + +#include +#include +#include +#include +#include +#include +#include + +struct ModelInfo { + Q_GADGET + Q_PROPERTY(QString filename MEMBER filename) + Q_PROPERTY(QString filesize MEMBER filesize) + Q_PROPERTY(QByteArray md5sum MEMBER md5sum) + Q_PROPERTY(bool calcHash MEMBER calcHash) + 
Q_PROPERTY(bool installed MEMBER installed) + Q_PROPERTY(bool isDefault MEMBER isDefault) + Q_PROPERTY(bool bestGPTJ MEMBER bestGPTJ) + Q_PROPERTY(bool bestLlama MEMBER bestLlama) + Q_PROPERTY(bool bestMPT MEMBER bestMPT) + Q_PROPERTY(QString description MEMBER description) + Q_PROPERTY(QString requires MEMBER requires) + +public: + QString filename; + QString filesize; + QByteArray md5sum; + bool calcHash = false; + bool installed = false; + bool isDefault = false; + bool bestGPTJ = false; + bool bestLlama = false; + bool bestMPT = false; + QString description; + QString requires; +}; +Q_DECLARE_METATYPE(ModelInfo) + +struct ReleaseInfo { + Q_GADGET + Q_PROPERTY(QString version MEMBER version) + Q_PROPERTY(QString notes MEMBER notes) + Q_PROPERTY(QString contributors MEMBER contributors) + +public: + QString version; + QString notes; + QString contributors; +}; + +class HashAndSaveFile : public QObject +{ + Q_OBJECT +public: + HashAndSaveFile(); + +public Q_SLOTS: + void hashAndSave(const QString &hash, const QString &saveFilePath, + QFile *tempFile, QNetworkReply *modelReply); + +Q_SIGNALS: + void hashAndSaveFinished(bool success, + QFile *tempFile, QNetworkReply *modelReply); + +private: + QThread m_hashAndSaveThread; +}; + +class Download : public QObject +{ + Q_OBJECT + Q_PROPERTY(QList modelList READ modelList NOTIFY modelListChanged) + Q_PROPERTY(bool hasNewerRelease READ hasNewerRelease NOTIFY hasNewerReleaseChanged) + Q_PROPERTY(ReleaseInfo releaseInfo READ releaseInfo NOTIFY releaseInfoChanged) + Q_PROPERTY(QString downloadLocalModelsPath READ downloadLocalModelsPath + WRITE setDownloadLocalModelsPath + NOTIFY downloadLocalModelsPathChanged) + +public: + static Download *globalInstance(); + + QList modelList() const; + ReleaseInfo releaseInfo() const; + bool hasNewerRelease() const; + Q_INVOKABLE void updateModelList(); + Q_INVOKABLE void updateReleaseNotes(); + Q_INVOKABLE void downloadModel(const QString &modelFile); + Q_INVOKABLE void 
cancelDownload(const QString &modelFile); + Q_INVOKABLE QString defaultLocalModelsPath() const; + Q_INVOKABLE QString downloadLocalModelsPath() const; + Q_INVOKABLE void setDownloadLocalModelsPath(const QString &modelPath); + Q_INVOKABLE bool isFirstStart() const; + +private Q_SLOTS: + void handleSslErrors(QNetworkReply *reply, const QList &errors); + void handleModelsJsonDownloadFinished(); + void handleReleaseJsonDownloadFinished(); + void handleErrorOccurred(QNetworkReply::NetworkError code); + void handleDownloadProgress(qint64 bytesReceived, qint64 bytesTotal); + void handleModelDownloadFinished(); + void handleHashAndSaveFinished(bool success, + QFile *tempFile, QNetworkReply *modelReply); + void handleReadyRead(); + +Q_SIGNALS: + void downloadProgress(qint64 bytesReceived, qint64 bytesTotal, const QString &modelFile); + void downloadFinished(const QString &modelFile); + void modelListChanged(); + void releaseInfoChanged(); + void hasNewerReleaseChanged(); + void downloadLocalModelsPathChanged(); + void requestHashAndSave(const QString &hash, const QString &saveFilePath, + QFile *tempFile, QNetworkReply *modelReply); + +private: + void parseModelsJsonFile(const QByteArray &jsonData); + void parseReleaseJsonFile(const QByteArray &jsonData); + QString incompleteDownloadPath(const QString &modelFile); + + HashAndSaveFile *m_hashAndSave; + QMap m_modelMap; + QMap m_releaseMap; + QNetworkAccessManager m_networkManager; + QMap m_activeDownloads; + QString m_downloadLocalModelsPath; + QDateTime m_startTime; + +private: + explicit Download(); + ~Download() {} + friend class MyDownload; +}; + +#endif // DOWNLOAD_H diff --git a/gpt4all-chat/icons/copy.svg b/gpt4all-chat/icons/copy.svg new file mode 100644 index 00000000..5ab45b5b --- /dev/null +++ b/gpt4all-chat/icons/copy.svg @@ -0,0 +1,9 @@ + + + + + + + + + diff --git a/gpt4all-chat/icons/edit.svg b/gpt4all-chat/icons/edit.svg new file mode 100644 index 00000000..9820173b --- /dev/null +++ 
b/gpt4all-chat/icons/edit.svg @@ -0,0 +1,5 @@ + + diff --git a/gpt4all-chat/icons/favicon.icns b/gpt4all-chat/icons/favicon.icns new file mode 100644 index 00000000..38638c7a Binary files /dev/null and b/gpt4all-chat/icons/favicon.icns differ diff --git a/gpt4all-chat/icons/favicon.ico b/gpt4all-chat/icons/favicon.ico new file mode 100644 index 00000000..d7c27c4b Binary files /dev/null and b/gpt4all-chat/icons/favicon.ico differ diff --git a/gpt4all-chat/icons/logo-1024.png b/gpt4all-chat/icons/logo-1024.png new file mode 100644 index 00000000..2fb7cbdc Binary files /dev/null and b/gpt4all-chat/icons/logo-1024.png differ diff --git a/gpt4all-chat/icons/logo-128.png b/gpt4all-chat/icons/logo-128.png new file mode 100644 index 00000000..81c52374 Binary files /dev/null and b/gpt4all-chat/icons/logo-128.png differ diff --git a/gpt4all-chat/icons/logo-16.png b/gpt4all-chat/icons/logo-16.png new file mode 100644 index 00000000..344ac9b1 Binary files /dev/null and b/gpt4all-chat/icons/logo-16.png differ diff --git a/gpt4all-chat/icons/logo-256.png b/gpt4all-chat/icons/logo-256.png new file mode 100644 index 00000000..291f3003 Binary files /dev/null and b/gpt4all-chat/icons/logo-256.png differ diff --git a/gpt4all-chat/icons/logo-32.png b/gpt4all-chat/icons/logo-32.png new file mode 100644 index 00000000..06628744 Binary files /dev/null and b/gpt4all-chat/icons/logo-32.png differ diff --git a/gpt4all-chat/icons/logo-48.png b/gpt4all-chat/icons/logo-48.png new file mode 100644 index 00000000..4d53f9f7 Binary files /dev/null and b/gpt4all-chat/icons/logo-48.png differ diff --git a/gpt4all-chat/icons/logo-512.png b/gpt4all-chat/icons/logo-512.png new file mode 100644 index 00000000..4f70fbb4 Binary files /dev/null and b/gpt4all-chat/icons/logo-512.png differ diff --git a/gpt4all-chat/icons/logo-64.png b/gpt4all-chat/icons/logo-64.png new file mode 100644 index 00000000..fbffe619 Binary files /dev/null and b/gpt4all-chat/icons/logo-64.png differ diff --git 
a/gpt4all-chat/icons/logo.svg b/gpt4all-chat/icons/logo.svg new file mode 100644 index 00000000..e7084ec0 --- /dev/null +++ b/gpt4all-chat/icons/logo.svg @@ -0,0 +1,14 @@ + + + + + + + GPT + 4All + diff --git a/gpt4all-chat/icons/network.svg b/gpt4all-chat/icons/network.svg new file mode 100644 index 00000000..266f13d6 --- /dev/null +++ b/gpt4all-chat/icons/network.svg @@ -0,0 +1 @@ + diff --git a/gpt4all-chat/icons/regenerate.svg b/gpt4all-chat/icons/regenerate.svg new file mode 100644 index 00000000..016e6a52 --- /dev/null +++ b/gpt4all-chat/icons/regenerate.svg @@ -0,0 +1 @@ + diff --git a/gpt4all-chat/icons/send_message.svg b/gpt4all-chat/icons/send_message.svg new file mode 100644 index 00000000..d8650b66 --- /dev/null +++ b/gpt4all-chat/icons/send_message.svg @@ -0,0 +1 @@ + diff --git a/gpt4all-chat/icons/settings.svg b/gpt4all-chat/icons/settings.svg new file mode 100644 index 00000000..7542ea62 --- /dev/null +++ b/gpt4all-chat/icons/settings.svg @@ -0,0 +1,46 @@ + + + + + + + + diff --git a/gpt4all-chat/icons/stop_generating.svg b/gpt4all-chat/icons/stop_generating.svg new file mode 100644 index 00000000..c627ac0e --- /dev/null +++ b/gpt4all-chat/icons/stop_generating.svg @@ -0,0 +1 @@ + diff --git a/gpt4all-chat/icons/thumbs_down.svg b/gpt4all-chat/icons/thumbs_down.svg new file mode 100644 index 00000000..b01a82d3 --- /dev/null +++ b/gpt4all-chat/icons/thumbs_down.svg @@ -0,0 +1,5 @@ + + diff --git a/gpt4all-chat/icons/thumbs_up.svg b/gpt4all-chat/icons/thumbs_up.svg new file mode 100644 index 00000000..cd5efcd2 --- /dev/null +++ b/gpt4all-chat/icons/thumbs_up.svg @@ -0,0 +1,5 @@ + + diff --git a/gpt4all-chat/icons/trash.svg b/gpt4all-chat/icons/trash.svg new file mode 100644 index 00000000..b7c1a141 --- /dev/null +++ b/gpt4all-chat/icons/trash.svg @@ -0,0 +1,5 @@ + + diff --git a/gpt4all-chat/llm.cpp b/gpt4all-chat/llm.cpp new file mode 100644 index 00000000..e94c461b --- /dev/null +++ b/gpt4all-chat/llm.cpp @@ -0,0 +1,79 @@ +#include "llm.h" +#include 
"config.h" +#include "download.h" +#include "network.h" + +#include +#include +#include +#include +#include +#include +#include + +class MyLLM: public LLM { }; +Q_GLOBAL_STATIC(MyLLM, llmInstance) +LLM *LLM::globalInstance() +{ + return llmInstance(); +} + +LLM::LLM() + : QObject{nullptr} + , m_chatListModel(new ChatListModel(this)) + , m_threadCount(std::min(4, (int32_t) std::thread::hardware_concurrency())) + , m_compatHardware(true) +{ + connect(QCoreApplication::instance(), &QCoreApplication::aboutToQuit, + this, &LLM::aboutToQuit); + +#if defined(__x86_64__) || defined(__i386__) + if (QString(GPT4ALL_AVX_ONLY) == "OFF") { + const bool avx(__builtin_cpu_supports("avx")); + const bool avx2(__builtin_cpu_supports("avx2")); + const bool fma(__builtin_cpu_supports("fma")); + m_compatHardware = avx && avx2 && fma; + emit compatHardwareChanged(); + } +#endif +} + +bool LLM::checkForUpdates() const +{ + Network::globalInstance()->sendCheckForUpdates(); + +#if defined(Q_OS_LINUX) + QString tool("maintenancetool"); +#elif defined(Q_OS_WINDOWS) + QString tool("maintenancetool.exe"); +#elif defined(Q_OS_DARWIN) + QString tool("../../../maintenancetool.app/Contents/MacOS/maintenancetool"); +#endif + + QString fileName = QCoreApplication::applicationDirPath() + + "/../" + tool; + if (!QFileInfo::exists(fileName)) { + qDebug() << "Couldn't find tool at" << fileName << "so cannot check for updates!"; + return false; + } + + return QProcess::startDetached(fileName); +} + +int32_t LLM::threadCount() const +{ + return m_threadCount; +} + +void LLM::setThreadCount(int32_t n_threads) +{ + if (n_threads <= 0) + n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency()); + m_threadCount = n_threads; + emit threadCountChanged(); +} + +void LLM::aboutToQuit() +{ + m_chatListModel->saveChats(); +} diff --git a/gpt4all-chat/llm.h b/gpt4all-chat/llm.h new file mode 100644 index 00000000..ac12981d --- /dev/null +++ b/gpt4all-chat/llm.h @@ -0,0 +1,44 @@ +#ifndef LLM_H +#define 
LLM_H + +#include + +#include "chatlistmodel.h" + +class LLM : public QObject +{ + Q_OBJECT + Q_PROPERTY(ChatListModel *chatListModel READ chatListModel NOTIFY chatListModelChanged) + Q_PROPERTY(int32_t threadCount READ threadCount WRITE setThreadCount NOTIFY threadCountChanged) + Q_PROPERTY(bool compatHardware READ compatHardware NOTIFY compatHardwareChanged) + +public: + static LLM *globalInstance(); + + ChatListModel *chatListModel() const { return m_chatListModel; } + int32_t threadCount() const; + void setThreadCount(int32_t n_threads); + bool compatHardware() const { return m_compatHardware; } + + Q_INVOKABLE bool checkForUpdates() const; + +Q_SIGNALS: + void chatListModelChanged(); + void threadCountChanged(); + void compatHardwareChanged(); + +private Q_SLOTS: + void aboutToQuit(); + +private: + ChatListModel *m_chatListModel; + int32_t m_threadCount; + bool m_compatHardware; + +private: + explicit LLM(); + ~LLM() {} + friend class MyLLM; +}; + +#endif // LLM_H diff --git a/gpt4all-chat/llmodel/CMakeLists.txt b/gpt4all-chat/llmodel/CMakeLists.txt new file mode 100644 index 00000000..704faccc --- /dev/null +++ b/gpt4all-chat/llmodel/CMakeLists.txt @@ -0,0 +1,47 @@ +cmake_minimum_required(VERSION 3.16) + +if(APPLE) + option(BUILD_UNIVERSAL "Build a Universal binary on macOS" ON) + if(BUILD_UNIVERSAL) + # Build a Universal binary on macOS + # This requires that the found Qt library is compiled as Universal binaries. 
+ set(CMAKE_OSX_ARCHITECTURES "arm64;x86_64" CACHE STRING "" FORCE) + else() + # Build for the host architecture on macOS + set(CMAKE_OSX_ARCHITECTURES "${CMAKE_HOST_SYSTEM_PROCESSOR}" CACHE STRING "" FORCE) + endif() +endif() + +# Include the binary directory for the generated header file +include_directories("${CMAKE_CURRENT_BINARY_DIR}") + +project(llmodel VERSION ${APP_VERSION} LANGUAGES CXX C) + +set(CMAKE_CXX_STANDARD_REQUIRED ON) + +set(LLAMA_BUILD_EXAMPLES ON CACHE BOOL "llama: build examples" FORCE) +set(BUILD_SHARED_LIBS ON FORCE) + +set(CMAKE_VERBOSE_MAKEFILE ON) +if (GPT4ALL_AVX_ONLY) + set(LLAMA_AVX2 OFF CACHE BOOL "llama: enable AVX2" FORCE) + set(LLAMA_F16C OFF CACHE BOOL "llama: enable F16C" FORCE) + set(LLAMA_FMA OFF CACHE BOOL "llama: enable FMA" FORCE) +endif() + +add_subdirectory(llama.cpp) + +add_library(llmodel + gptj.h gptj.cpp + llamamodel.h llamamodel.cpp + llama.cpp/examples/common.cpp + llmodel.h llmodel_c.h llmodel_c.cpp + mpt.h mpt.cpp + utils.h utils.cpp +) + +target_link_libraries(llmodel + PRIVATE llama) + +set(COMPONENT_NAME_MAIN ${PROJECT_NAME}) +set(CMAKE_INSTALL_PREFIX ${CMAKE_BINARY_DIR}/install) diff --git a/gpt4all-chat/llmodel/gptj.cpp b/gpt4all-chat/llmodel/gptj.cpp new file mode 100644 index 00000000..837fd1f8 --- /dev/null +++ b/gpt4all-chat/llmodel/gptj.cpp @@ -0,0 +1,1102 @@ +#include "gptj.h" +#include "llama.cpp/ggml.h" + +#include "utils.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +// default hparams (GPT-J 6B) +static const size_t MB = 1024*1024; + +struct gptj_hparams { + int32_t n_vocab = 50400; + int32_t n_ctx = 2048; + int32_t n_embd = 4096; + int32_t n_head = 16; + int32_t n_layer = 28; + int32_t n_rot = 64; + int32_t f16 = 1; +}; + +struct gptj_layer { + // normalization + struct ggml_tensor * ln_1_g; + struct ggml_tensor * ln_1_b; + + // attention + struct ggml_tensor * c_attn_q_proj_w; + struct ggml_tensor * c_attn_k_proj_w; + 
struct ggml_tensor * c_attn_v_proj_w; + + struct ggml_tensor * c_attn_proj_w; + + // ff + struct ggml_tensor * c_mlp_fc_w; + struct ggml_tensor * c_mlp_fc_b; + + struct ggml_tensor * c_mlp_proj_w; + struct ggml_tensor * c_mlp_proj_b; +}; + +struct gptj_buffer { + uint8_t * addr = NULL; + size_t size = 0; + + void resize(size_t size) { + delete[] addr; + addr = new uint8_t[size]; + this->size = size; + } + + ~gptj_buffer() { + fflush(stdout); + delete[] addr; + } +}; + +struct gptj_kv_cache { + struct ggml_tensor * k; + struct ggml_tensor * v; + + struct ggml_context * ctx = NULL; + + gptj_buffer buf; + + int n; // number of tokens currently in the cache + + ~gptj_kv_cache() { + if (ctx) { + ggml_free(ctx); + } + } +}; + +struct gptj_model { + gptj_hparams hparams; + + // normalization + struct ggml_tensor * ln_f_g; + struct ggml_tensor * ln_f_b; + + struct ggml_tensor * wte; // position embedding + + struct ggml_tensor * lmh_g; // language model head + struct ggml_tensor * lmh_b; // language model bias + + std::vector layers; + + // key + value memory + struct gptj_kv_cache kv_self; + + // + struct ggml_context * ctx; + std::map tensors; + + gptj_buffer buf; + + ~gptj_model() { + if (ctx) { + ggml_free(ctx); + } + } +}; + +static bool kv_cache_init( + const struct gptj_hparams & hparams, + struct gptj_kv_cache & cache, + ggml_type wtype, + int n_ctx) { + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + + const int64_t n_mem = (int64_t)n_layer*n_ctx; + const int64_t n_elements = n_embd*n_mem; + + cache.buf.resize(2u*n_elements*ggml_type_size(wtype) + 2u*MB); + + struct ggml_init_params params; + params.mem_size = cache.buf.size; + params.mem_buffer = cache.buf.addr; + params.no_alloc = false; + + cache.ctx = ggml_init(params); + + if (!cache.ctx) { + fprintf(stderr, "%s: failed to allocate memory for kv cache\n", __func__); + return false; + } + + cache.k = ggml_new_tensor_1d(cache.ctx, wtype, n_elements); + cache.v = 
ggml_new_tensor_1d(cache.ctx, wtype, n_elements); + + return true; +} + +// load the model's weights from a stream +bool gptj_model_load(const std::string &fname, std::istream &fin, gptj_model & model, gpt_vocab & vocab) { + printf("%s: loading model from '%s' - please wait ...\n", __func__, fname.c_str()); + + // verify magic + { + uint32_t magic; + fin.read((char *) &magic, sizeof(magic)); + if (magic != 0x67676d6c) { + fprintf(stderr, "%s: invalid model file '%s' (bad magic)\n", __func__, fname.c_str()); + return false; + } + } + + // load hparams + { + auto & hparams = model.hparams; + + fin.read((char *) &hparams.n_vocab, sizeof(hparams.n_vocab)); + fin.read((char *) &hparams.n_ctx, sizeof(hparams.n_ctx)); + fin.read((char *) &hparams.n_embd, sizeof(hparams.n_embd)); + fin.read((char *) &hparams.n_head, sizeof(hparams.n_head)); + fin.read((char *) &hparams.n_layer, sizeof(hparams.n_layer)); + fin.read((char *) &hparams.n_rot, sizeof(hparams.n_rot)); + fin.read((char *) &hparams.f16, sizeof(hparams.f16)); + + printf("%s: n_vocab = %d\n", __func__, hparams.n_vocab); + printf("%s: n_ctx = %d\n", __func__, hparams.n_ctx); + printf("%s: n_embd = %d\n", __func__, hparams.n_embd); + printf("%s: n_head = %d\n", __func__, hparams.n_head); + printf("%s: n_layer = %d\n", __func__, hparams.n_layer); + printf("%s: n_rot = %d\n", __func__, hparams.n_rot); + printf("%s: f16 = %d\n", __func__, hparams.f16); + } + + // load vocab + { + int32_t n_vocab = 0; + fin.read((char *) &n_vocab, sizeof(n_vocab)); + + if (n_vocab != model.hparams.n_vocab) { + fprintf(stderr, "%s: invalid model file '%s' (bad vocab size %d != %d)\n", + __func__, fname.c_str(), n_vocab, model.hparams.n_vocab); + return false; + } + + std::string word; + for (int i = 0; i < n_vocab; i++) { + uint32_t len; + fin.read((char *) &len, sizeof(len)); + + word.resize(len); + fin.read((char *) word.data(), len); + + vocab.token_to_id[word] = i; + vocab.id_to_token[i] = word; + } + } + + // for the big tensors, we 
have the option to store the data in 16-bit floats or quantized + // in order to save memory and also to speed up the computation + ggml_type wtype = GGML_TYPE_COUNT; + switch (model.hparams.f16) { + case 0: wtype = GGML_TYPE_F32; break; + case 1: wtype = GGML_TYPE_F16; break; + case 2: wtype = GGML_TYPE_Q4_0; break; + case 3: wtype = GGML_TYPE_Q4_1; break; + case 5: wtype = GGML_TYPE_Q4_2; break; + default: + { + fprintf(stderr, "%s: invalid model file '%s' (bad f16 value %d)\n", + __func__, fname.c_str(), model.hparams.f16); + return false; + } + } + + const ggml_type wtype2 = GGML_TYPE_F32; + + auto & ctx = model.ctx; + + size_t ctx_size = 0; + + { + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + const int n_vocab = hparams.n_vocab; + + ctx_size += n_embd*ggml_type_sizef(GGML_TYPE_F32); // ln_f_g + ctx_size += n_embd*ggml_type_sizef(GGML_TYPE_F32); // ln_f_b + + ctx_size += n_embd*n_vocab*ggml_type_sizef(wtype); // wte + + ctx_size += n_embd*n_vocab*ggml_type_sizef(wtype); // lmh_g + ctx_size += n_vocab*ggml_type_sizef(GGML_TYPE_F32); // lmh_b + + ctx_size += n_layer*(n_embd*ggml_type_sizef(GGML_TYPE_F32)); // ln_1_g + ctx_size += n_layer*(n_embd*ggml_type_sizef(GGML_TYPE_F32)); // ln_1_b + + ctx_size += n_layer*(n_embd*n_embd*ggml_type_sizef(wtype)); // c_attn_q_proj_w + ctx_size += n_layer*(n_embd*n_embd*ggml_type_sizef(wtype)); // c_attn_k_proj_w + ctx_size += n_layer*(n_embd*n_embd*ggml_type_sizef(wtype)); // c_attn_v_proj_w + + ctx_size += n_layer*(n_embd*n_embd*ggml_type_sizef(wtype)); // c_attn_proj_w + + ctx_size += n_layer*(4*n_embd*n_embd*ggml_type_sizef(wtype)); // c_mlp_fc_w + ctx_size += n_layer*( 4*n_embd*ggml_type_sizef(GGML_TYPE_F32)); // c_mlp_fc_b + + ctx_size += n_layer*(4*n_embd*n_embd*ggml_type_sizef(wtype)); // c_mlp_proj_w + ctx_size += n_layer*( n_embd*ggml_type_sizef(GGML_TYPE_F32)); // c_mlp_proj_b + + ctx_size += 
n_ctx*n_layer*n_embd*ggml_type_sizef(GGML_TYPE_F32); // memory_k + ctx_size += n_ctx*n_layer*n_embd*ggml_type_sizef(GGML_TYPE_F32); // memory_v + + ctx_size += (5 + 10*n_layer)*256; // object overhead + + printf("%s: ggml ctx size = %6.2f MB\n", __func__, ctx_size/(1024.0*1024.0)); + } + + // create the ggml context + { + struct ggml_init_params params = { + .mem_size = ctx_size, + .mem_buffer = NULL, + }; + + model.ctx = ggml_init(params); + if (!model.ctx) { + fprintf(stderr, "%s: ggml_init() failed\n", __func__); + return false; + } + } + + // prepare memory for the weights + { + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + const int n_vocab = hparams.n_vocab; + + model.layers.resize(n_layer); + + model.wte = ggml_new_tensor_2d(ctx, wtype, n_embd, n_vocab); + + model.ln_f_g = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + model.ln_f_b = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + + model.lmh_g = ggml_new_tensor_2d(ctx, wtype, n_embd, n_vocab); + model.lmh_b = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_vocab); + + // map by name + model.tensors["transformer.wte.weight"] = model.wte; + + model.tensors["transformer.ln_f.weight"] = model.ln_f_g; + model.tensors["transformer.ln_f.bias"] = model.ln_f_b; + + model.tensors["lm_head.weight"] = model.lmh_g; + model.tensors["lm_head.bias"] = model.lmh_b; + + for (int i = 0; i < n_layer; ++i) { + auto & layer = model.layers[i]; + + layer.ln_1_g = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + layer.ln_1_b = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + + layer.c_attn_q_proj_w = ggml_new_tensor_2d(ctx, wtype, n_embd, n_embd); + layer.c_attn_k_proj_w = ggml_new_tensor_2d(ctx, wtype, n_embd, n_embd); + layer.c_attn_v_proj_w = ggml_new_tensor_2d(ctx, wtype, n_embd, n_embd); + + layer.c_attn_proj_w = ggml_new_tensor_2d(ctx, wtype, n_embd, n_embd); + + layer.c_mlp_fc_w = ggml_new_tensor_2d(ctx, wtype, n_embd, 
4*n_embd); + layer.c_mlp_fc_b = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, 4*n_embd); + + layer.c_mlp_proj_w = ggml_new_tensor_2d(ctx, wtype, 4*n_embd, n_embd); + layer.c_mlp_proj_b = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + + // map by name + model.tensors["transformer.h." + std::to_string(i) + ".ln_1.weight"] = layer.ln_1_g; + model.tensors["transformer.h." + std::to_string(i) + ".ln_1.bias"] = layer.ln_1_b; + + model.tensors["transformer.h." + std::to_string(i) + ".attn.q_proj.weight"] = layer.c_attn_q_proj_w; + model.tensors["transformer.h." + std::to_string(i) + ".attn.k_proj.weight"] = layer.c_attn_k_proj_w; + model.tensors["transformer.h." + std::to_string(i) + ".attn.v_proj.weight"] = layer.c_attn_v_proj_w; + + model.tensors["transformer.h." + std::to_string(i) + ".attn.out_proj.weight"] = layer.c_attn_proj_w; + + model.tensors["transformer.h." + std::to_string(i) + ".mlp.fc_in.weight"] = layer.c_mlp_fc_w; + model.tensors["transformer.h." + std::to_string(i) + ".mlp.fc_in.bias"] = layer.c_mlp_fc_b; + + model.tensors["transformer.h." + std::to_string(i) + ".mlp.fc_out.weight"] = layer.c_mlp_proj_w; + model.tensors["transformer.h." 
+ std::to_string(i) + ".mlp.fc_out.bias"] = layer.c_mlp_proj_b; + } + } + + // key + value memory + { + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + + const int n_mem = n_layer*n_ctx; + const int n_elements = n_embd*n_mem; + + if (!kv_cache_init(hparams, model.kv_self, GGML_TYPE_F16, model.hparams.n_ctx)) { + fprintf(stderr, "%s: kv_cache_init() failed for self-attention cache\n", __func__); + ggml_free(ctx); + return false; + } + + const size_t memory_size = ggml_nbytes(model.kv_self.k) + ggml_nbytes(model.kv_self.v); + printf("%s: kv self size = %7.2f MB\n", __func__, memory_size / 1024.0 / 1024.0); + } + + // load weights + { + int n_tensors = 0; + size_t total_size = 0; + + printf("%s: ", __func__); + + while (true) { + int32_t n_dims; + int32_t length; + int32_t ftype; + + fin.read(reinterpret_cast(&n_dims), sizeof(n_dims)); + fin.read(reinterpret_cast(&length), sizeof(length)); + fin.read(reinterpret_cast(&ftype), sizeof(ftype)); + + if (fin.eof()) { + break; + } + + int32_t nelements = 1; + int32_t ne[2] = { 1, 1 }; + for (int i = 0; i < n_dims; ++i) { + fin.read(reinterpret_cast(&ne[i]), sizeof(ne[i])); + nelements *= ne[i]; + } + + std::string name(length, 0); + fin.read(&name[0], length); + + if (model.tensors.find(name.data()) == model.tensors.end()) { + fprintf(stderr, "%s: unknown tensor '%s' in model file\n", __func__, name.data()); + return false; + } + + auto tensor = model.tensors[name.data()]; + if (ggml_nelements(tensor) != nelements) { + fprintf(stderr, "%s: tensor '%s' has wrong size in model file\n", __func__, name.data()); + return false; + } + + if (tensor->ne[0] != ne[0] || tensor->ne[1] != ne[1]) { + fprintf(stderr, "%s: tensor '%s' has wrong shape in model file: got [%lu, %lu], expected [%d, %d]\n", + __func__, name.data(), tensor->ne[0], tensor->ne[1], ne[0], ne[1]); + return false; + } + + if (0) { + static const char * 
ftype_str[] = { "f32", "f16", "q4_0", "q4_1", }; + printf("%24s - [%5d, %5d], type = %6s, %6.2f MB, %9zu bytes\n", name.data(), ne[0], ne[1], ftype_str[ftype], ggml_nbytes(tensor)/1024.0/1024.0, ggml_nbytes(tensor)); + } + + size_t bpe = 0; + + switch (ftype) { + case 0: bpe = ggml_type_size(GGML_TYPE_F32); break; + case 1: bpe = ggml_type_size(GGML_TYPE_F16); break; + case 2: bpe = ggml_type_size(GGML_TYPE_Q4_0); assert(ne[0] % 64 == 0); break; + case 3: bpe = ggml_type_size(GGML_TYPE_Q4_1); assert(ne[0] % 64 == 0); break; + default: + { + fprintf(stderr, "%s: unknown ftype %d in model file\n", __func__, ftype); + return false; + } + }; + + if ((nelements*bpe)/ggml_blck_size(tensor->type) != ggml_nbytes(tensor)) { + fprintf(stderr, "%s: tensor '%s' has wrong size in model file: got %zu, expected %zu\n", + __func__, name.data(), ggml_nbytes(tensor), nelements*bpe); + return false; + } + + fin.read(reinterpret_cast(tensor->data), ggml_nbytes(tensor)); + + //printf("%42s - [%5d, %5d], type = %6s, %6.2f MB\n", name.data(), ne[0], ne[1], ftype == 0 ? 
"float" : "f16", ggml_nbytes(tensor)/1024.0/1024.0); + total_size += ggml_nbytes(tensor); + if (++n_tensors % 8 == 0) { + printf("."); + fflush(stdout); + } + } + + printf(" done\n"); + + printf("%s: model size = %8.2f MB / num tensors = %d\n", __func__, total_size/1024.0/1024.0, n_tensors); + } + + return true; +} + +// load the model's weights from a file path +bool gptj_model_load(const std::string & fname, gptj_model & model, gpt_vocab & vocab) { + + auto fin = std::ifstream(fname, std::ios::binary); + if (!fin) { + fprintf(stderr, "%s: failed to open '%s'\n", __func__, fname.c_str()); + return false; + } + + bool loaded = gptj_model_load(fname, fin, model, vocab); + fin.close(); + return loaded; +} + +// evaluate the transformer +// +// - model: the model +// - n_threads: number of threads to use +// - n_past: the context size so far +// - embd_inp: the embeddings of the tokens in the context +// - embd_w: the predicted logits for the next token +// +// The GPT-J model requires about 16MB of memory per input token. 
+// +bool gptj_eval( + gptj_model & model, + const int n_threads, + const int n_past, + const std::vector & embd_inp, + std::vector & embd_w, + size_t & mem_per_token) { + const int N = embd_inp.size(); + + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + const int n_head = hparams.n_head; + const int n_vocab = hparams.n_vocab; + const int n_rot = hparams.n_rot; + + const int d_key = n_embd/n_head; + + static size_t buf_size = 1024u*MB; + if (!model.buf.addr || model.buf.size < buf_size) + model.buf.resize(buf_size); + + if (mem_per_token > 0 && mem_per_token*N > model.buf.size) { + const size_t buf_size_new = 1.1*(mem_per_token*N); // add 10% to account for ggml object overhead + printf("\n%s: reallocating buffer from %zu to %zu bytes\n", __func__, model.buf.size, buf_size_new); + + // reallocate + model.buf.resize(buf_size_new); + if (model.buf.addr == nullptr) { + fprintf(stderr, "%s: failed to allocate %zu bytes\n", __func__, model.buf.size); + return false; + } + } + + struct ggml_init_params params = { + .mem_size = model.buf.size, + .mem_buffer = model.buf.addr, + }; + + struct ggml_context * ctx0 = ggml_init(params); + struct ggml_cgraph gf = { .n_threads = n_threads }; + + struct ggml_tensor * embd = ggml_new_tensor_1d(ctx0, GGML_TYPE_I32, N); + memcpy(embd->data, embd_inp.data(), N*ggml_element_size(embd)); + + // wte + struct ggml_tensor * inpL = ggml_get_rows(ctx0, model.wte, embd); + + for (int il = 0; il < n_layer; ++il) { + struct ggml_tensor * cur; + + // norm + { + cur = ggml_norm(ctx0, inpL); + + // cur = ln_1_g*cur + ln_1_b + cur = ggml_add(ctx0, + ggml_mul(ctx0, + ggml_repeat(ctx0, model.layers[il].ln_1_g, cur), + cur), + ggml_repeat(ctx0, model.layers[il].ln_1_b, cur)); + } + + struct ggml_tensor * inpSA = cur; + + // self-attention + { + struct ggml_tensor * Qcur = ggml_mul_mat(ctx0, model.layers[il].c_attn_q_proj_w, cur); + struct 
ggml_tensor * Kcur = ggml_mul_mat(ctx0, model.layers[il].c_attn_k_proj_w, cur); + struct ggml_tensor * Vcur = ggml_mul_mat(ctx0, model.layers[il].c_attn_v_proj_w, cur); + + // store key and value to memory + { + struct ggml_tensor * k = ggml_view_1d(ctx0, model.kv_self.k, N*n_embd, (ggml_element_size(model.kv_self.k)*n_embd)*(il*n_ctx + n_past)); + struct ggml_tensor * v = ggml_view_1d(ctx0, model.kv_self.v, N*n_embd, (ggml_element_size(model.kv_self.v)*n_embd)*(il*n_ctx + n_past)); + + ggml_build_forward_expand(&gf, ggml_cpy(ctx0, Kcur, k)); + ggml_build_forward_expand(&gf, ggml_cpy(ctx0, Vcur, v)); + } + + // Q = Qcur.contiguous().view(n_embd/n_head, n_head, N).permute(0, 2, 1, 3) + struct ggml_tensor * Q = + ggml_permute(ctx0, + ggml_rope(ctx0, + ggml_cpy(ctx0, + Qcur, + ggml_new_tensor_3d(ctx0, GGML_TYPE_F32, n_embd/n_head, n_head, N)), + n_past, n_rot, 0), + 0, 2, 1, 3); + + // K = Kmem.view(n_embd/n_head, n_head, n_past + N).permute(0, 2, 1, 3) + struct ggml_tensor * K = + ggml_permute(ctx0, + ggml_rope(ctx0, + ggml_reshape_3d(ctx0, + ggml_view_1d(ctx0, model.kv_self.k, (n_past + N)*n_embd, il*n_ctx*ggml_element_size(model.kv_self.k)*n_embd), + n_embd/n_head, n_head, n_past + N), + n_past, n_rot, 1), + 0, 2, 1, 3); + + // K * Q + struct ggml_tensor * KQ = ggml_mul_mat(ctx0, K, Q); + + // KQ_scaled = KQ / sqrt(n_embd/n_head) + struct ggml_tensor * KQ_scaled = + ggml_scale(ctx0, + KQ, + ggml_new_f32(ctx0, 1.0f/sqrt(float(n_embd)/n_head)) + ); + + // KQ_masked = mask_past(KQ_scaled) + struct ggml_tensor * KQ_masked = ggml_diag_mask_inf(ctx0, KQ_scaled, n_past); + + // KQ = soft_max(KQ_masked) + struct ggml_tensor * KQ_soft_max = ggml_soft_max(ctx0, KQ_masked); + + // V_trans = Vmem.view(n_embd/n_head, n_head, n_past + N).permute(1, 2, 0, 3).contiguous() + struct ggml_tensor * V_trans = + ggml_cpy(ctx0, + ggml_permute(ctx0, + ggml_reshape_3d(ctx0, + ggml_view_1d(ctx0, model.kv_self.v, (n_past + N)*n_embd, il*n_ctx*ggml_element_size(model.kv_self.v)*n_embd), + 
n_embd/n_head, n_head, n_past + N), + 1, 2, 0, 3), + ggml_new_tensor_3d(ctx0, model.kv_self.v->type, n_past + N, n_embd/n_head, n_head)); + + // KQV = transpose(V) * KQ_soft_max + struct ggml_tensor * KQV = ggml_mul_mat(ctx0, V_trans, KQ_soft_max); + + // KQV_merged = KQV.permute(0, 2, 1, 3) + struct ggml_tensor * KQV_merged = ggml_permute(ctx0, KQV, 0, 2, 1, 3); + + // cur = KQV_merged.contiguous().view(n_embd, N) + cur = ggml_cpy(ctx0, + KQV_merged, + ggml_new_tensor_2d(ctx0, GGML_TYPE_F32, n_embd, N)); + + // projection (no bias) + cur = ggml_mul_mat(ctx0, + model.layers[il].c_attn_proj_w, + cur); + } + + struct ggml_tensor * inpFF = cur; + + // feed-forward network + // this is independent of the self-attention result, so it could be done in parallel to the self-attention + { + // note here we pass inpSA instead of cur + cur = ggml_mul_mat(ctx0, + model.layers[il].c_mlp_fc_w, + inpSA); + + cur = ggml_add(ctx0, + ggml_repeat(ctx0, model.layers[il].c_mlp_fc_b, cur), + cur); + + // GELU activation + cur = ggml_gelu(ctx0, cur); + + // projection + // cur = proj_w*cur + proj_b + cur = ggml_mul_mat(ctx0, + model.layers[il].c_mlp_proj_w, + cur); + + cur = ggml_add(ctx0, + ggml_repeat(ctx0, model.layers[il].c_mlp_proj_b, cur), + cur); + } + + // self-attention + FF + cur = ggml_add(ctx0, cur, inpFF); + + // input for next layer + inpL = ggml_add(ctx0, cur, inpL); + } + + // norm + { + inpL = ggml_norm(ctx0, inpL); + + // inpL = ln_f_g*inpL + ln_f_b + inpL = ggml_add(ctx0, + ggml_mul(ctx0, + ggml_repeat(ctx0, model.ln_f_g, inpL), + inpL), + ggml_repeat(ctx0, model.ln_f_b, inpL)); + } + + // lm_head + { + inpL = ggml_mul_mat(ctx0, model.lmh_g, inpL); + + inpL = ggml_add(ctx0, + ggml_repeat(ctx0, model.lmh_b, inpL), + inpL); + } + + // logits -> probs + //inpL = ggml_soft_max(ctx0, inpL); + + // run the computation + ggml_build_forward_expand(&gf, inpL); + ggml_graph_compute (ctx0, &gf); + + //if (n_past%100 == 0) { + // ggml_graph_print (&gf); + // 
ggml_graph_dump_dot(&gf, NULL, "gpt-2.dot"); + //} + + //embd_w.resize(n_vocab*N); + //memcpy(embd_w.data(), ggml_get_data(inpL), sizeof(float)*n_vocab*N); + + // return result for just the last token + embd_w.resize(n_vocab); + memcpy(embd_w.data(), (float *) ggml_get_data(inpL) + (n_vocab*(N-1)), sizeof(float)*n_vocab); + + if (mem_per_token == 0) { + mem_per_token = ggml_used_mem(ctx0)/N; + } + //printf("used_mem = %zu\n", ggml_used_mem(ctx0)); + + ggml_free(ctx0); + + return true; +} + +#define GPTJ_MAX_RNG_STATE 64*1024 + +size_t gptj_get_state_size(const gptj_model &model) +{ + // we don't know size of rng until we actually serialize it. so reserve more than enough memory for its serialized state. + // for reference, std::mt19937(1337) serializes to 6701 bytes. + const size_t s_rng_size = sizeof(size_t); + const size_t s_rng = GPTJ_MAX_RNG_STATE; + const size_t s_kv_size = sizeof(size_t); + const size_t s_kv_ntok = sizeof(int); + const size_t s_kv = model.kv_self.buf.size; + const size_t s_total = ( + + s_rng_size + + s_rng + + s_kv_size + + s_kv_ntok + + s_kv + ); + fflush(stdout); + return s_total; +} + +size_t gptj_copy_state_data(const gptj_model &model, const std::mt19937 &rng, uint8_t *dest) +{ + uint8_t * out = dest; + fflush(stdout); + // copy rng + { + std::stringstream rng_ss; + rng_ss << rng; + + const size_t rng_size = rng_ss.str().size(); + char rng_buf[GPTJ_MAX_RNG_STATE]; + + memset(&rng_buf[0], 0, GPTJ_MAX_RNG_STATE); + memcpy(&rng_buf[0], rng_ss.str().data(), rng_ss.str().size()); + + memcpy(out, &rng_size, sizeof(rng_size)); out += sizeof(rng_size); + memcpy(out, &rng_buf[0], GPTJ_MAX_RNG_STATE); out += GPTJ_MAX_RNG_STATE; + } + + // copy kv cache + { + const size_t kv_size = model.kv_self.buf.size; + const int kv_ntok = model.kv_self.n; + + memcpy(out, &kv_size, sizeof(kv_size)); out += sizeof(kv_size); + memcpy(out, &kv_ntok, sizeof(kv_ntok)); out += sizeof(kv_ntok); + + if (kv_size) { + memcpy(out, model.kv_self.buf.addr, kv_size); out += 
kv_size; + } + } + + const size_t written = out - dest; + const size_t expected = gptj_get_state_size(model); + assert(written == expected); + fflush(stdout); + return written; +} + +size_t gptj_set_state_data(gptj_model *model, std::mt19937 *rng, const uint8_t *src) +{ + const uint8_t * in = src; + + // set rng + { + size_t rng_size; + char rng_buf[GPTJ_MAX_RNG_STATE]; + + memcpy(&rng_size, in, sizeof(rng_size)); in += sizeof(rng_size); + memcpy(&rng_buf[0], in, GPTJ_MAX_RNG_STATE); in += GPTJ_MAX_RNG_STATE; + + std::stringstream rng_ss; + rng_ss.str(std::string(&rng_buf[0], rng_size)); + rng_ss >> *rng; + + assert(rng_ss.fail() == false); + } + + // set kv cache + { + size_t kv_size; + int kv_ntok; + + memcpy(&kv_size, in, sizeof(kv_size)); in += sizeof(kv_size); + memcpy(&kv_ntok, in, sizeof(kv_ntok)); in += sizeof(kv_ntok); + + if (kv_size) { + assert(model->kv_self.buf.size == kv_size); + + void * k_data = model->kv_self.k->data; // remember data pointers + void * v_data = model->kv_self.v->data; // because their value is stored in buf and overwritten by memcpy + + memcpy(model->kv_self.buf.addr, in, kv_size); in += kv_size; + + model->kv_self.k->data = k_data; // restore correct data pointers + model->kv_self.v->data = v_data; + + } + + model->kv_self.n = kv_ntok; + } + + const size_t nread = in - src; + const size_t expected = gptj_get_state_size(*model); + assert(nread == expected); + fflush(stdout); + return nread; +} + +struct GPTJPrivate { + const std::string modelPath; + bool modelLoaded; + gpt_vocab vocab; + gptj_model *model = nullptr; + int64_t n_threads = 0; + size_t mem_per_token = 0; + std::mt19937 rng; +}; + +GPTJ::GPTJ() + : d_ptr(new GPTJPrivate) { + + d_ptr->model = new gptj_model; + d_ptr->modelLoaded = false; +} + +bool GPTJ::loadModel(const std::string &modelPath) { + std::mt19937 rng(time(NULL)); + d_ptr->rng = rng; + + auto fin = std::ifstream(modelPath, std::ios::binary); + + // load the model + if (!gptj_model_load(modelPath, fin, 
*d_ptr->model, d_ptr->vocab)) { + std::cerr << "GPT-J ERROR: failed to load model from " << modelPath; + return false; + } + + d_ptr->n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency()); + d_ptr->modelLoaded = true; + fflush(stdout); + return true; +} + +void GPTJ::setThreadCount(int32_t n_threads) { + d_ptr->n_threads = n_threads; +} + +int32_t GPTJ::threadCount() { + return d_ptr->n_threads; +} + +GPTJ::~GPTJ() +{ + delete d_ptr->model; +} + +bool GPTJ::isModelLoaded() const +{ + return d_ptr->modelLoaded; +} + +size_t GPTJ::stateSize() const +{ + return gptj_get_state_size(*d_ptr->model); +} + +size_t GPTJ::saveState(uint8_t *dest) const +{ + return gptj_copy_state_data(*d_ptr->model, d_ptr->rng, dest); +} + +size_t GPTJ::restoreState(const uint8_t *src) +{ + return gptj_set_state_data(d_ptr->model, &d_ptr->rng, src); +} + +void GPTJ::prompt(const std::string &prompt, + std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &promptCtx) { + + if (!isModelLoaded()) { + std::cerr << "GPT-J ERROR: prompt won't work with an unloaded model!\n"; + return; + } + + const int64_t t_main_start_us = ggml_time_us(); + + int64_t t_sample_us = 0; + int64_t t_predict_us = 0; + int64_t t_prompt_us = 0; + + // tokenize the prompt + std::vector embd_inp = ::gpt_tokenize(d_ptr->vocab, prompt); + + // save the context size + promptCtx.n_ctx = d_ptr->model->hparams.n_ctx; + + if ((int) embd_inp.size() > promptCtx.n_ctx - 4) { + responseCallback(-1, "ERROR: The prompt size exceeds the context window size and cannot be processed."); + std::cerr << "GPT-J ERROR: The prompt is" << embd_inp.size() << + "tokens and the context window is" << promptCtx.n_ctx << "!\n"; + return; + } + + promptCtx.n_predict = std::min(promptCtx.n_predict, promptCtx.n_ctx - (int) embd_inp.size()); + promptCtx.n_past = std::min(promptCtx.n_past, promptCtx.n_ctx); + + // determine the required inference memory per token: + static 
bool initialized = false; + static std::vector p_instruct; + static std::vector r_instruct; + if (!initialized) { + gptj_eval(*d_ptr->model, d_ptr->n_threads, 0, { 0, 1, 2, 3 }, promptCtx.logits, + d_ptr->mem_per_token); + initialized = true; + } + + // process the prompt in batches + size_t i = 0; + const int64_t t_start_prompt_us = ggml_time_us(); + while (i < embd_inp.size()) { + size_t batch_end = std::min(i + promptCtx.n_batch, embd_inp.size()); + std::vector batch(embd_inp.begin() + i, embd_inp.begin() + batch_end); + + // Check if the context has run out... + if (promptCtx.n_past + batch.size() > promptCtx.n_ctx) { + const int32_t erasePoint = promptCtx.n_ctx * promptCtx.contextErase; + // Erase the first percentage of context from the tokens... + std::cerr << "GPTJ: reached the end of the context window so resizing\n"; + promptCtx.tokens.erase(promptCtx.tokens.begin(), promptCtx.tokens.begin() + erasePoint); + promptCtx.n_past = promptCtx.tokens.size(); + recalculateContext(promptCtx, recalculateCallback); + assert(promptCtx.n_past + batch.size() <= promptCtx.n_ctx); + } + + if (!gptj_eval(*d_ptr->model, d_ptr->n_threads, promptCtx.n_past, batch, promptCtx.logits, + d_ptr->mem_per_token)) { + std::cerr << "GPT-J ERROR: Failed to process prompt\n"; + return; + } + + size_t tokens = batch_end - i; + for (size_t t = 0; t < tokens; ++t) { + if (promptCtx.tokens.size() == promptCtx.n_ctx) + promptCtx.tokens.erase(promptCtx.tokens.begin()); + promptCtx.tokens.push_back(batch.at(t)); + if (!promptCallback(batch.at(t))) + return; + } + promptCtx.n_past += batch.size(); + i = batch_end; + } + t_prompt_us += ggml_time_us() - t_start_prompt_us; + + int p_instructFound = 0; + int r_instructFound = 0; + + std::string cachedResponse; + std::vector cachedTokens; + std::unordered_set reversePrompts + = { "### Instruction", "### Prompt", "### Response", "### Human", "### Assistant" }; + + // predict next tokens + int32_t totalPredictions = 0; + for (int i = 0; i < 
promptCtx.n_predict; i++) { + + // sample next token + const int n_vocab = d_ptr->model->hparams.n_vocab; + gpt_vocab::id id = 0; + { + const int64_t t_start_sample_us = ggml_time_us(); + id = gpt_sample_top_k_top_p(d_ptr->vocab, + promptCtx.tokens.data() + promptCtx.n_ctx - promptCtx.n_ctx, + promptCtx.n_ctx, + promptCtx.logits, + promptCtx.top_k, promptCtx.top_p, promptCtx.temp, + promptCtx.repeat_penalty, + d_ptr->rng); + + t_sample_us += ggml_time_us() - t_start_sample_us; + } + + // Check if the context has run out... + if (promptCtx.n_past + 1 > promptCtx.n_ctx) { + const int32_t erasePoint = promptCtx.n_ctx * promptCtx.contextErase; + // Erase the first percentage of context from the tokens... + std::cerr << "GPTJ: reached the end of the context window so resizing\n"; + promptCtx.tokens.erase(promptCtx.tokens.begin(), promptCtx.tokens.begin() + erasePoint); + promptCtx.n_past = promptCtx.tokens.size(); + recalculateContext(promptCtx, recalculateCallback); + assert(promptCtx.n_past + 1 <= promptCtx.n_ctx); + } + + const int64_t t_start_predict_us = ggml_time_us(); + if (!gptj_eval(*d_ptr->model, d_ptr->n_threads, promptCtx.n_past, { id }, promptCtx.logits, + d_ptr->mem_per_token)) { + std::cerr << "GPT-J ERROR: Failed to predict next token\n"; + return; + } + t_predict_us += ggml_time_us() - t_start_predict_us; + + promptCtx.n_past += 1; + // display text + ++totalPredictions; + + if (id == 50256 /*end of text*/) + goto stop_generating; + + const std::string str = d_ptr->vocab.id_to_token[id]; + + // Check if the provided str is part of our reverse prompts + bool foundPartialReversePrompt = false; + const std::string completed = cachedResponse + str; + if (reversePrompts.find(completed) != reversePrompts.end()) { + goto stop_generating; + } + + // Check if it partially matches our reverse prompts and if so, cache + for (auto s : reversePrompts) { + if (s.compare(0, completed.size(), completed) == 0) { + foundPartialReversePrompt = true; + cachedResponse = 
completed; + break; + } + } + + // Regardless the token gets added to our cache + cachedTokens.push_back(id); + + // Continue if we have found a partial match + if (foundPartialReversePrompt) + continue; + + // Empty the cache + for (auto t : cachedTokens) { + if (promptCtx.tokens.size() == promptCtx.n_ctx) + promptCtx.tokens.erase(promptCtx.tokens.begin()); + promptCtx.tokens.push_back(t); + if (!responseCallback(t, d_ptr->vocab.id_to_token[t])) + goto stop_generating; + } + cachedTokens.clear(); + } + +stop_generating: + +#if 0 + // report timing + { + const int64_t t_main_end_us = ggml_time_us(); + + std::cout << "GPT-J INFO: mem per token = " << mem_per_token << " bytes\n"; + std::cout << "GPT-J INFO: sample time = " << t_sample_us/1000.0f << " ms\n"; + std::cout << "GPT-J INFO: prompt time = " << t_prompt_us/1000.0f << " ms\n"; + std::cout << "GPT-J INFO: predict time = " << t_predict_us/1000.0f << " ms / " << t_predict_us/1000.0f/totalPredictions << " ms per token\n"; + std::cout << "GPT-J INFO: total time = " << (t_main_end_us - t_main_start_us)/1000.0f << " ms\n"; + fflush(stdout); + } +#endif + + return; +} + +void GPTJ::recalculateContext(PromptContext &promptCtx, std::function recalculate) +{ + size_t i = 0; + promptCtx.n_past = 0; + while (i < promptCtx.tokens.size()) { + size_t batch_end = std::min(i + promptCtx.n_batch, promptCtx.tokens.size()); + std::vector batch(promptCtx.tokens.begin() + i, promptCtx.tokens.begin() + batch_end); + + assert(promptCtx.n_past + batch.size() <= promptCtx.n_ctx); + + if (!gptj_eval(*d_ptr->model, d_ptr->n_threads, promptCtx.n_past, batch, promptCtx.logits, + d_ptr->mem_per_token)) { + std::cerr << "GPTJ ERROR: Failed to process prompt\n"; + goto stop_generating; + } + promptCtx.n_past += batch.size(); + if (!recalculate(true)) + goto stop_generating; + i = batch_end; + } + assert(promptCtx.n_past == promptCtx.tokens.size()); + +stop_generating: + recalculate(false); +} diff --git a/gpt4all-chat/llmodel/gptj.h 
b/gpt4all-chat/llmodel/gptj.h new file mode 100644 index 00000000..3109c1da --- /dev/null +++ b/gpt4all-chat/llmodel/gptj.h @@ -0,0 +1,36 @@ +#ifndef GPTJ_H +#define GPTJ_H + +#include +#include +#include +#include "llmodel.h" + +class GPTJPrivate; +class GPTJ : public LLModel { +public: + GPTJ(); + ~GPTJ(); + + bool loadModel(const std::string &modelPath) override; + bool isModelLoaded() const override; + size_t stateSize() const override; + size_t saveState(uint8_t *dest) const override; + size_t restoreState(const uint8_t *src) override; + void prompt(const std::string &prompt, + std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &ctx) override; + void setThreadCount(int32_t n_threads) override; + int32_t threadCount() override; + +protected: + void recalculateContext(PromptContext &promptCtx, + std::function recalculate) override; + +private: + GPTJPrivate *d_ptr; +}; + +#endif // GPTJ_H diff --git a/gpt4all-chat/llmodel/llama.cpp b/gpt4all-chat/llmodel/llama.cpp new file mode 160000 index 00000000..03ceb39c --- /dev/null +++ b/gpt4all-chat/llmodel/llama.cpp @@ -0,0 +1 @@ +Subproject commit 03ceb39c1e729bed4ad1dfa16638a72f1843bf0c diff --git a/gpt4all-chat/llmodel/llamamodel.cpp b/gpt4all-chat/llmodel/llamamodel.cpp new file mode 100644 index 00000000..272633c7 --- /dev/null +++ b/gpt4all-chat/llmodel/llamamodel.cpp @@ -0,0 +1,260 @@ +#include "llamamodel.h" + +#include "llama.cpp/examples/common.h" +#include "llama.cpp/llama.h" +#include "llama.cpp/ggml.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +struct LLamaPrivate { + const std::string modelPath; + bool modelLoaded; + llama_context *ctx = nullptr; + llama_context_params params; + int64_t n_threads = 0; +}; + +LLamaModel::LLamaModel() + : d_ptr(new LLamaPrivate) { + + d_ptr->modelLoaded = false; +} + +bool LLamaModel::loadModel(const std::string 
&modelPath) +{ + // load the model + d_ptr->params = llama_context_default_params(); + + gpt_params params; + d_ptr->params.n_ctx = 2048; + d_ptr->params.n_parts = params.n_parts; + d_ptr->params.seed = params.seed; + d_ptr->params.f16_kv = params.memory_f16; + d_ptr->params.use_mmap = params.use_mmap; + d_ptr->params.use_mlock = params.use_mlock; + + d_ptr->ctx = llama_init_from_file(modelPath.c_str(), d_ptr->params); + if (!d_ptr->ctx) { + std::cerr << "LLAMA ERROR: failed to load model from " << modelPath << std::endl; + return false; + } + + d_ptr->n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency()); + d_ptr->modelLoaded = true; + fflush(stderr); + return true; +} + +void LLamaModel::setThreadCount(int32_t n_threads) { + d_ptr->n_threads = n_threads; +} + +int32_t LLamaModel::threadCount() { + return d_ptr->n_threads; +} + +LLamaModel::~LLamaModel() +{ + llama_free(d_ptr->ctx); +} + +bool LLamaModel::isModelLoaded() const +{ + return d_ptr->modelLoaded; +} + +size_t LLamaModel::stateSize() const +{ + return llama_get_state_size(d_ptr->ctx); +} + +size_t LLamaModel::saveState(uint8_t *dest) const +{ + return llama_copy_state_data(d_ptr->ctx, dest); +} + +size_t LLamaModel::restoreState(const uint8_t *src) +{ + return llama_set_state_data(d_ptr->ctx, src); +} + +void LLamaModel::prompt(const std::string &prompt, + std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &promptCtx) { + + if (!isModelLoaded()) { + std::cerr << "LLAMA ERROR: prompt won't work with an unloaded model!\n"; + return; + } + + gpt_params params; + params.prompt = prompt; + + // Add a space in front of the first character to match OG llama tokenizer behavior + params.prompt.insert(0, 1, ' '); + + // tokenize the prompt + auto embd_inp = ::llama_tokenize(d_ptr->ctx, params.prompt, false); + + // save the context size + promptCtx.n_ctx = llama_n_ctx(d_ptr->ctx); + + if ((int) embd_inp.size() > promptCtx.n_ctx - 
4) { + responseCallback(-1, "The prompt size exceeds the context window size and cannot be processed."); + std::cerr << "LLAMA ERROR: The prompt is" << embd_inp.size() << + "tokens and the context window is" << promptCtx.n_ctx << "!\n"; + return; + } + + promptCtx.n_predict = std::min(promptCtx.n_predict, promptCtx.n_ctx - (int) embd_inp.size()); + promptCtx.n_past = std::min(promptCtx.n_past, promptCtx.n_ctx); + + // number of tokens to keep when resetting context + params.n_keep = (int)embd_inp.size(); + + // process the prompt in batches + size_t i = 0; + const int64_t t_start_prompt_us = ggml_time_us(); + while (i < embd_inp.size()) { + size_t batch_end = std::min(i + promptCtx.n_batch, embd_inp.size()); + std::vector batch(embd_inp.begin() + i, embd_inp.begin() + batch_end); + + // Check if the context has run out... + if (promptCtx.n_past + batch.size() > promptCtx.n_ctx) { + const int32_t erasePoint = promptCtx.n_ctx * promptCtx.contextErase; + // Erase the first percentage of context from the tokens... 
+ std::cerr << "LLAMA: reached the end of the context window so resizing\n"; + promptCtx.tokens.erase(promptCtx.tokens.begin(), promptCtx.tokens.begin() + erasePoint); + promptCtx.n_past = promptCtx.tokens.size(); + recalculateContext(promptCtx, recalculateCallback); + assert(promptCtx.n_past + batch.size() <= promptCtx.n_ctx); + } + + if (llama_eval(d_ptr->ctx, batch.data(), batch.size(), promptCtx.n_past, d_ptr->n_threads)) { + std::cerr << "LLAMA ERROR: Failed to process prompt\n"; + return; + } + + size_t tokens = batch_end - i; + for (size_t t = 0; t < tokens; ++t) { + if (promptCtx.tokens.size() == promptCtx.n_ctx) + promptCtx.tokens.erase(promptCtx.tokens.begin()); + promptCtx.tokens.push_back(batch.at(t)); + if (!promptCallback(batch.at(t))) + return; + } + promptCtx.n_past += batch.size(); + i = batch_end; + } + + std::string cachedResponse; + std::vector cachedTokens; + std::unordered_set reversePrompts + = { "### Instruction", "### Prompt", "### Response", "### Human", "### Assistant" }; + + // predict next tokens + int32_t totalPredictions = 0; + for (int i = 0; i < promptCtx.n_predict; i++) { + // sample next token + llama_token id = llama_sample_top_p_top_k(d_ptr->ctx, + promptCtx.tokens.data() + promptCtx.n_ctx - promptCtx.repeat_last_n, + promptCtx.repeat_last_n, promptCtx.top_k, promptCtx.top_p, promptCtx.temp, + promptCtx.repeat_penalty); + + // Check if the context has run out... + if (promptCtx.n_past + 1 > promptCtx.n_ctx) { + const int32_t erasePoint = promptCtx.n_ctx * promptCtx.contextErase; + // Erase the first percentage of context from the tokens... 
+ std::cerr << "LLAMA: reached the end of the context window so resizing\n"; + promptCtx.tokens.erase(promptCtx.tokens.begin(), promptCtx.tokens.begin() + erasePoint); + promptCtx.n_past = promptCtx.tokens.size(); + recalculateContext(promptCtx, recalculateCallback); + assert(promptCtx.n_past + 1 <= promptCtx.n_ctx); + } + + if (llama_eval(d_ptr->ctx, &id, 1, promptCtx.n_past, d_ptr->n_threads)) { + std::cerr << "LLAMA ERROR: Failed to predict next token\n"; + return; + } + + promptCtx.n_past += 1; + // display text + ++totalPredictions; + if (id == llama_token_eos()) + return; + + const std::string str = llama_token_to_str(d_ptr->ctx, id); + + // Check if the provided str is part of our reverse prompts + bool foundPartialReversePrompt = false; + const std::string completed = cachedResponse + str; + if (reversePrompts.find(completed) != reversePrompts.end()) { + return; + } + + // Check if it partially matches our reverse prompts and if so, cache + for (auto s : reversePrompts) { + if (s.compare(0, completed.size(), completed) == 0) { + foundPartialReversePrompt = true; + cachedResponse = completed; + break; + } + } + + // Regardless the token gets added to our cache + cachedTokens.push_back(id); + + // Continue if we have found a partial match + if (foundPartialReversePrompt) + continue; + + // Empty the cache + for (auto t : cachedTokens) { + if (promptCtx.tokens.size() == promptCtx.n_ctx) + promptCtx.tokens.erase(promptCtx.tokens.begin()); + promptCtx.tokens.push_back(t); + if (!responseCallback(t, llama_token_to_str(d_ptr->ctx, t))) + return; + } + cachedTokens.clear(); + } +} + +void LLamaModel::recalculateContext(PromptContext &promptCtx, std::function recalculate) +{ + size_t i = 0; + promptCtx.n_past = 0; + while (i < promptCtx.tokens.size()) { + size_t batch_end = std::min(i + promptCtx.n_batch, promptCtx.tokens.size()); + std::vector batch(promptCtx.tokens.begin() + i, promptCtx.tokens.begin() + batch_end); + + assert(promptCtx.n_past + batch.size() <= 
promptCtx.n_ctx); + + if (llama_eval(d_ptr->ctx, batch.data(), batch.size(), promptCtx.n_past, d_ptr->n_threads)) { + std::cerr << "LLAMA ERROR: Failed to process prompt\n"; + goto stop_generating; + } + promptCtx.n_past += batch.size(); + if (!recalculate(true)) + goto stop_generating; + i = batch_end; + } + assert(promptCtx.n_past == promptCtx.tokens.size()); + +stop_generating: + recalculate(false); +} diff --git a/gpt4all-chat/llmodel/llamamodel.h b/gpt4all-chat/llmodel/llamamodel.h new file mode 100644 index 00000000..7f487803 --- /dev/null +++ b/gpt4all-chat/llmodel/llamamodel.h @@ -0,0 +1,36 @@ +#ifndef LLAMAMODEL_H +#define LLAMAMODEL_H + +#include +#include +#include +#include "llmodel.h" + +class LLamaPrivate; +class LLamaModel : public LLModel { +public: + LLamaModel(); + ~LLamaModel(); + + bool loadModel(const std::string &modelPath) override; + bool isModelLoaded() const override; + size_t stateSize() const override; + size_t saveState(uint8_t *dest) const override; + size_t restoreState(const uint8_t *src) override; + void prompt(const std::string &prompt, + std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &ctx) override; + void setThreadCount(int32_t n_threads) override; + int32_t threadCount() override; + +protected: + void recalculateContext(PromptContext &promptCtx, + std::function recalculate) override; + +private: + LLamaPrivate *d_ptr; +}; + +#endif // LLAMAMODEL_H \ No newline at end of file diff --git a/gpt4all-chat/llmodel/llmodel.h b/gpt4all-chat/llmodel/llmodel.h new file mode 100644 index 00000000..5e254ab5 --- /dev/null +++ b/gpt4all-chat/llmodel/llmodel.h @@ -0,0 +1,47 @@ +#ifndef LLMODEL_H +#define LLMODEL_H + +#include +#include +#include +#include + +class LLModel { +public: + explicit LLModel() {} + virtual ~LLModel() {} + + virtual bool loadModel(const std::string &modelPath) = 0; + virtual bool isModelLoaded() const = 0; + virtual size_t stateSize() const { return 
0; } + virtual size_t saveState(uint8_t *dest) const { return 0; } + virtual size_t restoreState(const uint8_t *src) { return 0; } + struct PromptContext { + std::vector logits; // logits of current context + std::vector tokens; // current tokens in the context window + int32_t n_past = 0; // number of tokens in past conversation + int32_t n_ctx = 0; // number of tokens possible in context window + int32_t n_predict = 200; + int32_t top_k = 40; + float top_p = 0.9f; + float temp = 0.9f; + int32_t n_batch = 9; + float repeat_penalty = 1.10f; + int32_t repeat_last_n = 64; // last n tokens to penalize + float contextErase = 0.75f; // percent of context to erase if we exceed the context + // window + }; + virtual void prompt(const std::string &prompt, + std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &ctx) = 0; + virtual void setThreadCount(int32_t n_threads) {} + virtual int32_t threadCount() { return 1; } + +protected: + virtual void recalculateContext(PromptContext &promptCtx, + std::function recalculate) = 0; +}; + +#endif // LLMODEL_H diff --git a/gpt4all-chat/llmodel/llmodel_c.cpp b/gpt4all-chat/llmodel/llmodel_c.cpp new file mode 100644 index 00000000..4361a900 --- /dev/null +++ b/gpt4all-chat/llmodel/llmodel_c.cpp @@ -0,0 +1,161 @@ +#include "llmodel_c.h" + +#include "gptj.h" +#include "llamamodel.h" +#include "mpt.h" + +struct LLModelWrapper { + LLModel *llModel = nullptr; + LLModel::PromptContext promptContext; +}; + +llmodel_model llmodel_gptj_create() +{ + LLModelWrapper *wrapper = new LLModelWrapper; + wrapper->llModel = new GPTJ; + return reinterpret_cast(wrapper); +} + +void llmodel_gptj_destroy(llmodel_model gptj) +{ + LLModelWrapper *wrapper = reinterpret_cast(gptj); + delete wrapper->llModel; + delete wrapper; +} + +llmodel_model llmodel_mpt_create() +{ + LLModelWrapper *wrapper = new LLModelWrapper; + wrapper->llModel = new MPT; + return reinterpret_cast(wrapper); +} + +void 
llmodel_mpt_destroy(llmodel_model mpt) +{ + LLModelWrapper *wrapper = reinterpret_cast(mpt); + delete wrapper->llModel; + delete wrapper; +} + +llmodel_model llmodel_llama_create() +{ + LLModelWrapper *wrapper = new LLModelWrapper; + wrapper->llModel = new LLamaModel; + return reinterpret_cast(wrapper); +} + +void llmodel_llama_destroy(llmodel_model llama) +{ + LLModelWrapper *wrapper = reinterpret_cast(llama); + delete wrapper->llModel; + delete wrapper; +} + +bool llmodel_loadModel(llmodel_model model, const char *model_path) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + return wrapper->llModel->loadModel(model_path); +} + +bool llmodel_isModelLoaded(llmodel_model model) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + return wrapper->llModel->isModelLoaded(); +} + +uint64_t llmodel_get_state_size(llmodel_model model) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + return wrapper->llModel->stateSize(); +} + +uint64_t llmodel_save_state_data(llmodel_model model, uint8_t *dest) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + return wrapper->llModel->saveState(dest); +} + +uint64_t llmodel_restore_state_data(llmodel_model model, const uint8_t *src) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + return wrapper->llModel->restoreState(src); +} + +// Wrapper functions for the C callbacks +bool prompt_wrapper(int32_t token_id, void *user_data) { + llmodel_prompt_callback callback = reinterpret_cast(user_data); + return callback(token_id); +} + +bool response_wrapper(int32_t token_id, const std::string &response, void *user_data) { + llmodel_response_callback callback = reinterpret_cast(user_data); + return callback(token_id, response.c_str()); +} + +bool recalculate_wrapper(bool is_recalculating, void *user_data) { + llmodel_recalculate_callback callback = reinterpret_cast(user_data); + return callback(is_recalculating); +} + +void llmodel_prompt(llmodel_model model, const char *prompt, + llmodel_response_callback 
prompt_callback, + llmodel_response_callback response_callback, + llmodel_recalculate_callback recalculate_callback, + llmodel_prompt_context *ctx) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + + // Create std::function wrappers that call the C function pointers + std::function prompt_func = + std::bind(&prompt_wrapper, std::placeholders::_1, reinterpret_cast(prompt_callback)); + std::function response_func = + std::bind(&response_wrapper, std::placeholders::_1, std::placeholders::_2, reinterpret_cast(response_callback)); + std::function recalc_func = + std::bind(&recalculate_wrapper, std::placeholders::_1, reinterpret_cast(recalculate_callback)); + + // Copy the C prompt context + wrapper->promptContext.n_past = ctx->n_past; + wrapper->promptContext.n_ctx = ctx->n_ctx; + wrapper->promptContext.n_predict = ctx->n_predict; + wrapper->promptContext.top_k = ctx->top_k; + wrapper->promptContext.top_p = ctx->top_p; + wrapper->promptContext.temp = ctx->temp; + wrapper->promptContext.n_batch = ctx->n_batch; + wrapper->promptContext.repeat_penalty = ctx->repeat_penalty; + wrapper->promptContext.repeat_last_n = ctx->repeat_last_n; + wrapper->promptContext.contextErase = ctx->context_erase; + + // Call the C++ prompt method + wrapper->llModel->prompt(prompt, prompt_func, response_func, recalc_func, wrapper->promptContext); + + // Update the C context by giving access to the wrappers raw pointers to std::vector data + // which involves no copies + ctx->logits = wrapper->promptContext.logits.data(); + ctx->logits_size = wrapper->promptContext.logits.size(); + ctx->tokens = wrapper->promptContext.tokens.data(); + ctx->tokens_size = wrapper->promptContext.tokens.size(); + + // Update the rest of the C prompt context + ctx->n_past = wrapper->promptContext.n_past; + ctx->n_ctx = wrapper->promptContext.n_ctx; + ctx->n_predict = wrapper->promptContext.n_predict; + ctx->top_k = wrapper->promptContext.top_k; + ctx->top_p = wrapper->promptContext.top_p; + ctx->temp = 
wrapper->promptContext.temp; + ctx->n_batch = wrapper->promptContext.n_batch; + ctx->repeat_penalty = wrapper->promptContext.repeat_penalty; + ctx->repeat_last_n = wrapper->promptContext.repeat_last_n; + ctx->context_erase = wrapper->promptContext.contextErase; +} + +void llmodel_setThreadCount(llmodel_model model, int32_t n_threads) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + wrapper->llModel->setThreadCount(n_threads); +} + +int32_t llmodel_threadCount(llmodel_model model) +{ + LLModelWrapper *wrapper = reinterpret_cast(model); + return wrapper->llModel->threadCount(); +} diff --git a/gpt4all-chat/llmodel/llmodel_c.h b/gpt4all-chat/llmodel/llmodel_c.h new file mode 100644 index 00000000..f45bdd8d --- /dev/null +++ b/gpt4all-chat/llmodel/llmodel_c.h @@ -0,0 +1,172 @@ +#ifndef LLMODEL_C_H +#define LLMODEL_C_H + +#include +#include +#include + +#ifdef __cplusplus +extern "C" { +#endif + +/** + * Opaque pointer to the underlying model. + */ +typedef void *llmodel_model; + +/** + * llmodel_prompt_context structure for holding the prompt context. + * NOTE: The implementation takes care of all the memory handling of the raw logits pointer and the + * raw tokens pointer. Attempting to resize them or modify them in any way can lead to undefined + * behavior. 
+ */ +typedef struct { + float *logits; // logits of current context + size_t logits_size; // the size of the raw logits vector + int32_t *tokens; // current tokens in the context window + size_t tokens_size; // the size of the raw tokens vector + int32_t n_past; // number of tokens in past conversation + int32_t n_ctx; // number of tokens possible in context window + int32_t n_predict; // number of tokens to predict + int32_t top_k; // top k logits to sample from + float top_p; // nucleus sampling probability threshold + float temp; // temperature to adjust model's output distribution + int32_t n_batch; // number of predictions to generate in parallel + float repeat_penalty; // penalty factor for repeated tokens + int32_t repeat_last_n; // last n tokens to penalize + float context_erase; // percent of context to erase if we exceed the context window +} llmodel_prompt_context; + +/** + * Callback type for prompt processing. + * @param token_id The token id of the prompt. + * @return a bool indicating whether the model should keep processing. + */ +typedef bool (*llmodel_prompt_callback)(int32_t token_id); + +/** + * Callback type for response. + * @param token_id The token id of the response. + * @param response The response string. NOTE: a token_id of -1 indicates the string is an error string. + * @return a bool indicating whether the model should keep generating. + */ +typedef bool (*llmodel_response_callback)(int32_t token_id, const char *response); + +/** + * Callback type for recalculation of context. + * @param whether the model is recalculating the context. + * @return a bool indicating whether the model should keep generating. + */ +typedef bool (*llmodel_recalculate_callback)(bool is_recalculating); + +/** + * Create a GPTJ instance. + * @return A pointer to the GPTJ instance. + */ +llmodel_model llmodel_gptj_create(); + +/** + * Destroy a GPTJ instance. + * @param gptj A pointer to the GPTJ instance. 
+ */ +void llmodel_gptj_destroy(llmodel_model gptj); + +/** + * Create a MPT instance. + * @return A pointer to the MPT instance. + */ +llmodel_model llmodel_mpt_create(); + +/** + * Destroy a MPT instance. + * @param gptj A pointer to the MPT instance. + */ +void llmodel_mpt_destroy(llmodel_model mpt); + +/** + * Create a LLAMA instance. + * @return A pointer to the LLAMA instance. + */ +llmodel_model llmodel_llama_create(); + +/** + * Destroy a LLAMA instance. + * @param llama A pointer to the LLAMA instance. + */ +void llmodel_llama_destroy(llmodel_model llama); + +/** + * Load a model from a file. + * @param model A pointer to the llmodel_model instance. + * @param model_path A string representing the path to the model file. + * @return true if the model was loaded successfully, false otherwise. + */ +bool llmodel_loadModel(llmodel_model model, const char *model_path); + +/** + * Check if a model is loaded. + * @param model A pointer to the llmodel_model instance. + * @return true if the model is loaded, false otherwise. + */ +bool llmodel_isModelLoaded(llmodel_model model); + +/** + * Get the size of the internal state of the model. + * NOTE: This state data is specific to the type of model you have created. + * @param model A pointer to the llmodel_model instance. + * @return the size in bytes of the internal state of the model + */ +uint64_t llmodel_get_state_size(llmodel_model model); + +/** + * Saves the internal state of the model to the specified destination address. + * NOTE: This state data is specific to the type of model you have created. + * @param model A pointer to the llmodel_model instance. + * @param dest A pointer to the destination. + * @return the number of bytes copied + */ +uint64_t llmodel_save_state_data(llmodel_model model, uint8_t *dest); + +/** + * Restores the internal state of the model using data from the specified address. + * NOTE: This state data is specific to the type of model you have created. 
+ * @param model A pointer to the llmodel_model instance. + * @param src A pointer to the src. + * @return the number of bytes read + */ +uint64_t llmodel_restore_state_data(llmodel_model model, const uint8_t *src); + +/** + * Generate a response using the model. + * @param model A pointer to the llmodel_model instance. + * @param prompt A string representing the input prompt. + * @param prompt_callback A callback function for handling the processing of prompt. + * @param response_callback A callback function for handling the generated response. + * @param recalculate_callback A callback function for handling recalculation requests. + * @param ctx A pointer to the llmodel_prompt_context structure. + */ +void llmodel_prompt(llmodel_model model, const char *prompt, + llmodel_response_callback prompt_callback, + llmodel_response_callback response_callback, + llmodel_recalculate_callback recalculate_callback, + llmodel_prompt_context *ctx); + +/** + * Set the number of threads to be used by the model. + * @param model A pointer to the llmodel_model instance. + * @param n_threads The number of threads to be used. + */ +void llmodel_setThreadCount(llmodel_model model, int32_t n_threads); + +/** + * Get the number of threads currently being used by the model. + * @param model A pointer to the llmodel_model instance. + * @return The number of threads currently being used. 
+ */ +int32_t llmodel_threadCount(llmodel_model model); + +#ifdef __cplusplus +} +#endif + +#endif // LLMODEL_C_H diff --git a/gpt4all-chat/llmodel/mpt.cpp b/gpt4all-chat/llmodel/mpt.cpp new file mode 100644 index 00000000..1a5ce612 --- /dev/null +++ b/gpt4all-chat/llmodel/mpt.cpp @@ -0,0 +1,1240 @@ +#include "mpt.h" +#include "llama.cpp/ggml.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +static const size_t MB = 1024*1024; + +// default hparams (MPT 7B) +struct mpt_hparams { + int32_t n_vocab = 50432; + int32_t n_ctx = 2048; + int32_t n_embd = 4096; + int32_t n_head = 32; + int32_t n_layer = 32; + float alibi_bias_max = 8; + float clip_qkv = 0; + int32_t expand = 4; + int32_t f16 = 1; +}; + +struct mpt_layer { + // normalization + struct ggml_tensor * norm_1_w; + struct ggml_tensor * norm_2_w; + + // attention + struct ggml_tensor * attn_Wqkv_w; + struct ggml_tensor * attn_out_proj_w; + + // ff + struct ggml_tensor * ffn_up_proj_w; + struct ggml_tensor * ffn_down_proj_w; +}; + +struct mpt_buffer { + uint8_t * addr = NULL; + size_t size = 0; + + void resize(size_t size) { + delete[] addr; + addr = new uint8_t[size]; + this->size = size; + } + + ~mpt_buffer() { + fflush(stdout); + delete[] addr; + } +}; + +struct mpt_kv_cache { + struct ggml_tensor * k; + struct ggml_tensor * v; + + struct ggml_context * ctx = NULL; + + mpt_buffer buf; + + int n; // number of tokens currently in the cache + + ~mpt_kv_cache() { + if (ctx) { + ggml_free(ctx); + } + } +}; + +struct mpt_model { + mpt_hparams hparams; + + // normalization + struct ggml_tensor * norm_f_w; + + struct ggml_tensor * wte; // position embedding + + // mpt does weight tying + + std::vector layers; + + struct mpt_kv_cache kv_self; + struct ggml_context * ctx; + std::map tensors; + + + mpt_buffer buf; + + ~mpt_model() { + if (ctx) { + ggml_free(ctx); + } + } +}; + +static bool kv_cache_init( + const 
struct mpt_hparams & hparams, + struct mpt_kv_cache & cache, + ggml_type wtype, + int n_ctx) { + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + + const int64_t n_mem = (int64_t)n_layer*n_ctx; + const int64_t n_elements = n_embd*n_mem; + + cache.buf.resize(2u*n_elements*ggml_type_size(wtype) + 2u*MB); + + struct ggml_init_params params; + params.mem_size = cache.buf.size; + params.mem_buffer = cache.buf.addr; + params.no_alloc = false; + + cache.ctx = ggml_init(params); + + if (!cache.ctx) { + fprintf(stderr, "%s: failed to allocate memory for kv cache\n", __func__); + return false; + } + + cache.k = ggml_new_tensor_1d(cache.ctx, wtype, n_elements); + cache.v = ggml_new_tensor_1d(cache.ctx, wtype, n_elements); + + return true; +} + +struct mpt_vocab { + using id = int32_t; + using token = std::string; + + std::map token_to_id; + std::map id_to_token; + std::vector special_tokens; + + void add_special_token(const std::string &token) { + special_tokens.push_back(token); + } +}; + +std::string regex_escape(const std::string &s) { + static const std::regex metacharacters(R"([\.\^\$\-\+\(\)\[\]\{\}\|\?\*])"); + return std::regex_replace(s, metacharacters, "\\$&"); +} + +// load the model's weights from a stream +bool mpt_model_load(const std::string &fname, std::istream &fin, mpt_model & model, mpt_vocab & vocab) { + printf("%s: loading model from '%s' - please wait ...\n", __func__, fname.c_str()); + + // verify magic + { + uint32_t magic; + fin.read((char *) &magic, sizeof(magic)); + if (magic != 0x67676d6d) { + fprintf(stderr, "%s: invalid model file '%s' (bad magic)\n", __func__, fname.c_str()); + return false; + } + } + + // load hparams + { + auto & hparams = model.hparams; + + fin.read((char *) &hparams.n_vocab, sizeof(hparams.n_vocab)); + fin.read((char *) &hparams.n_ctx, sizeof(hparams.n_ctx)); + fin.read((char *) &hparams.n_layer, sizeof(hparams.n_layer)); + fin.read((char *) &hparams.n_head, sizeof(hparams.n_head)); + 
fin.read((char *) &hparams.n_embd, sizeof(hparams.n_embd)); + fin.read((char *) &hparams.alibi_bias_max, sizeof(hparams.alibi_bias_max)); + fin.read((char *) &hparams.clip_qkv, sizeof(hparams.clip_qkv)); + fin.read((char *) &hparams.f16, sizeof(hparams.f16)); + + printf("%s: n_vocab = %d\n", __func__, hparams.n_vocab); + printf("%s: n_ctx = %d\n", __func__, hparams.n_ctx); + printf("%s: n_embd = %d\n", __func__, hparams.n_embd); + printf("%s: n_head = %d\n", __func__, hparams.n_head); + printf("%s: n_layer = %d\n", __func__, hparams.n_layer); + printf("%s: alibi_bias_max = %f\n", __func__, hparams.alibi_bias_max); + printf("%s: clip_qkv = %f\n", __func__, hparams.clip_qkv); + printf("%s: ftype = %d\n", __func__, hparams.f16); + } + + // load vocab + { + int32_t n_vocab = model.hparams.n_vocab; + fin.read((char *) &n_vocab, sizeof(n_vocab)); + + if (n_vocab != model.hparams.n_vocab) { + fprintf(stderr, "%s: invalid model file '%s' (bad vocab size %d != %d)\n", + __func__, fname.c_str(), n_vocab, model.hparams.n_vocab); + return false; + } + + std::string word; + for (int i = 0; i < n_vocab; i++) { + uint32_t len; + fin.read((char *) &len, sizeof(len)); + bool special = false; + if (len & (1<<31)) { + len = len &~ (1<<31); + special = true; + } + + if (len > 0) { + word.resize(len); + fin.read((char *) word.data(), len); + vocab.token_to_id[word] = i; + vocab.id_to_token[i] = word; + } + + // TODO: this only kind-of works, the gpt_tokenize can still incorrectly + // tokenize special tokens + if(special) { + vocab.add_special_token(word); + } + } + } + + // for the big tensors, we have the option to store the data in 16-bit floats or quantized + // in order to save memory and also to speed up the computation + ggml_type wtype = GGML_TYPE_COUNT; + switch (model.hparams.f16) { + case 0: wtype = GGML_TYPE_F32; break; + case 1: wtype = GGML_TYPE_F16; break; + case 2: wtype = GGML_TYPE_Q4_0; break; + case 3: wtype = GGML_TYPE_Q4_1; break; + case 5: wtype = GGML_TYPE_Q4_2; 
break; + default: + { + fprintf(stderr, "%s: invalid model file '%s' (bad f16 value %d)\n", + __func__, fname.c_str(), model.hparams.f16); + return false; + } + } + + auto & ctx = model.ctx; + + size_t ctx_size = 0; + + { + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + const int n_vocab = hparams.n_vocab; + const int expand = hparams.expand; + + + ctx_size += n_embd*ggml_type_sizef(GGML_TYPE_F32); // ln_f_w + + ctx_size += n_embd*n_vocab*ggml_type_sizef(GGML_TYPE_F32); // wte + + ctx_size += n_layer*(n_embd*ggml_type_sizef(GGML_TYPE_F32)); // norm_1_w + ctx_size += n_layer*(n_embd*ggml_type_sizef(GGML_TYPE_F32)); // norm_2_w + + ctx_size += n_layer*(3*n_embd*n_embd*ggml_type_sizef(wtype)); // attn_Wqkv_w + ctx_size += n_layer*(n_embd*n_embd*ggml_type_sizef(wtype)); // attn_out_proj_w + + ctx_size += n_layer*(expand*n_embd*n_embd*ggml_type_sizef(wtype)); // ffn_up_proj_w + ctx_size += n_layer*(expand*n_embd*n_embd*ggml_type_sizef(wtype)); // ffn_down_proj_w + + ctx_size += n_ctx*n_layer*n_embd*ggml_type_sizef(GGML_TYPE_F16); // memory_k + ctx_size += n_ctx*n_layer*n_embd*ggml_type_sizef(GGML_TYPE_F16); // memory_v + + // TODO probably less now? 
+ ctx_size += (5 + 10*n_layer)*256; // object overhead + + printf("%s: ggml ctx size = %6.2f MB\n", __func__, ctx_size/(1024.0*1024.0)); + } + + // create the ggml context + { + struct ggml_init_params params = { + .mem_size = ctx_size, + .mem_buffer = NULL, + .no_alloc = false, + }; + + model.ctx = ggml_init(params); + if (!model.ctx) { + fprintf(stderr, "%s: ggml_init() failed\n", __func__); + return false; + } + } + + // prepare memory for the weights + { + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + const int n_vocab = hparams.n_vocab; + const int expand = hparams.expand; + + model.layers.resize(n_layer); + + model.wte = ggml_new_tensor_2d(ctx, GGML_TYPE_F32, n_embd, n_vocab); + model.norm_f_w = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + + // map by name + model.tensors["transformer.wte.weight"] = model.wte; + model.tensors["transformer.norm_f.weight"] = model.norm_f_w; + + for (int i = 0; i < n_layer; ++i) { + auto & layer = model.layers[i]; + + layer.norm_1_w = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + layer.norm_2_w = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd); + + layer.attn_Wqkv_w = ggml_new_tensor_2d(ctx, wtype, n_embd, n_embd * 3); + layer.attn_out_proj_w = ggml_new_tensor_2d(ctx, wtype, n_embd, n_embd); + layer.ffn_up_proj_w = ggml_new_tensor_2d(ctx, wtype, n_embd, expand*n_embd); + layer.ffn_down_proj_w = ggml_new_tensor_2d(ctx, wtype, expand*n_embd, n_embd); + + // map by name + model.tensors["transformer.blocks." + std::to_string(i) + ".norm_1.weight"] = layer.norm_1_w; + model.tensors["transformer.blocks." + std::to_string(i) + ".norm_2.weight"] = layer.norm_2_w; + model.tensors["transformer.blocks." + std::to_string(i) + ".attn.Wqkv.weight"] = layer.attn_Wqkv_w; + model.tensors["transformer.blocks." + std::to_string(i) + ".attn.out_proj.weight"] = layer.attn_out_proj_w; + + model.tensors["transformer.blocks." 
+ std::to_string(i) + ".ffn.up_proj.weight"] = layer.ffn_up_proj_w; + model.tensors["transformer.blocks." + std::to_string(i) + ".ffn.down_proj.weight"] = layer.ffn_down_proj_w; + } + } + + // key + value memory + { + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + + const int n_mem = n_layer*n_ctx; + const int n_elements = n_embd*n_mem; + + if (!kv_cache_init(hparams, model.kv_self, GGML_TYPE_F16, model.hparams.n_ctx)) { + fprintf(stderr, "%s: kv_cache_init() failed for self-attention cache\n", __func__); + ggml_free(ctx); + return false; + } + + const size_t memory_size = ggml_nbytes(model.kv_self.k) + ggml_nbytes(model.kv_self.v); + printf("%s: kv self size = %7.2f MB\n", __func__, memory_size / 1024.0 / 1024.0); + } + + // load weights + { + int n_tensors = 0; + size_t total_size = 0; + + printf("%s: ", __func__); + + while (true) { + int32_t n_dims; + int32_t length; + int32_t ttype; + + fin.read(reinterpret_cast(&n_dims), sizeof(n_dims)); + fin.read(reinterpret_cast(&length), sizeof(length)); + fin.read(reinterpret_cast(&ttype), sizeof(ttype)); + + if (fin.eof()) { + break; + } + + int32_t nelements = 1; + int32_t ne[2] = { 1, 1 }; + for (int i = 0; i < n_dims; ++i) { + fin.read(reinterpret_cast(&ne[i]), sizeof(ne[i])); + nelements *= ne[i]; + } + + std::string name(length, 0); + fin.read(&name[0], length); + + if (model.tensors.find(name.data()) == model.tensors.end()) { + fprintf(stderr, "%s: unknown tensor '%s' in model file\n", __func__, name.data()); + return false; + } + + auto tensor = model.tensors[name.data()]; + if (ggml_nelements(tensor) != nelements) { + fprintf(stderr, "%s: tensor '%s' has wrong size in model file\n", __func__, name.data()); + return false; + } + + if (tensor->ne[0] != ne[0] || tensor->ne[1] != ne[1]) { + fprintf(stderr, "%s: tensor '%s' has wrong shape in model file: got [%d, %d], expected [%d, %d]\n", + __func__, 
name.data(), (int) tensor->ne[0], (int) tensor->ne[1], ne[0], ne[1]); + return false; + } + + // for debugging + if (0) { + printf("%24s - [%5d, %5d], type = %6s, %6.2f MB, %9zu bytes\n", name.data(), ne[0], ne[1], ggml_type_name(ggml_type(ttype)), ggml_nbytes(tensor)/1024.0/1024.0, ggml_nbytes(tensor)); + } + + const size_t bpe = ggml_type_size(ggml_type(ttype)); + + if ((nelements*bpe)/ggml_blck_size(tensor->type) != ggml_nbytes(tensor)) { + fprintf(stderr, "%s: tensor '%s' has wrong size in model file: got %zu, expected %zu\n", + __func__, name.data(), ggml_nbytes(tensor), nelements*bpe); + return false; + } + + fin.read(reinterpret_cast(tensor->data), ggml_nbytes(tensor)); + + //printf("%42s - [%5d, %5d], type = %6s, %6.2f MB\n", name.data(), ne[0], ne[1], ttype == 0 ? "float" : "f16", ggml_nbytes(tensor)/1024.0/1024.0); + total_size += ggml_nbytes(tensor); + if (++n_tensors % 8 == 0) { + printf("."); + fflush(stdout); + } + } + + printf(" done\n"); + + printf("%s: model size = %8.2f MB / num tensors = %d\n", __func__, total_size/1024.0/1024.0, n_tensors); + } + + return true; +} + +// load the model's weights from a file path +bool mpt_model_load(const std::string & fname, mpt_model & model, mpt_vocab & vocab) { + + auto fin = std::ifstream(fname, std::ios::binary); + if (!fin) { + fprintf(stderr, "%s: failed to open '%s'\n", __func__, fname.c_str()); + return false; + } + + bool loaded = mpt_model_load(fname, fin, model, vocab); + fin.close(); + return loaded; +} + +bool mpt_eval( + mpt_model & model, + const int n_threads, + const int n_past, + const std::vector & embd_inp, + std::vector & embd_w, + size_t & mem_per_token) { + const int N = embd_inp.size(); + + const auto & hparams = model.hparams; + + const int n_embd = hparams.n_embd; + const int n_layer = hparams.n_layer; + const int n_ctx = hparams.n_ctx; + const int n_head = hparams.n_head; + const int n_vocab = hparams.n_vocab; + const int expand = hparams.expand; + + const int d_key = n_embd/n_head; + 
+ static size_t buf_size = 256u*1024*1024; + static void * buf = malloc(buf_size); + + if (mem_per_token > 0 && mem_per_token*N > buf_size) { + const size_t buf_size_new = 1.1*(mem_per_token*N); // add 10% to account for ggml object overhead + //printf("\n%s: reallocating buffer from %zu to %zu bytes\n", __func__, buf_size, buf_size_new); + + // reallocate + buf_size = buf_size_new; + buf = realloc(buf, buf_size); + if (buf == nullptr) { + fprintf(stderr, "%s: failed to allocate %zu bytes\n", __func__, buf_size); + return false; + } + } + + struct ggml_init_params params = { + .mem_size = buf_size, + .mem_buffer = buf, + .no_alloc = false, + }; + + struct ggml_context * ctx0 = ggml_init(params); + struct ggml_cgraph gf = { .n_threads = n_threads }; + + struct ggml_tensor * embd = ggml_new_tensor_1d(ctx0, GGML_TYPE_I32, N); + memcpy(embd->data, embd_inp.data(), N*ggml_element_size(embd)); + + // wte + struct ggml_tensor * inpL = ggml_get_rows(ctx0, model.wte, embd); + + for (int il = 0; il < n_layer; ++il) { + + struct ggml_tensor * inpSA = inpL; + struct ggml_tensor * cur = inpSA; + // self-attention + { + + // norm1 + cur = ggml_norm(ctx0, cur); + cur = ggml_mul(ctx0, + ggml_repeat(ctx0, model.layers[il].norm_1_w, cur), + cur); + // compute QKV + cur = ggml_mul_mat(ctx0, + model.layers[il].attn_Wqkv_w, + cur); + + // TODO: clip_qkv + struct ggml_tensor * Qcur = ggml_cont(ctx0, ggml_view_2d(ctx0, cur, n_embd, N, cur->nb[1], 0*ggml_element_size(cur)*n_embd)); + struct ggml_tensor * Kcur = ggml_cont(ctx0, ggml_view_2d(ctx0, cur, n_embd, N, cur->nb[1], 1*ggml_element_size(cur)*n_embd)); + struct ggml_tensor * Vcur = ggml_cont(ctx0, ggml_view_2d(ctx0, cur, n_embd, N, cur->nb[1], 2*ggml_element_size(cur)*n_embd)); + + // TODO: qk_ln? 
(seems to be False in MPT-7B configs) + { + Vcur = ggml_transpose(ctx0, Vcur); + + struct ggml_tensor * k = ggml_view_1d(ctx0, model.kv_self.k, N*n_embd, (ggml_element_size(model.kv_self.k)*n_embd)*(il*n_ctx + n_past)); + struct ggml_tensor * v = ggml_view_2d(ctx0, model.kv_self.v, N, n_embd, + ( n_ctx)*ggml_element_size(model.kv_self.v), + (il*n_ctx)*ggml_element_size(model.kv_self.v)*n_embd + n_past*ggml_element_size(model.kv_self.v)); + + ggml_build_forward_expand(&gf, ggml_cpy(ctx0, Kcur, k)); + ggml_build_forward_expand(&gf, ggml_cpy(ctx0, Vcur, v)); + } + // Q = Qcur.contiguous().view(n_embd/n_head, n_head, N).permute(0, 2, 1, 3) + struct ggml_tensor * Q = + ggml_permute(ctx0, + ggml_reshape_3d(ctx0, Qcur, n_embd/n_head, n_head, N), + 0, 2, 1, 3); + + struct ggml_tensor * K = + ggml_permute(ctx0, + ggml_reshape_3d(ctx0, + ggml_view_1d(ctx0, model.kv_self.k, (n_past + N)*n_embd, il*n_ctx*ggml_element_size(model.kv_self.k)*n_embd), + n_embd/n_head, n_head, n_past + N), + 0, 2, 1, 3); + + // K * Q + struct ggml_tensor * KQ = ggml_mul_mat(ctx0, K, Q); + + // KQ_scaled = KQ / sqrt(n_embd/n_head) + struct ggml_tensor * KQ_scaled = + ggml_scale(ctx0, + KQ, + ggml_new_f32(ctx0, 1.0f/sqrt(float(n_embd)/n_head)) + ); + + + // Alibi + struct ggml_tensor * KQ_scaled_biased = ggml_alibi(ctx0, ggml_cont(ctx0, KQ_scaled), n_past, n_head); + + // KQ_masked = mask_past(KQ_scaled) + struct ggml_tensor * KQ_masked = ggml_diag_mask_inf(ctx0, KQ_scaled_biased, n_past); + + // KQ = soft_max(KQ_masked) + struct ggml_tensor * KQ_soft_max = ggml_soft_max(ctx0, KQ_masked); + + // V_trans = Vmem.view(n_embd/n_head, n_head, n_past + N).permute(1, 2, 0, 3).contiguous() + struct ggml_tensor * V = + ggml_view_3d(ctx0, model.kv_self.v, + n_past + N, n_embd/n_head, n_head, + n_ctx*ggml_element_size(model.kv_self.v), + n_ctx*ggml_element_size(model.kv_self.v)*n_embd/n_head, + il*n_ctx*ggml_element_size(model.kv_self.v)*n_embd); + + // KQV = transpose(V) * KQ_soft_max + struct ggml_tensor * 
KQV = ggml_mul_mat(ctx0, V, KQ_soft_max); + + // KQV_merged = KQV.permute(0, 2, 1, 3) + struct ggml_tensor * KQV_merged = ggml_permute(ctx0, KQV, 0, 2, 1, 3); + + // cur = KQV_merged.contiguous().view(n_embd, N) + cur = ggml_cpy(ctx0, + KQV_merged, + ggml_new_tensor_2d(ctx0, GGML_TYPE_F32, n_embd, N)); + + // projection (no bias) + cur = ggml_mul_mat(ctx0, + model.layers[il].attn_out_proj_w, + cur); + } + + + // residual + struct ggml_tensor * resSA = ggml_add(ctx0, cur, inpSA); + // feed-forward network + { + cur = resSA; + // norm2 + cur = ggml_norm(ctx0, cur); + cur = ggml_mul(ctx0, + ggml_repeat(ctx0, model.layers[il].norm_2_w, cur), + cur); + // ffn + cur = ggml_mul_mat(ctx0, + model.layers[il].ffn_up_proj_w, + cur); + cur = ggml_gelu(ctx0, cur); + cur = ggml_mul_mat(ctx0, + model.layers[il].ffn_down_proj_w, + cur); + + } + + // self-attention + FF + inpL = ggml_add(ctx0, cur, resSA); + } + + struct ggml_tensor * out = inpL; + // -> logits + { + out = ggml_norm(ctx0, out); + out = ggml_mul(ctx0, + ggml_repeat(ctx0, model.norm_f_w, out), + out); + out = ggml_mul_mat(ctx0, model.wte, out); + } + + + // run the computation + ggml_build_forward_expand(&gf, out); + ggml_graph_compute (ctx0, &gf); + + + // return result for just the last token + embd_w.resize(n_vocab); + memcpy(embd_w.data(), (float *) ggml_get_data(out) + (n_vocab*(N-1)), sizeof(float)*n_vocab); + + if (mem_per_token == 0) { + mem_per_token = ggml_used_mem(ctx0)/N; + } + //printf("used_mem = %zu\n", ggml_used_mem(ctx0)); + + ggml_free(ctx0); + + return true; +} + +std::vector mpt_tokenize_inner(const mpt_vocab & vocab, const std::string & text) { + // taken from stablelm example in ggml + // they both use the gpt-neox tokenizer + // not sure if this entirely right? 
+ std::vector words; + + + // first split the text into words + { + std::string str = text; + std::string pat = R"('s|'t|'re|'ve|'m|'ll|'d| ?[[:alpha:]]+| ?[[:digit:]]+| ?[^\s[:alpha:][:digit:]]+|\s+(?!\S)|\s+)"; + std::regex re(pat); + std::smatch m; + + while (std::regex_search(str, m, re)) { + for (auto x : m) { + words.push_back(x); + } + str = m.suffix(); + } + } + + // find the longest tokens that form the words: + std::vector tokens; + for (const auto & word : words) { + if (word.size() == 0) continue; + + int i = 0; + int n = word.size(); + while (i < n) { + int j = n; + while (j > i) { + auto it = vocab.token_to_id.find(word.substr(i, j-i)); + if (it != vocab.token_to_id.end()) { + tokens.push_back(it->second); + i = j; + break; + } + --j; + } + if (i == n) { + break; + } + if (j == i) { + auto sub = word.substr(i, 1); + if (vocab.token_to_id.find(sub) != vocab.token_to_id.end()) { + tokens.push_back(vocab.token_to_id.at(sub)); + } else { + fprintf(stderr, "%s: unknown token '%s'\n", __func__, sub.data()); + } + ++i; + } + } + } + + return tokens; +} + +std::vector mpt_tokenize(const mpt_vocab & vocab, const std::string & text) { + // Generate the subpattern from the special_tokens vector if it's not empty + if (!vocab.special_tokens.empty()) { + std::vector out; + std::vector chunks; + std::string str = text; + std::string special_tokens_subpattern; + for (const auto &token : vocab.special_tokens) { + if (!special_tokens_subpattern.empty()) { + special_tokens_subpattern += "|"; + } + special_tokens_subpattern += regex_escape(token); + } + std::regex re(special_tokens_subpattern); + std::smatch m; + while (std::regex_search(str, m, re)) { + auto tok = vocab.token_to_id.find(m.str()); + if (tok != vocab.token_to_id.end()) { + auto tokid = tok->second; + auto pfxtoks = mpt_tokenize_inner(vocab, m.prefix()); + out.insert(out.end(), pfxtoks.begin(), pfxtoks.end()); + out.push_back(tokid); + str = m.suffix(); + } + } + if (!str.empty()) { + auto tokrest = 
mpt_tokenize_inner(vocab, str); + out.insert(out.end(), tokrest.begin(), tokrest.end()); + } + return out; + } else { + return mpt_tokenize_inner(vocab, text); + } +} + +#define MPT_MAX_RNG_STATE 64*1024 + +size_t mpt_get_state_size(const mpt_model &model) +{ + // we don't know size of rng until we actually serialize it. so reserve more than enough memory for its serialized state. + // for reference, std::mt19937(1337) serializes to 6701 bytes. + const size_t s_rng_size = sizeof(size_t); + const size_t s_rng = MPT_MAX_RNG_STATE; + const size_t s_kv_size = sizeof(size_t); + const size_t s_kv_ntok = sizeof(int); + const size_t s_kv = model.kv_self.buf.size; + const size_t s_total = ( + + s_rng_size + + s_rng + + s_kv_size + + s_kv_ntok + + s_kv + ); + fflush(stdout); + return s_total; +} + +size_t mpt_copy_state_data(const mpt_model &model, const std::mt19937 &rng, uint8_t *dest) +{ + uint8_t * out = dest; + fflush(stdout); + // copy rng + { + std::stringstream rng_ss; + rng_ss << rng; + + const size_t rng_size = rng_ss.str().size(); + char rng_buf[MPT_MAX_RNG_STATE]; + + memset(&rng_buf[0], 0, MPT_MAX_RNG_STATE); + memcpy(&rng_buf[0], rng_ss.str().data(), rng_ss.str().size()); + + memcpy(out, &rng_size, sizeof(rng_size)); out += sizeof(rng_size); + memcpy(out, &rng_buf[0], MPT_MAX_RNG_STATE); out += MPT_MAX_RNG_STATE; + } + + // copy kv cache + { + const size_t kv_size = model.kv_self.buf.size; + const int kv_ntok = model.kv_self.n; + + memcpy(out, &kv_size, sizeof(kv_size)); out += sizeof(kv_size); + memcpy(out, &kv_ntok, sizeof(kv_ntok)); out += sizeof(kv_ntok); + + if (kv_size) { + memcpy(out, model.kv_self.buf.addr, kv_size); out += kv_size; + } + } + + const size_t written = out - dest; + const size_t expected = mpt_get_state_size(model); + assert(written == expected); + fflush(stdout); + return written; +} + +mpt_vocab::id mpt_sample_top_k_top_p( + const mpt_vocab & vocab, + const size_t actualVocabSize, + const int32_t * last_n_tokens_data, + int 
last_n_tokens_size, + const std::vector logits, + int top_k, + double top_p, + double temp, + float repeat_penalty, + std::mt19937 & rng) { + int n_logits = actualVocabSize; + + const auto last_n_tokens = std::vector(last_n_tokens_data, last_n_tokens_data + last_n_tokens_size); + const auto * plogits = logits.data() + logits.size() - n_logits; + + std::vector> logits_id; + logits_id.reserve(n_logits); + + { + const float scale = 1.0f/temp; + for (int i = 0; i < n_logits; ++i) { + // repetition penalty from ctrl paper (https://arxiv.org/abs/1909.05858) + // credit https://github.com/facebookresearch/llama/compare/main...shawwn:llama:main + if (std::find(last_n_tokens.begin(), last_n_tokens.end(), i) != last_n_tokens.end()) { + // if score < 0 then repetition penalty has to multiplied to reduce the previous token probability + if (plogits[i] < 0.0f) { + logits_id.push_back(std::make_pair(plogits[i]*scale*repeat_penalty, i)); + } else { + logits_id.push_back(std::make_pair(plogits[i]*scale/repeat_penalty, i)); + } + } else { + logits_id.push_back(std::make_pair(plogits[i]*scale, i)); + } + } + } + + // find the top K tokens + std::partial_sort( + logits_id.begin(), + logits_id.begin() + top_k, logits_id.end(), + [](const std::pair & a, const std::pair & b) { + return a.first > b.first; + }); + + logits_id.resize(top_k); + + double maxl = -INFINITY; + for (const auto & kv : logits_id) { + maxl = std::max(maxl, kv.first); + } + + // compute probs for the top K tokens + std::vector probs; + probs.reserve(logits_id.size()); + + double sum = 0.0; + for (const auto & kv : logits_id) { + double p = exp(kv.first - maxl); + probs.push_back(p); + sum += p; + } + + // normalize the probs + for (auto & p : probs) { + p /= sum; + } + + if (top_p < 1.0f) { + double cumsum = 0.0f; + for (int i = 0; i < top_k; i++) { + cumsum += probs[i]; + if (cumsum >= top_p) { + top_k = i + 1; + probs.resize(top_k); + logits_id.resize(top_k); + break; + } + } + + cumsum = 1.0/cumsum; + for (int i 
= 0; i < (int) probs.size(); i++) { + probs[i] *= cumsum; + } + } + + //printf("\n"); + //for (int i = 0; i < (int) probs.size(); i++) { + // printf("%d: '%s' %f\n", i, vocab.id_to_token.at(logits_id[i].second).c_str(), probs[i]); + //} + //exit(0); + + std::discrete_distribution<> dist(probs.begin(), probs.end()); + int idx = dist(rng); + + return logits_id[idx].second; +} + +size_t mpt_set_state_data(mpt_model *model, std::mt19937 *rng, const uint8_t *src) +{ + const uint8_t * in = src; + + // set rng + { + size_t rng_size; + char rng_buf[MPT_MAX_RNG_STATE]; + + memcpy(&rng_size, in, sizeof(rng_size)); in += sizeof(rng_size); + memcpy(&rng_buf[0], in, MPT_MAX_RNG_STATE); in += MPT_MAX_RNG_STATE; + + std::stringstream rng_ss; + rng_ss.str(std::string(&rng_buf[0], rng_size)); + rng_ss >> *rng; + + assert(rng_ss.fail() == false); + } + + // set kv cache + { + size_t kv_size; + int kv_ntok; + + memcpy(&kv_size, in, sizeof(kv_size)); in += sizeof(kv_size); + memcpy(&kv_ntok, in, sizeof(kv_ntok)); in += sizeof(kv_ntok); + + if (kv_size) { + assert(model->kv_self.buf.size == kv_size); + + void * k_data = model->kv_self.k->data; // remember data pointers + void * v_data = model->kv_self.v->data; // because their value is stored in buf and overwritten by memcpy + + memcpy(model->kv_self.buf.addr, in, kv_size); in += kv_size; + + model->kv_self.k->data = k_data; // restore correct data pointers + model->kv_self.v->data = v_data; + + } + + model->kv_self.n = kv_ntok; + } + + const size_t nread = in - src; + const size_t expected = mpt_get_state_size(*model); + assert(nread == expected); + fflush(stdout); + return nread; +} + +struct MPTPrivate { + const std::string modelPath; + bool modelLoaded; + mpt_vocab vocab; + mpt_model *model = nullptr; + int64_t n_threads = 0; + size_t mem_per_token = 0; + std::mt19937 rng; + bool has_im_end = false; +}; + +MPT::MPT() + : d_ptr(new MPTPrivate) { + + d_ptr->model = new mpt_model; + d_ptr->modelLoaded = false; +} + +bool 
MPT::loadModel(const std::string &modelPath) { + std::mt19937 rng(time(NULL)); + d_ptr->rng = rng; + + auto fin = std::ifstream(modelPath, std::ios::binary); + + // load the model + if (!mpt_model_load(modelPath, fin, *d_ptr->model, d_ptr->vocab)) { + std::cerr << "GPT-J ERROR: failed to load model from " << modelPath; + return false; + } + + d_ptr->n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency()); + d_ptr->modelLoaded = true; + d_ptr->has_im_end = d_ptr->vocab.token_to_id.find("<|im_end|>") != d_ptr->vocab.token_to_id.end(); + fflush(stdout); + return true; +} + +void MPT::setThreadCount(int32_t n_threads) { + d_ptr->n_threads = n_threads; +} + +int32_t MPT::threadCount() { + return d_ptr->n_threads; +} + +MPT::~MPT() +{ + delete d_ptr->model; +} + +bool MPT::isModelLoaded() const +{ + return d_ptr->modelLoaded; +} + +size_t MPT::stateSize() const +{ + return mpt_get_state_size(*d_ptr->model); +} + +size_t MPT::saveState(uint8_t *dest) const +{ + return mpt_copy_state_data(*d_ptr->model, d_ptr->rng, dest); +} + +size_t MPT::restoreState(const uint8_t *src) +{ + return mpt_set_state_data(d_ptr->model, &d_ptr->rng, src); +} + +void MPT::prompt(const std::string &prompt, + std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &promptCtx) { + + if (!isModelLoaded()) { + std::cerr << "GPT-J ERROR: prompt won't work with an unloaded model!\n"; + return; + } + + const int64_t t_main_start_us = ggml_time_us(); + + int64_t t_sample_us = 0; + int64_t t_predict_us = 0; + int64_t t_prompt_us = 0; + + // tokenize the prompt + std::vector embd_inp = mpt_tokenize(d_ptr->vocab, prompt); + + // save the context size + promptCtx.n_ctx = d_ptr->model->hparams.n_ctx; + + if ((int) embd_inp.size() > promptCtx.n_ctx - 4) { + responseCallback(-1, "ERROR: The prompt size exceeds the context window size and cannot be processed."); + std::cerr << "GPT-J ERROR: The prompt is" << embd_inp.size() << + "tokens 
and the context window is" << promptCtx.n_ctx << "!\n"; + return; + } + + promptCtx.n_predict = std::min(promptCtx.n_predict, promptCtx.n_ctx - (int) embd_inp.size()); + promptCtx.n_past = std::min(promptCtx.n_past, promptCtx.n_ctx); + + // determine the required inference memory per token: + static bool initialized = false; + static std::vector p_instruct; + static std::vector r_instruct; + if (!initialized) { + mpt_eval(*d_ptr->model, d_ptr->n_threads, 0, { 0, 1, 2, 3 }, promptCtx.logits, + d_ptr->mem_per_token); + initialized = true; + } + + // process the prompt in batches + size_t i = 0; + const int64_t t_start_prompt_us = ggml_time_us(); + while (i < embd_inp.size()) { + size_t batch_end = std::min(i + promptCtx.n_batch, embd_inp.size()); + std::vector batch(embd_inp.begin() + i, embd_inp.begin() + batch_end); + + // Check if the context has run out... + if (promptCtx.n_past + batch.size() > promptCtx.n_ctx) { + const int32_t erasePoint = promptCtx.n_ctx * promptCtx.contextErase; + // Erase the first percentage of context from the tokens... 
+ std::cerr << "MPT: reached the end of the context window so resizing\n"; + promptCtx.tokens.erase(promptCtx.tokens.begin(), promptCtx.tokens.begin() + erasePoint); + promptCtx.n_past = promptCtx.tokens.size(); + recalculateContext(promptCtx, recalculateCallback); + assert(promptCtx.n_past + batch.size() <= promptCtx.n_ctx); + } + + if (!mpt_eval(*d_ptr->model, d_ptr->n_threads, promptCtx.n_past, batch, promptCtx.logits, + d_ptr->mem_per_token)) { + std::cerr << "GPT-J ERROR: Failed to process prompt\n"; + return; + } + + size_t tokens = batch_end - i; + for (size_t t = 0; t < tokens; ++t) { + if (promptCtx.tokens.size() == promptCtx.n_ctx) + promptCtx.tokens.erase(promptCtx.tokens.begin()); + promptCtx.tokens.push_back(batch.at(t)); + if (!promptCallback(batch.at(t))) + return; + } + promptCtx.n_past += batch.size(); + i = batch_end; + } + t_prompt_us += ggml_time_us() - t_start_prompt_us; + + int p_instructFound = 0; + int r_instructFound = 0; + + std::string cachedResponse; + std::vector cachedTokens; + std::unordered_set reversePrompts + = { "### Instruction", "### Prompt", "### Response", "### Human", "### Assistant" }; + + // predict next tokens + int32_t totalPredictions = 0; + for (int i = 0; i < promptCtx.n_predict; i++) { + + // sample next token + const int n_vocab = d_ptr->model->hparams.n_vocab; + int id = 0; + { + const int64_t t_start_sample_us = ggml_time_us(); + id = mpt_sample_top_k_top_p(d_ptr->vocab, n_vocab, + promptCtx.tokens.data() + promptCtx.n_ctx - promptCtx.n_ctx, + promptCtx.n_ctx, + promptCtx.logits, + promptCtx.top_k, promptCtx.top_p, promptCtx.temp, + promptCtx.repeat_penalty, + d_ptr->rng); + + t_sample_us += ggml_time_us() - t_start_sample_us; + } + + // Check if the context has run out... + if (promptCtx.n_past + 1 > promptCtx.n_ctx) { + const int32_t erasePoint = promptCtx.n_ctx * promptCtx.contextErase; + // Erase the first percentage of context from the tokens... 
+ std::cerr << "MPT: reached the end of the context window so resizing\n"; + promptCtx.tokens.erase(promptCtx.tokens.begin(), promptCtx.tokens.begin() + erasePoint); + promptCtx.n_past = promptCtx.tokens.size(); + recalculateContext(promptCtx, recalculateCallback); + assert(promptCtx.n_past + 1 <= promptCtx.n_ctx); + } + + const int64_t t_start_predict_us = ggml_time_us(); + if (!mpt_eval(*d_ptr->model, d_ptr->n_threads, promptCtx.n_past, { id }, promptCtx.logits, + d_ptr->mem_per_token)) { + std::cerr << "GPT-J ERROR: Failed to predict next token\n"; + return; + } + t_predict_us += ggml_time_us() - t_start_predict_us; + + promptCtx.n_past += 1; + // display text + ++totalPredictions; + + // mpt-7b-chat has special token for end + if (d_ptr->has_im_end && id == d_ptr->vocab.token_to_id["<|im_end|>"]) + goto stop_generating; + + if (id == 0 /*end of text*/) + goto stop_generating; + + const std::string str = d_ptr->vocab.id_to_token[id]; + + // Check if the provided str is part of our reverse prompts + bool foundPartialReversePrompt = false; + const std::string completed = cachedResponse + str; + if (reversePrompts.find(completed) != reversePrompts.end()) { + goto stop_generating; + } + + // Check if it partially matches our reverse prompts and if so, cache + for (auto s : reversePrompts) { + if (s.compare(0, completed.size(), completed) == 0) { + foundPartialReversePrompt = true; + cachedResponse = completed; + break; + } + } + + // Regardless the token gets added to our cache + cachedTokens.push_back(id); + + // Continue if we have found a partial match + if (foundPartialReversePrompt) + continue; + + // Empty the cache + for (auto t : cachedTokens) { + if (promptCtx.tokens.size() == promptCtx.n_ctx) + promptCtx.tokens.erase(promptCtx.tokens.begin()); + promptCtx.tokens.push_back(t); + if (!responseCallback(t, d_ptr->vocab.id_to_token[t])) + goto stop_generating; + } + cachedTokens.clear(); + } + +stop_generating: + +#if 0 + // report timing + { + const int64_t 
t_main_end_us = ggml_time_us(); + + std::cout << "GPT-J INFO: mem per token = " << mem_per_token << " bytes\n"; + std::cout << "GPT-J INFO: sample time = " << t_sample_us/1000.0f << " ms\n"; + std::cout << "GPT-J INFO: prompt time = " << t_prompt_us/1000.0f << " ms\n"; + std::cout << "GPT-J INFO: predict time = " << t_predict_us/1000.0f << " ms / " << t_predict_us/1000.0f/totalPredictions << " ms per token\n"; + std::cout << "GPT-J INFO: total time = " << (t_main_end_us - t_main_start_us)/1000.0f << " ms\n"; + fflush(stdout); + } +#endif + + return; +} + +void MPT::recalculateContext(PromptContext &promptCtx, std::function recalculate) +{ + size_t i = 0; + promptCtx.n_past = 0; + while (i < promptCtx.tokens.size()) { + size_t batch_end = std::min(i + promptCtx.n_batch, promptCtx.tokens.size()); + std::vector batch(promptCtx.tokens.begin() + i, promptCtx.tokens.begin() + batch_end); + + assert(promptCtx.n_past + batch.size() <= promptCtx.n_ctx); + + if (!mpt_eval(*d_ptr->model, d_ptr->n_threads, promptCtx.n_past, batch, promptCtx.logits, + d_ptr->mem_per_token)) { + std::cerr << "MPT ERROR: Failed to process prompt\n"; + goto stop_generating; + } + promptCtx.n_past += batch.size(); + if (!recalculate(true)) + goto stop_generating; + i = batch_end; + } + assert(promptCtx.n_past == promptCtx.tokens.size()); + +stop_generating: + recalculate(false); +} diff --git a/gpt4all-chat/llmodel/mpt.h b/gpt4all-chat/llmodel/mpt.h new file mode 100644 index 00000000..9e693f6a --- /dev/null +++ b/gpt4all-chat/llmodel/mpt.h @@ -0,0 +1,36 @@ +#ifndef MPT_H +#define MPT_H + +#include +#include +#include +#include "llmodel.h" + +class MPTPrivate; +class MPT : public LLModel { +public: + MPT(); + ~MPT(); + + bool loadModel(const std::string &modelPath) override; + bool isModelLoaded() const override; + size_t stateSize() const override; + size_t saveState(uint8_t *dest) const override; + size_t restoreState(const uint8_t *src) override; + void prompt(const std::string &prompt, + 
std::function promptCallback, + std::function responseCallback, + std::function recalculateCallback, + PromptContext &ctx) override; + void setThreadCount(int32_t n_threads) override; + int32_t threadCount() override; + +protected: + void recalculateContext(PromptContext &promptCtx, + std::function recalculate) override; + +private: + MPTPrivate *d_ptr; +}; + +#endif // MPT_H diff --git a/gpt4all-chat/llmodel/scripts/convert_mpt_hf_to_ggml.py b/gpt4all-chat/llmodel/scripts/convert_mpt_hf_to_ggml.py new file mode 100644 index 00000000..981432fc --- /dev/null +++ b/gpt4all-chat/llmodel/scripts/convert_mpt_hf_to_ggml.py @@ -0,0 +1,175 @@ +# Convert Hugging Face fine-tuned MPT models to ggml format +# +# Usage: +# +# python3 scripts/convert_mpt_hf_to_ggml.py model_name dir-output [use-f32] +# +# This script is similar to "convert-pt-to-ggml.py" +# + +import io +import os +import sys +import struct +import json +import code +import torch +import numpy as np + +from transformers import AutoTokenizer, AutoModelForCausalLM, AutoConfig, BloomForCausalLM + +# ref: https://github.com/openai/gpt-2/blob/master/src/encoder.py +def bytes_to_unicode(): + """ + Returns list of utf-8 byte and a corresponding list of unicode strings. + The reversible bpe codes work on unicode strings. + This means you need a large # of unicode characters in your vocab if you want to avoid UNKs. + When you're at something like a 10B token dataset you end up needing around 5K for decent coverage. + This is a significant percentage of your normal, say, 32K bpe vocab. + To avoid that, we want lookup tables between utf-8 bytes and unicode strings. + And avoids mapping to whitespace/control characters the bpe code barfs on. 
+ """ + bs = list(range(ord("!"), ord("~")+1))+list(range(ord("¡"), ord("¬")+1))+list(range(ord("®"), ord("ÿ")+1)) + cs = bs[:] + n = 0 + for b in range(2**8): + if b not in bs: + bs.append(b) + cs.append(2**8+n) + n += 1 + cs = [chr(n) for n in cs] + return dict(zip(bs, cs)) + +if len(sys.argv) < 3: + print("Usage: python convert-hf-to-ggml.py model_name dir-output [use-f32]") + print(" model_name: name of the model to convert. Example: 'bigscience/bloomz-560m'") + print(" dir-output: directory where the output file will be written") + print(" use-f32: if present, use float32 instead of float16") + sys.exit(1) + +model_name = sys.argv[1] +dir_out = sys.argv[2] + +# make sure the output directory exists +os.makedirs(dir_out, exist_ok=True) + +# possible data types +# ftype == 0 -> float32 +# ftype == 1 -> float16 +# +# map from ftype to string +ftype_str = ["f32", "f16"] +ftype = 1 +if len(sys.argv) > 3: + ftype = 0 + +tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True) +config = AutoConfig.from_pretrained(model_name, trust_remote_code=True) +hparams = config.to_dict() +print("Loading model: ", model_name) +model = AutoModelForCausalLM.from_pretrained(model_name, trust_remote_code=True, config=config, torch_dtype=torch.float16 if ftype == 1 else torch.float32, low_cpu_mem_usage=True) +print("Model loaded: ", model_name) + + +fname_out = dir_out + f"/ggml-model-{model_name.split('/')[-1]}-{ftype_str[ftype]}.bin" +fout = open(fname_out, "wb") +vocab = tokenizer.vocab + +hparams["multiple_of"] = 1 +fout.write(struct.pack("i", 0x67676d6d)) # magic: ggml in hex +fout.write(struct.pack("i", hparams["vocab_size"])) +fout.write(struct.pack("i", hparams["max_seq_len"])) +fout.write(struct.pack("i", hparams["d_model"])) +fout.write(struct.pack("i", hparams["n_heads"])) +fout.write(struct.pack("i", hparams["n_layers"])) +# n_rot (unused) +fout.write(struct.pack("i", 0)) +fout.write(struct.pack("i", ftype)) + +# # Is this correct?? 
+# dot_token = tokenizer.encode(".")[0] +# write tokens to ggml file +fout.write(struct.pack("i", hparams["vocab_size"])) + +for i in range(hparams["vocab_size"]): + text = tokenizer.decode([i]).encode('utf-8') + fout.write(struct.pack("i", len(text))) + fout.write(text) + +list_vars = model.state_dict() +for name in list_vars.keys(): + data = list_vars[name].squeeze().numpy() + print("Processing variable: " + name + " with shape: ", data.shape) + + # we don't need these + if name.endswith("attn.masked_bias") or name.endswith(".attn.bias"): + print(" Skipping variable: " + name) + continue + + if "Wqkv.weight" in name: + # chunk qkv + query, key, value = np.split(data, 3, axis=0) + + new_name = name.split("Wqkv.weight")[0] + + for (data, name) in [(query, new_name + "q_proj.weight"), (key, new_name + "k_proj.weight"), (value, new_name + "v_proj.weight")]: + print(f"Processing variable: {name} with shape: {data.shape}") + n_dims = len(data.shape); + + # ftype == 0 -> float32, ftype == 1 -> float16 + ftype_cur = 0; + if ftype != 0: + print(" Converting to float16") + data = data.astype(np.float16) + ftype_cur = 1 + else: + if data.dtype != np.float32: + print(" Converting to float32") + data = data.astype(np.float32) + ftype_cur = 0 + + # header + str = name.encode('utf-8') + fout.write(struct.pack("iii", n_dims, len(str), ftype_cur)) + for i in range(n_dims): + fout.write(struct.pack("i", data.shape[n_dims - 1 - i])) + fout.write(str); + + # data + data.tofile(fout) + + else: + + n_dims = len(data.shape); + + # ftype == 0 -> float32, ftype == 1 -> float16 + ftype_cur = 0; + if ftype != 0: + if name[-7:] == ".weight" and n_dims == 2: + print(" Converting to float16") + data = data.astype(np.float16) + ftype_cur = 1 + else: + print(" Converting to float32") + data = data.astype(np.float32) + ftype_cur = 0 + else: + if data.dtype != np.float32: + print(" Converting to float32") + data = data.astype(np.float32) + ftype_cur = 0 + + # header + str = name.encode('utf-8') + 
fout.write(struct.pack("iii", n_dims, len(str), ftype_cur)) + for i in range(n_dims): + fout.write(struct.pack("i", data.shape[n_dims - 1 - i])) + fout.write(str); + + # data + data.tofile(fout) + +fout.close() + +print("Done. Output file: " + fname_out) +print("") \ No newline at end of file diff --git a/gpt4all-chat/llmodel/utils.cpp b/gpt4all-chat/llmodel/utils.cpp new file mode 100644 index 00000000..b9b653f5 --- /dev/null +++ b/gpt4all-chat/llmodel/utils.cpp @@ -0,0 +1,274 @@ +#include "utils.h" + +#include +#include + +void replace(std::string & str, const std::string & needle, const std::string & replacement) { + size_t pos = 0; + while ((pos = str.find(needle, pos)) != std::string::npos) { + str.replace(pos, needle.length(), replacement); + pos += replacement.length(); + } +} + +std::map json_parse(const std::string & fname) { + std::map result; + + // read file into string + std::string json; + { + std::ifstream ifs(fname); + if (!ifs) { + fprintf(stderr, "Failed to open %s\n", fname.c_str()); + exit(1); + } + + json = std::string((std::istreambuf_iterator(ifs)), + (std::istreambuf_iterator())); + } + + if (json[0] != '{') { + return result; + } + + // parse json + { + bool has_key = false; + bool in_token = false; + + std::string str_key = ""; + std::string str_val = ""; + + int n = json.size(); + for (int i = 1; i < n; ++i) { + if (!in_token) { + if (json[i] == ' ') continue; + if (json[i] == '"') { + in_token = true; + continue; + } + } else { + if (json[i] == '\\' && i+1 < n) { + if (has_key == false) { + str_key += json[i]; + } else { + str_val += json[i]; + } + ++i; + } else if (json[i] == '"') { + if (has_key == false) { + has_key = true; + ++i; + while (json[i] == ' ') ++i; + ++i; // : + while (json[i] == ' ') ++i; + if (json[i] != '\"') { + while (json[i] != ',' && json[i] != '}') { + str_val += json[i++]; + } + has_key = false; + } else { + in_token = true; + continue; + } + } else { + has_key = false; + } + + ::replace(str_key, "\\u0120", " " ); 
// \u0120 -> space + ::replace(str_key, "\\u010a", "\n"); // \u010a -> new line + ::replace(str_key, "\\\"", "\""); // \\\" -> " + + try { + result[str_key] = std::stoi(str_val); + } catch (...) { + //fprintf(stderr, "%s: ignoring key '%s' with value '%s'\n", fname.c_str(), str_key.c_str(), str_val.c_str()); + + } + str_key = ""; + str_val = ""; + in_token = false; + continue; + } + if (has_key == false) { + str_key += json[i]; + } else { + str_val += json[i]; + } + } + } + } + + return result; +} + +std::vector gpt_tokenize(const gpt_vocab & vocab, const std::string & text) { + std::vector words; + + // first split the text into words + { + std::string str = text; + std::string pat = R"('s|'t|'re|'ve|'m|'ll|'d| ?[[:alpha:]]+| ?[[:digit:]]+| ?[^\s[:alpha:][:digit:]]+|\s+(?!\S)|\s+)"; + + std::regex re(pat); + std::smatch m; + + while (std::regex_search(str, m, re)) { + for (auto x : m) { + words.push_back(x); + } + str = m.suffix(); + } + } + + // find the longest tokens that form the words: + std::vector tokens; + for (const auto & word : words) { + if (word.size() == 0) continue; + + int i = 0; + int n = word.size(); + while (i < n) { + int j = n; + while (j > i) { + auto it = vocab.token_to_id.find(word.substr(i, j-i)); + if (it != vocab.token_to_id.end()) { + tokens.push_back(it->second); + i = j; + break; + } + --j; + } + if (i == n) { + break; + } + if (j == i) { + auto sub = word.substr(i, 1); + if (vocab.token_to_id.find(sub) != vocab.token_to_id.end()) { + tokens.push_back(vocab.token_to_id.at(sub)); + } else { + fprintf(stderr, "%s: unknown token '%s'\n", __func__, sub.data()); + } + ++i; + } + } + } + + return tokens; +} + +bool gpt_vocab_init(const std::string & fname, gpt_vocab & vocab) { + printf("%s: loading vocab from '%s'\n", __func__, fname.c_str()); + + vocab.token_to_id = ::json_parse(fname); + + for (const auto & kv : vocab.token_to_id) { + vocab.id_to_token[kv.second] = kv.first; + } + + printf("%s: vocab size = %d\n", __func__, (int) 
vocab.token_to_id.size()); + + // print the vocabulary + //for (auto kv : vocab.token_to_id) { + // printf("'%s' -> %d\n", kv.first.data(), kv.second); + //} + + return true; +} + +gpt_vocab::id gpt_sample_top_k_top_p( + const gpt_vocab & vocab, + const int32_t * last_n_tokens_data, + int last_n_tokens_size, + const std::vector logits, + int top_k, + double top_p, + double temp, + float repeat_penalty, + std::mt19937 & rng) { + int n_logits = vocab.id_to_token.size(); + + const auto last_n_tokens = std::vector(last_n_tokens_data, last_n_tokens_data + last_n_tokens_size); + const auto * plogits = logits.data() + logits.size() - n_logits; + + std::vector> logits_id; + logits_id.reserve(n_logits); + + { + const float scale = 1.0f/temp; + for (int i = 0; i < n_logits; ++i) { + // repetition penalty from ctrl paper (https://arxiv.org/abs/1909.05858) + // credit https://github.com/facebookresearch/llama/compare/main...shawwn:llama:main + if (std::find(last_n_tokens.begin(), last_n_tokens.end(), i) != last_n_tokens.end()) { + // if score < 0 then repetition penalty has to multiplied to reduce the previous token probability + if (plogits[i] < 0.0f) { + logits_id.push_back(std::make_pair(plogits[i]*scale*repeat_penalty, i)); + } else { + logits_id.push_back(std::make_pair(plogits[i]*scale/repeat_penalty, i)); + } + } else { + logits_id.push_back(std::make_pair(plogits[i]*scale, i)); + } + } + } + + // find the top K tokens + std::partial_sort( + logits_id.begin(), + logits_id.begin() + top_k, logits_id.end(), + [](const std::pair & a, const std::pair & b) { + return a.first > b.first; + }); + + logits_id.resize(top_k); + + double maxl = -INFINITY; + for (const auto & kv : logits_id) { + maxl = std::max(maxl, kv.first); + } + + // compute probs for the top K tokens + std::vector probs; + probs.reserve(logits_id.size()); + + double sum = 0.0; + for (const auto & kv : logits_id) { + double p = exp(kv.first - maxl); + probs.push_back(p); + sum += p; + } + + // normalize the 
probs + for (auto & p : probs) { + p /= sum; + } + + if (top_p < 1.0f) { + double cumsum = 0.0f; + for (int i = 0; i < top_k; i++) { + cumsum += probs[i]; + if (cumsum >= top_p) { + top_k = i + 1; + probs.resize(top_k); + logits_id.resize(top_k); + break; + } + } + + cumsum = 1.0/cumsum; + for (int i = 0; i < (int) probs.size(); i++) { + probs[i] *= cumsum; + } + } + + //printf("\n"); + //for (int i = 0; i < (int) probs.size(); i++) { + // printf("%d: '%s' %f\n", i, vocab.id_to_token.at(logits_id[i].second).c_str(), probs[i]); + //} + //exit(0); + + std::discrete_distribution<> dist(probs.begin(), probs.end()); + int idx = dist(rng); + + return logits_id[idx].second; +} diff --git a/gpt4all-chat/llmodel/utils.h b/gpt4all-chat/llmodel/utils.h new file mode 100644 index 00000000..90cfdd97 --- /dev/null +++ b/gpt4all-chat/llmodel/utils.h @@ -0,0 +1,85 @@ +// Various helper functions and utilities + +#pragma once + +#include +#include +#include +#include +#include + +// +// CLI argument parsing +// + +struct gpt_params { + int32_t seed = -1; // RNG seed + int32_t n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency()); + int32_t n_predict = 200; // new tokens to predict + + // sampling parameters + int32_t top_k = 40; + float top_p = 0.9f; + float temp = 0.9f; + + int32_t n_batch = 8; // batch size for prompt processing + + std::string model = "models/gpt-2-117M/ggml-model.bin"; // model path + std::string prompt; +}; + +bool gpt_params_parse(int argc, char ** argv, gpt_params & params); + +void gpt_print_usage(int argc, char ** argv, const gpt_params & params); + +std::string gpt_random_prompt(std::mt19937 & rng); + +// +// Vocab utils +// + +struct gpt_vocab { + using id = int32_t; + using token = std::string; + + std::map token_to_id; + std::map id_to_token; +}; + +void replace(std::string & str, const std::string & needle, const std::string & replacement); + +// poor-man's JSON parsing +std::map json_parse(const std::string & fname); + +// split text 
into tokens +// +// ref: https://github.com/openai/gpt-2/blob/a74da5d99abaaba920de8131d64da2862a8f213b/src/encoder.py#L53 +// +// Regex (Python): +// r"""'s|'t|'re|'ve|'m|'ll|'d| ?\p{L}+| ?\p{N}+| ?[^\s\p{L}\p{N}]+|\s+(?!\S)|\s+""" +// +// Regex (C++): +// R"('s|'t|'re|'ve|'m|'ll|'d| ?[[:alpha:]]+| ?[[:digit:]]+| ?[^\s[:alpha:][:digit:]]+|\s+(?!\S)|\s+)" +// +std::vector gpt_tokenize(const gpt_vocab & vocab, const std::string & text); + +// load the tokens from encoder.json +bool gpt_vocab_init(const std::string & fname, gpt_vocab & vocab); + +// sample next token given probabilities for each embedding +// +// - consider only the top K tokens +// - from them, consider only the top tokens with cumulative probability > P +// +// TODO: not sure if this implementation is correct +// +gpt_vocab::id gpt_sample_top_k_top_p( + const gpt_vocab & vocab, + const int32_t * last_n_tokens_data, + int last_n_tokens_size, + const std::vector logits, + int top_k, + double top_p, + double temp, + float repeat_penalty, + std::mt19937 & rng); diff --git a/gpt4all-chat/main.cpp b/gpt4all-chat/main.cpp new file mode 100644 index 00000000..aece4026 --- /dev/null +++ b/gpt4all-chat/main.cpp @@ -0,0 +1,43 @@ +#include +#include +#include + +#include +#include + +#include "llm.h" +#include "download.h" +#include "network.h" +#include "config.h" + +int main(int argc, char *argv[]) +{ + QCoreApplication::setOrganizationName("nomic.ai"); + QCoreApplication::setOrganizationDomain("gpt4all.io"); + QCoreApplication::setApplicationName("GPT4All"); + QCoreApplication::setApplicationVersion(APP_VERSION); + QSettings::setDefaultFormat(QSettings::IniFormat); + + QGuiApplication app(argc, argv); + QQmlApplicationEngine engine; + qmlRegisterSingletonInstance("llm", 1, 0, "LLM", LLM::globalInstance()); + qmlRegisterSingletonInstance("download", 1, 0, "Download", Download::globalInstance()); + qmlRegisterSingletonInstance("network", 1, 0, "Network", Network::globalInstance()); + const QUrl 
url(u"qrc:/gpt4all/main.qml"_qs); + + QObject::connect(&engine, &QQmlApplicationEngine::objectCreated, + &app, [url](QObject *obj, const QUrl &objUrl) { + if (!obj && url == objUrl) + QCoreApplication::exit(-1); + }, Qt::QueuedConnection); + engine.load(url); + +#if 0 + QDirIterator it("qrc:", QDirIterator::Subdirectories); + while (it.hasNext()) { + qDebug() << it.next(); + } +#endif + + return app.exec(); +} diff --git a/gpt4all-chat/main.qml b/gpt4all-chat/main.qml new file mode 100644 index 00000000..6ab92df0 --- /dev/null +++ b/gpt4all-chat/main.qml @@ -0,0 +1,894 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import llm +import download +import network + +Window { + id: window + width: 1280 + height: 720 + visible: true + title: qsTr("GPT4All v") + Qt.application.version + + Theme { + id: theme + } + + property var currentChat: LLM.chatListModel.currentChat + property var chatModel: currentChat.chatModel + + color: theme.textColor + + // Startup code + Component.onCompleted: { + if (!LLM.compatHardware) { + Network.sendNonCompatHardware(); + errorCompatHardware.open(); + } else + startupDialogs(); + } + + Connections { + target: firstStartDialog + function onClosed() { + startupDialogs(); + } + } + + Connections { + target: downloadNewModels + function onClosed() { + startupDialogs(); + } + } + + Connections { + target: Download + function onHasNewerReleaseChanged() { + startupDialogs(); + } + } + + Connections { + target: currentChat + function onResponseInProgressChanged() { + if (Network.isActive && !currentChat.responseInProgress) + Network.sendConversation(currentChat.id, getConversationJson()); + } + } + + function startupDialogs() { + // check for first time start of this version + if (Download.isFirstStart()) { + firstStartDialog.open(); + return; + } + + // check for any current models and if not, open download dialog + if (currentChat.modelList.length === 0 && 
!firstStartDialog.opened) { + downloadNewModels.open(); + return; + } + + // check for new version + if (Download.hasNewerRelease && !firstStartDialog.opened && !downloadNewModels.opened) { + newVersionDialog.open(); + return; + } + } + + PopupDialog { + id: errorCompatHardware + anchors.centerIn: parent + shouldTimeOut: false + shouldShowBusy: false + closePolicy: Popup.NoAutoClose + modal: true + text: qsTr("Incompatible hardware detected. Please try the avx-only installer on https://gpt4all.io") + } + + StartupDialog { + id: firstStartDialog + anchors.centerIn: parent + } + + NewVersionDialog { + id: newVersionDialog + anchors.centerIn: parent + } + + AboutDialog { + id: aboutDialog + anchors.centerIn: parent + } + + Item { + Accessible.role: Accessible.Window + Accessible.name: title + } + + Rectangle { + id: header + anchors.left: parent.left + anchors.right: parent.right + anchors.top: parent.top + height: 100 + color: theme.backgroundDarkest + + Item { + anchors.centerIn: parent + height: childrenRect.height + visible: currentChat.isModelLoaded + + Label { + id: modelLabel + color: theme.textColor + padding: 20 + font.pixelSize: theme.fontSizeLarger + text: "" + background: Rectangle { + color: theme.backgroundDarkest + } + horizontalAlignment: TextInput.AlignRight + } + + ComboBox { + id: comboBox + width: 350 + anchors.top: modelLabel.top + anchors.bottom: modelLabel.bottom + anchors.horizontalCenter: parent.horizontalCenter + font.pixelSize: theme.fontSizeLarge + spacing: 0 + model: currentChat.modelList + Accessible.role: Accessible.ComboBox + Accessible.name: qsTr("ComboBox for displaying/picking the current model") + Accessible.description: qsTr("Use this for picking the current model to use; the first item is the current model") + contentItem: Text { + anchors.horizontalCenter: parent.horizontalCenter + leftPadding: 10 + rightPadding: 10 + text: comboBox.displayText + font: comboBox.font + color: theme.textColor + verticalAlignment: Text.AlignVCenter 
+ horizontalAlignment: Text.AlignHCenter + elide: Text.ElideRight + } + delegate: ItemDelegate { + width: comboBox.width + contentItem: Text { + text: modelData + color: theme.textColor + font: comboBox.font + elide: Text.ElideRight + verticalAlignment: Text.AlignVCenter + } + background: Rectangle { + color: highlighted ? theme.backgroundLight : theme.backgroundDark + } + highlighted: comboBox.highlightedIndex === index + } + popup: Popup { + y: comboBox.height - 1 + width: comboBox.width + implicitHeight: contentItem.implicitHeight + padding: 0 + + contentItem: ListView { + clip: true + implicitHeight: contentHeight + model: comboBox.popup.visible ? comboBox.delegateModel : null + currentIndex: comboBox.highlightedIndex + ScrollIndicator.vertical: ScrollIndicator { } + } + + background: Rectangle { + color: theme.backgroundDark + } + } + + background: Rectangle { + color: theme.backgroundDark + } + + onActivated: { + currentChat.stopGenerating() + currentChat.reset(); + currentChat.modelName = comboBox.currentText + } + } + } + + BusyIndicator { + anchors.centerIn: parent + visible: !currentChat.isModelLoaded + running: !currentChat.isModelLoaded + Accessible.role: Accessible.Animation + Accessible.name: qsTr("Busy indicator") + Accessible.description: qsTr("Displayed when the model is loading") + } + } + + SettingsDialog { + id: settingsDialog + anchors.centerIn: parent + width: Math.min(1024, window.width - (window.width * .2)) + height: Math.min(600, window.height - (window.height * .2)) + } + + Button { + id: drawerButton + anchors.left: parent.left + anchors.top: parent.top + anchors.topMargin: 30 + anchors.leftMargin: 30 + width: 40 + height: 40 + z: 200 + padding: 15 + + Accessible.role: Accessible.ButtonMenu + Accessible.name: qsTr("Hamburger button") + Accessible.description: qsTr("Hamburger button that reveals a drawer on the left of the application") + + background: Item { + anchors.centerIn: parent + width: 30 + height: 30 + + Rectangle { + id: bar1 + 
color: theme.backgroundLightest + width: parent.width + height: 6 + radius: 2 + antialiasing: true + } + + Rectangle { + id: bar2 + anchors.centerIn: parent + color: theme.backgroundLightest + width: parent.width + height: 6 + radius: 2 + antialiasing: true + } + + Rectangle { + id: bar3 + anchors.bottom: parent.bottom + color: theme.backgroundLightest + width: parent.width + height: 6 + radius: 2 + antialiasing: true + } + } + onClicked: { + drawer.visible = !drawer.visible + } + } + + NetworkDialog { + id: networkDialog + anchors.centerIn: parent + width: Math.min(1024, window.width - (window.width * .2)) + height: Math.min(600, window.height - (window.height * .2)) + Item { + Accessible.role: Accessible.Dialog + Accessible.name: qsTr("Network dialog") + Accessible.description: qsTr("Dialog for opt-in to sharing feedback/conversations") + } + } + + Button { + id: networkButton + anchors.right: parent.right + anchors.top: parent.top + anchors.topMargin: 30 + anchors.rightMargin: 30 + width: 40 + height: 40 + z: 200 + padding: 15 + + Accessible.role: Accessible.Button + Accessible.name: qsTr("Network button") + Accessible.description: qsTr("Reveals a dialogue where you can opt-in for sharing data over network") + + background: Item { + anchors.fill: parent + Rectangle { + anchors.fill: parent + color: "transparent" + visible: Network.isActive + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + } + Image { + anchors.centerIn: parent + width: 30 + height: 30 + source: "qrc:/gpt4all/icons/network.svg" + } + } + + onClicked: { + if (Network.isActive) { + Network.isActive = false + Network.sendNetworkToggled(false); + } else + networkDialog.open() + } + } + + Connections { + target: Network + function onHealthCheckFailed(code) { + healthCheckFailed.open(); + } + } + + Button { + id: settingsButton + anchors.right: networkButton.left + anchors.top: parent.top + anchors.topMargin: 30 + anchors.rightMargin: 30 + width: 40 + height: 40 + z: 200 + 
padding: 15 + + background: Item { + anchors.fill: parent + Image { + anchors.centerIn: parent + width: 30 + height: 30 + source: "qrc:/gpt4all/icons/settings.svg" + } + } + + Accessible.role: Accessible.Button + Accessible.name: qsTr("Settings button") + Accessible.description: qsTr("Reveals a dialogue where you can change various settings") + + onClicked: { + settingsDialog.open() + } + } + + PopupDialog { + id: copyMessage + anchors.centerIn: parent + text: qsTr("Conversation copied to clipboard.") + } + + PopupDialog { + id: healthCheckFailed + anchors.centerIn: parent + text: qsTr("Connection to datalake failed.") + } + + PopupDialog { + id: recalcPopup + anchors.centerIn: parent + shouldTimeOut: false + shouldShowBusy: true + text: qsTr("Recalculating context.") + + Connections { + target: currentChat + function onRecalcChanged() { + if (currentChat.isRecalc) + recalcPopup.open() + else + recalcPopup.close() + } + } + } + + Button { + id: copyButton + anchors.right: settingsButton.left + anchors.top: parent.top + anchors.topMargin: 30 + anchors.rightMargin: 30 + width: 40 + height: 40 + z: 200 + padding: 15 + + Accessible.role: Accessible.Button + Accessible.name: qsTr("Copy button") + Accessible.description: qsTr("Copy the conversation to the clipboard") + + background: Item { + anchors.fill: parent + Image { + anchors.centerIn: parent + width: 30 + height: 30 + source: "qrc:/gpt4all/icons/copy.svg" + } + } + + TextEdit{ + id: copyEdit + visible: false + } + + onClicked: { + var conversation = getConversation() + copyEdit.text = conversation + copyEdit.selectAll() + copyEdit.copy() + copyMessage.open() + } + } + + function getConversation() { + var conversation = ""; + for (var i = 0; i < chatModel.count; i++) { + var item = chatModel.get(i) + var string = item.name; + var isResponse = item.name === qsTr("Response: ") + string += chatModel.get(i).value + if (isResponse && item.stopped) + string += " " + string += "\n" + conversation += string + } + return 
conversation + } + + function getConversationJson() { + var str = "{\"conversation\": ["; + for (var i = 0; i < chatModel.count; i++) { + var item = chatModel.get(i) + var isResponse = item.name === qsTr("Response: ") + str += "{\"content\": "; + str += JSON.stringify(item.value) + str += ", \"role\": \"" + (isResponse ? "assistant" : "user") + "\""; + if (isResponse && item.thumbsUpState !== item.thumbsDownState) + str += ", \"rating\": \"" + (item.thumbsUpState ? "positive" : "negative") + "\""; + if (isResponse && item.newResponse !== "") + str += ", \"edited_content\": " + JSON.stringify(item.newResponse); + if (isResponse && item.stopped) + str += ", \"stopped\": \"true\"" + if (!isResponse) + str += "}," + else + str += ((i < chatModel.count - 1) ? "}," : "}") + } + return str + "]}" + } + + Button { + id: resetContextButton + anchors.right: copyButton.left + anchors.top: parent.top + anchors.topMargin: 30 + anchors.rightMargin: 30 + width: 40 + height: 40 + z: 200 + padding: 15 + + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Reset the context which erases current conversation") + + background: Item { + anchors.fill: parent + Image { + anchors.centerIn: parent + width: 30 + height: 30 + source: "qrc:/gpt4all/icons/regenerate.svg" + } + } + + onClicked: { + Network.sendResetContext(chatModel.count) + currentChat.reset(); + } + } + + Dialog { + id: checkForUpdatesError + anchors.centerIn: parent + modal: false + opacity: 0.9 + padding: 20 + Text { + horizontalAlignment: Text.AlignJustify + text: qsTr("ERROR: Update system could not find the MaintenanceTool used
+ to check for updates!

+ Did you install this application using the online installer? If so,
+ the MaintenanceTool executable should be located one directory
+ above where this application resides on your filesystem.

+ If you can't start it manually, then I'm afraid you'll have to
+ reinstall.") + color: theme.textColor + Accessible.role: Accessible.Dialog + Accessible.name: text + Accessible.description: qsTr("Dialog indicating an error") + } + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + } + + ModelDownloaderDialog { + id: downloadNewModels + anchors.centerIn: parent + width: Math.min(1024, window.width - (window.width * .2)) + height: Math.min(600, window.height - (window.height * .2)) + Item { + Accessible.role: Accessible.Dialog + Accessible.name: qsTr("Download new models dialog") + Accessible.description: qsTr("Dialog for downloading new models") + } + } + + ChatDrawer { + id: drawer + y: header.height + width: 0.3 * window.width + height: window.height - y + onDownloadClicked: { + downloadNewModels.open() + } + onAboutClicked: { + aboutDialog.open() + } + } + + Rectangle { + id: conversation + color: theme.backgroundLight + anchors.left: parent.left + anchors.right: parent.right + anchors.bottom: parent.bottom + anchors.top: header.bottom + + ScrollView { + id: scrollView + anchors.left: parent.left + anchors.right: parent.right + anchors.top: parent.top + anchors.bottom: textInputView.top + anchors.bottomMargin: 30 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + + Rectangle { + anchors.fill: parent + color: theme.backgroundLighter + + ListView { + id: listView + anchors.fill: parent + model: chatModel + + Accessible.role: Accessible.List + Accessible.name: qsTr("List of prompt/response pairs") + Accessible.description: qsTr("This is the list of prompt/response pairs comprising the actual conversation with the model") + + delegate: TextArea { + text: value + width: listView.width + color: theme.textColor + wrapMode: Text.WordWrap + focus: false + readOnly: true + font.pixelSize: theme.fontSizeLarge + cursorVisible: currentResponse ? 
currentChat.responseInProgress : false + cursorPosition: text.length + background: Rectangle { + color: name === qsTr("Response: ") ? theme.backgroundLighter : theme.backgroundLight + } + + Accessible.role: Accessible.Paragraph + Accessible.name: name + Accessible.description: name === qsTr("Response: ") ? "The response by the model" : "The prompt by the user" + + topPadding: 20 + bottomPadding: 20 + leftPadding: 100 + rightPadding: 100 + + BusyIndicator { + anchors.left: parent.left + anchors.leftMargin: 90 + anchors.top: parent.top + anchors.topMargin: 5 + visible: (currentResponse ? true : false) && value === "" && currentChat.responseInProgress + running: (currentResponse ? true : false) && value === "" && currentChat.responseInProgress + + Accessible.role: Accessible.Animation + Accessible.name: qsTr("Busy indicator") + Accessible.description: qsTr("Displayed when the model is thinking") + } + + Rectangle { + anchors.left: parent.left + anchors.top: parent.top + anchors.leftMargin: 20 + anchors.topMargin: 20 + width: 30 + height: 30 + radius: 5 + color: name === qsTr("Response: ") ? theme.assistantColor : theme.userColor + + Text { + anchors.centerIn: parent + text: name === qsTr("Response: ") ? "R" : "P" + color: "white" + } + } + + ThumbsDownDialog { + id: thumbsDownDialog + property point globalPoint: mapFromItem(window, + window.width / 2 - width / 2, + window.height / 2 - height / 2) + x: globalPoint.x + y: globalPoint.y + property string text: value + response: newResponse === undefined || newResponse === "" ? 
text : newResponse + onAccepted: { + var responseHasChanged = response !== text && response !== newResponse + if (thumbsDownState && !thumbsUpState && !responseHasChanged) + return + + chatModel.updateNewResponse(index, response) + chatModel.updateThumbsUpState(index, false) + chatModel.updateThumbsDownState(index, true) + Network.sendConversation(currentChat.id, getConversationJson()); + } + } + + Column { + visible: name === qsTr("Response: ") && + (!currentResponse || !currentChat.responseInProgress) && Network.isActive + anchors.right: parent.right + anchors.rightMargin: 20 + anchors.top: parent.top + anchors.topMargin: 20 + spacing: 10 + + Item { + width: childrenRect.width + height: childrenRect.height + Button { + id: thumbsUp + width: 30 + height: 30 + opacity: thumbsUpState || thumbsUpState == thumbsDownState ? 1.0 : 0.2 + background: Image { + anchors.fill: parent + source: "qrc:/gpt4all/icons/thumbs_up.svg" + } + onClicked: { + if (thumbsUpState && !thumbsDownState) + return + + chatModel.updateNewResponse(index, "") + chatModel.updateThumbsUpState(index, true) + chatModel.updateThumbsDownState(index, false) + Network.sendConversation(currentChat.id, getConversationJson()); + } + } + + Button { + id: thumbsDown + anchors.top: thumbsUp.top + anchors.topMargin: 10 + anchors.left: thumbsUp.right + anchors.leftMargin: 2 + width: 30 + height: 30 + checked: thumbsDownState + opacity: thumbsDownState || thumbsUpState == thumbsDownState ? 
1.0 : 0.2 + transform: [ + Matrix4x4 { + matrix: Qt.matrix4x4(-1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1) + }, + Translate { + x: thumbsDown.width + } + ] + background: Image { + anchors.fill: parent + source: "qrc:/gpt4all/icons/thumbs_down.svg" + } + onClicked: { + thumbsDownDialog.open() + } + } + } + } + } + + property bool shouldAutoScroll: true + property bool isAutoScrolling: false + + Connections { + target: currentChat + function onResponseChanged() { + if (listView.shouldAutoScroll) { + listView.isAutoScrolling = true + listView.positionViewAtEnd() + listView.isAutoScrolling = false + } + } + } + + onContentYChanged: { + if (!isAutoScrolling) + shouldAutoScroll = atYEnd + } + + Component.onCompleted: { + shouldAutoScroll = true + positionViewAtEnd() + } + + footer: Item { + id: bottomPadding + width: parent.width + height: 60 + } + } + } + } + + Button { + visible: chatModel.count + Image { + anchors.verticalCenter: parent.verticalCenter + anchors.left: parent.left + anchors.leftMargin: 15 + source: currentChat.responseInProgress ? 
"qrc:/gpt4all/icons/stop_generating.svg" : "qrc:/gpt4all/icons/regenerate.svg" + } + leftPadding: 50 + onClicked: { + var index = Math.max(0, chatModel.count - 1); + var listElement = chatModel.get(index); + + if (currentChat.responseInProgress) { + listElement.stopped = true + currentChat.stopGenerating() + } else { + currentChat.regenerateResponse() + if (chatModel.count) { + if (listElement.name === qsTr("Response: ")) { + chatModel.updateCurrentResponse(index, true); + chatModel.updateStopped(index, false); + chatModel.updateThumbsUpState(index, false); + chatModel.updateThumbsDownState(index, false); + chatModel.updateNewResponse(index, ""); + currentChat.prompt(listElement.prompt, settingsDialog.promptTemplate, + settingsDialog.maxLength, + settingsDialog.topK, settingsDialog.topP, + settingsDialog.temperature, + settingsDialog.promptBatchSize, + settingsDialog.repeatPenalty, + settingsDialog.repeatPenaltyTokens) + } + } + } + } + anchors.bottom: textInputView.top + anchors.horizontalCenter: textInputView.horizontalCenter + anchors.bottomMargin: 40 + padding: 15 + contentItem: Text { + text: currentChat.responseInProgress ? 
qsTr("Stop generating") : qsTr("Regenerate response") + color: theme.textColor + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Controls generation of the response") + } + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + } + + ScrollView { + id: textInputView + anchors.left: parent.left + anchors.right: parent.right + anchors.bottom: parent.bottom + anchors.margins: 30 + height: Math.min(contentHeight, 200) + + TextArea { + id: textInput + color: theme.textColor + padding: 20 + rightPadding: 40 + enabled: currentChat.isModelLoaded + wrapMode: Text.WordWrap + font.pixelSize: theme.fontSizeLarge + placeholderText: qsTr("Send a message...") + placeholderTextColor: theme.backgroundLightest + background: Rectangle { + color: theme.backgroundLighter + radius: 10 + } + Accessible.role: Accessible.EditableText + Accessible.name: placeholderText + Accessible.description: qsTr("Textfield for sending messages/prompts to the model") + Keys.onReturnPressed: (event)=> { + if (event.modifiers & Qt.ControlModifier || event.modifiers & Qt.ShiftModifier) + event.accepted = false; + else { + editingFinished(); + sendMessage() + } + } + function sendMessage() { + if (textInput.text === "") + return + + currentChat.stopGenerating() + + if (chatModel.count) { + var index = Math.max(0, chatModel.count - 1); + var listElement = chatModel.get(index); + chatModel.updateCurrentResponse(index, false); + } + currentChat.newPromptResponsePair(textInput.text); + currentChat.prompt(textInput.text, settingsDialog.promptTemplate, + settingsDialog.maxLength, + settingsDialog.topK, + settingsDialog.topP, + settingsDialog.temperature, + settingsDialog.promptBatchSize, + settingsDialog.repeatPenalty, + settingsDialog.repeatPenaltyTokens) + textInput.text = "" + } + } + } + + Button { + anchors.right: textInputView.right + anchors.verticalCenter: 
textInputView.verticalCenter + anchors.rightMargin: 15 + width: 30 + height: 30 + + background: Image { + anchors.centerIn: parent + source: "qrc:/gpt4all/icons/send_message.svg" + } + + Accessible.role: Accessible.Button + Accessible.name: qsTr("Send the message button") + Accessible.description: qsTr("Sends the message/prompt contained in textfield to the model") + + onClicked: { + textInput.sendMessage() + } + } + } +} diff --git a/gpt4all-chat/network.cpp b/gpt4all-chat/network.cpp new file mode 100644 index 00000000..d70bf7df --- /dev/null +++ b/gpt4all-chat/network.cpp @@ -0,0 +1,531 @@ +#include "network.h" +#include "llm.h" +#include "sysinfo.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include + +//#define DEBUG + +#if defined(Q_OS_MAC) +#include +std::string getCPUModel() { + char buffer[256]; + size_t bufferlen = sizeof(buffer); + sysctlbyname("machdep.cpu.brand_string", &buffer, &bufferlen, NULL, 0); + return std::string(buffer); +} +#endif + +class MyNetwork: public Network { }; +Q_GLOBAL_STATIC(MyNetwork, networkInstance) +Network *Network::globalInstance() +{ + return networkInstance(); +} + +Network::Network() + : QObject{nullptr} + , m_isActive(false) + , m_usageStatsActive(false) + , m_shouldSendStartup(false) +{ + QSettings settings; + settings.sync(); + m_uniqueId = settings.value("uniqueId", generateUniqueId()).toString(); + settings.setValue("uniqueId", m_uniqueId); + settings.sync(); + m_isActive = settings.value("network/isActive", false).toBool(); + if (m_isActive) + sendHealth(); + m_usageStatsActive = settings.value("network/usageStatsActive", false).toBool(); + if (m_usageStatsActive) + sendIpify(); + connect(&m_networkManager, &QNetworkAccessManager::sslErrors, this, + &Network::handleSslErrors); +} + +void Network::setActive(bool b) +{ + QSettings settings; + settings.setValue("network/isActive", b); + settings.sync(); + m_isActive = b; + emit activeChanged(); + if (m_isActive) + sendHealth(); 
+} + +void Network::setUsageStatsActive(bool b) +{ + QSettings settings; + settings.setValue("network/usageStatsActive", b); + settings.sync(); + m_usageStatsActive = b; + emit usageStatsActiveChanged(); + if (!m_usageStatsActive) + sendOptOut(); + else { + // model might be loaded already when user opt-in for first time + sendStartup(); + sendIpify(); + } +} + +QString Network::generateUniqueId() const +{ + return QUuid::createUuid().toString(QUuid::WithoutBraces); +} + +bool Network::packageAndSendJson(const QString &ingestId, const QString &json) +{ + if (!m_isActive) + return false; + + QJsonParseError err; + QJsonDocument doc = QJsonDocument::fromJson(json.toUtf8(), &err); + if (err.error != QJsonParseError::NoError) { + qDebug() << "Couldn't parse: " << json << err.errorString(); + return false; + } + + Q_ASSERT(doc.isObject()); + Q_ASSERT(LLM::globalInstance()->chatListModel()->currentChat()); + QJsonObject object = doc.object(); + object.insert("source", "gpt4all-chat"); + object.insert("agent_id", LLM::globalInstance()->chatListModel()->currentChat()->modelName()); + object.insert("submitter_id", m_uniqueId); + object.insert("ingest_id", ingestId); + + QSettings settings; + settings.sync(); + QString attribution = settings.value("network/attribution", QString()).toString(); + if (!attribution.isEmpty()) + object.insert("network/attribution", attribution); + + QJsonDocument newDoc; + newDoc.setObject(object); + +#if defined(DEBUG) + printf("%s\n", qPrintable(newDoc.toJson(QJsonDocument::Indented))); + fflush(stdout); +#endif + + QUrl jsonUrl("https://api.gpt4all.io/v1/ingest/chat"); + QNetworkRequest request(jsonUrl); + QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + QByteArray body(newDoc.toJson()); + request.setHeader(QNetworkRequest::ContentTypeHeader, "application/json"); + QNetworkReply *jsonReply = m_networkManager.post(request, body); + connect(jsonReply, 
&QNetworkReply::finished, this, &Network::handleJsonUploadFinished); + m_activeUploads.append(jsonReply); + return true; +} + +void Network::handleJsonUploadFinished() +{ + QNetworkReply *jsonReply = qobject_cast(sender()); + if (!jsonReply) + return; + + m_activeUploads.removeAll(jsonReply); + + QVariant response = jsonReply->attribute(QNetworkRequest::HttpStatusCodeAttribute); + Q_ASSERT(response.isValid()); + bool ok; + int code = response.toInt(&ok); + if (!ok) + qWarning() << "ERROR: ingest invalid response."; + if (code != 200) { + qWarning() << "ERROR: ingest response != 200 code:" << code; + sendHealth(); + } + + QByteArray jsonData = jsonReply->readAll(); + QJsonParseError err; + QJsonDocument document = QJsonDocument::fromJson(jsonData, &err); + if (err.error != QJsonParseError::NoError) { + qDebug() << "ERROR: Couldn't parse: " << jsonData << err.errorString(); + return; + } + +#if defined(DEBUG) + printf("%s\n", qPrintable(document.toJson(QJsonDocument::Indented))); + fflush(stdout); +#endif + + jsonReply->deleteLater(); +} + +void Network::handleSslErrors(QNetworkReply *reply, const QList &errors) +{ + QUrl url = reply->request().url(); + for (auto e : errors) + qWarning() << "ERROR: Received ssl error:" << e.errorString() << "for" << url; +} + +void Network::sendOptOut() +{ + QJsonObject properties; + properties.insert("token", "ce362e568ddaee16ed243eaffb5860a2"); + properties.insert("time", QDateTime::currentSecsSinceEpoch()); + properties.insert("distinct_id", m_uniqueId); + properties.insert("$insert_id", generateUniqueId()); + + QJsonObject event; + event.insert("event", "opt_out"); + event.insert("properties", properties); + + QJsonArray array; + array.append(event); + + QJsonDocument doc; + doc.setArray(array); + sendMixpanel(doc.toJson(), true /*isOptOut*/); + +#if defined(DEBUG) + printf("%s %s\n", qPrintable("opt_out"), qPrintable(doc.toJson(QJsonDocument::Indented))); + fflush(stdout); +#endif +} + +void Network::sendModelLoaded() +{ + if 
(!m_usageStatsActive) + return; + sendMixpanelEvent("model_load"); +} + +void Network::sendResetContext(int conversationLength) +{ + if (!m_usageStatsActive) + return; + + KeyValue kv; + kv.key = QString("length"); + kv.value = QJsonValue(conversationLength); + sendMixpanelEvent("reset_context", QVector{kv}); +} + +void Network::sendStartup() +{ + if (!m_usageStatsActive) + return; + m_shouldSendStartup = true; + if (m_ipify.isEmpty()) + return; // when it completes it will send + sendMixpanelEvent("startup"); +} + +void Network::sendCheckForUpdates() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("check_for_updates"); +} + +void Network::sendModelDownloaderDialog() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("download_dialog"); +} + +void Network::sendDownloadStarted(const QString &model) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("model"); + kv.value = QJsonValue(model); + sendMixpanelEvent("download_started", QVector{kv}); +} + +void Network::sendDownloadCanceled(const QString &model) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("model"); + kv.value = QJsonValue(model); + sendMixpanelEvent("download_canceled", QVector{kv}); +} + +void Network::sendDownloadError(const QString &model, int code, const QString &errorString) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("model"); + kv.value = QJsonValue(model); + KeyValue kvCode; + kvCode.key = QString("code"); + kvCode.value = QJsonValue(code); + KeyValue kvError; + kvError.key = QString("error"); + kvError.value = QJsonValue(errorString); + sendMixpanelEvent("download_error", QVector{kv, kvCode, kvError}); +} + +void Network::sendDownloadFinished(const QString &model, bool success) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("model"); + kv.value = QJsonValue(model); + KeyValue kvSuccess; + kvSuccess.key = QString("success"); + kvSuccess.value = QJsonValue(success); + 
sendMixpanelEvent("download_finished", QVector{kv, kvSuccess}); +} + +void Network::sendSettingsDialog() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("settings_dialog"); +} + +void Network::sendNetworkToggled(bool isActive) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("isActive"); + kv.value = QJsonValue(isActive); + sendMixpanelEvent("network_toggled", QVector{kv}); +} + +void Network::sendSaveChatsToggled(bool isActive) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("isActive"); + kv.value = QJsonValue(isActive); + sendMixpanelEvent("savechats_toggled", QVector{kv}); +} + +void Network::sendNewChat(int count) +{ + if (!m_usageStatsActive) + return; + KeyValue kv; + kv.key = QString("number_of_chats"); + kv.value = QJsonValue(count); + sendMixpanelEvent("new_chat", QVector{kv}); +} + +void Network::sendRemoveChat() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("remove_chat"); +} + +void Network::sendRenameChat() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("rename_chat"); +} + +void Network::sendChatStarted() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("chat_started"); +} + +void Network::sendRecalculatingContext(int conversationLength) +{ + if (!m_usageStatsActive) + return; + + KeyValue kv; + kv.key = QString("length"); + kv.value = QJsonValue(conversationLength); + sendMixpanelEvent("recalc_context", QVector{kv}); +} + +void Network::sendNonCompatHardware() +{ + if (!m_usageStatsActive) + return; + sendMixpanelEvent("noncompat_hardware"); +} + +void Network::sendMixpanelEvent(const QString &ev, const QVector &values) +{ + if (!m_usageStatsActive) + return; + + Q_ASSERT(LLM::globalInstance()->chatListModel()->currentChat()); + QJsonObject properties; + properties.insert("token", "ce362e568ddaee16ed243eaffb5860a2"); + properties.insert("time", QDateTime::currentSecsSinceEpoch()); + properties.insert("distinct_id", m_uniqueId); + 
properties.insert("$insert_id", generateUniqueId()); + properties.insert("$os", QSysInfo::prettyProductName()); + if (!m_ipify.isEmpty()) + properties.insert("ip", m_ipify); + properties.insert("name", QCoreApplication::applicationName() + " v" + + QCoreApplication::applicationVersion()); + properties.insert("model", LLM::globalInstance()->chatListModel()->currentChat()->modelName()); + + // Some additional startup information + if (ev == "startup") { + const QSize display = QGuiApplication::primaryScreen()->size(); + properties.insert("display", QString("%1x%2").arg(display.width()).arg(display.height())); + properties.insert("ram", getSystemTotalRAM()); +#if defined(__x86_64__) || defined(__i386__) + properties.insert("avx", bool(__builtin_cpu_supports("avx"))); + properties.insert("avx2", bool(__builtin_cpu_supports("avx2"))); + properties.insert("fma", bool(__builtin_cpu_supports("fma"))); +#endif +#if defined(Q_OS_MAC) + properties.insert("cpu", QString::fromStdString(getCPUModel())); +#endif + } + + for (auto p : values) + properties.insert(p.key, p.value); + + QJsonObject event; + event.insert("event", ev); + event.insert("properties", properties); + + QJsonArray array; + array.append(event); + + QJsonDocument doc; + doc.setArray(array); + sendMixpanel(doc.toJson()); + +#if defined(DEBUG) + printf("%s %s\n", qPrintable(ev), qPrintable(doc.toJson(QJsonDocument::Indented))); + fflush(stdout); +#endif +} + +void Network::sendIpify() +{ + if (!m_usageStatsActive || !m_ipify.isEmpty()) + return; + + QUrl ipifyUrl("https://api.ipify.org"); + QNetworkRequest request(ipifyUrl); + QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + QNetworkReply *reply = m_networkManager.get(request); + connect(reply, &QNetworkReply::finished, this, &Network::handleIpifyFinished); +} + +void Network::sendMixpanel(const QByteArray &json, bool isOptOut) +{ + if (!m_usageStatsActive && !isOptOut) + 
return; + + QUrl trackUrl("https://api.mixpanel.com/track"); + QNetworkRequest request(trackUrl); + QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + request.setHeader(QNetworkRequest::ContentTypeHeader, "application/json"); + QNetworkReply *trackReply = m_networkManager.post(request, json); + connect(trackReply, &QNetworkReply::finished, this, &Network::handleMixpanelFinished); +} + +void Network::handleIpifyFinished() +{ + Q_ASSERT(m_usageStatsActive); + QNetworkReply *reply = qobject_cast(sender()); + if (!reply) + return; + + QVariant response = reply->attribute(QNetworkRequest::HttpStatusCodeAttribute); + Q_ASSERT(response.isValid()); + bool ok; + int code = response.toInt(&ok); + if (!ok) + qWarning() << "ERROR: ipify invalid response."; + if (code != 200) + qWarning() << "ERROR: ipify response != 200 code:" << code; + m_ipify = qPrintable(reply->readAll()); +#if defined(DEBUG) + printf("ipify finished %s\n", m_ipify.toLatin1().constData()); + fflush(stdout); +#endif + reply->deleteLater(); + + if (m_shouldSendStartup) + sendStartup(); +} + +void Network::handleMixpanelFinished() +{ + QNetworkReply *reply = qobject_cast(sender()); + if (!reply) + return; + + QVariant response = reply->attribute(QNetworkRequest::HttpStatusCodeAttribute); + Q_ASSERT(response.isValid()); + bool ok; + int code = response.toInt(&ok); + if (!ok) + qWarning() << "ERROR: track invalid response."; + if (code != 200) + qWarning() << "ERROR: track response != 200 code:" << code; +#if defined(DEBUG) + printf("mixpanel finished %s\n", qPrintable(reply->readAll())); + fflush(stdout); +#endif + reply->deleteLater(); +} + +bool Network::sendConversation(const QString &ingestId, const QString &conversation) +{ + return packageAndSendJson(ingestId, conversation); +} + +void Network::sendHealth() +{ + QUrl healthUrl("https://api.gpt4all.io/v1/health"); + QNetworkRequest request(healthUrl); + 
QSslConfiguration conf = request.sslConfiguration(); + conf.setPeerVerifyMode(QSslSocket::VerifyNone); + request.setSslConfiguration(conf); + QNetworkReply *healthReply = m_networkManager.get(request); + connect(healthReply, &QNetworkReply::finished, this, &Network::handleHealthFinished); +} + +void Network::handleHealthFinished() +{ + QNetworkReply *healthReply = qobject_cast(sender()); + if (!healthReply) + return; + + QVariant response = healthReply->attribute(QNetworkRequest::HttpStatusCodeAttribute); + Q_ASSERT(response.isValid()); + bool ok; + int code = response.toInt(&ok); + if (!ok) + qWarning() << "ERROR: health invalid response."; + if (code != 200) { + qWarning() << "ERROR: health response != 200 code:" << code; + emit healthCheckFailed(code); + setActive(false); + } + healthReply->deleteLater(); +} diff --git a/gpt4all-chat/network.h b/gpt4all-chat/network.h new file mode 100644 index 00000000..1c9de2df --- /dev/null +++ b/gpt4all-chat/network.h @@ -0,0 +1,87 @@ +#ifndef NETWORK_H +#define NETWORK_H + +#include +#include +#include +#include + +struct KeyValue { + QString key; + QJsonValue value; +}; + +class Network : public QObject +{ + Q_OBJECT + Q_PROPERTY(bool isActive READ isActive WRITE setActive NOTIFY activeChanged) + Q_PROPERTY(bool usageStatsActive READ usageStatsActive WRITE setUsageStatsActive NOTIFY usageStatsActiveChanged) + +public: + static Network *globalInstance(); + + bool isActive() const { return m_isActive; } + void setActive(bool b); + + bool usageStatsActive() const { return m_usageStatsActive; } + void setUsageStatsActive(bool b); + + Q_INVOKABLE QString generateUniqueId() const; + Q_INVOKABLE bool sendConversation(const QString &ingestId, const QString &conversation); + +Q_SIGNALS: + void activeChanged(); + void usageStatsActiveChanged(); + void healthCheckFailed(int code); + +public Q_SLOTS: + void sendOptOut(); + void sendModelLoaded(); + void sendStartup(); + void sendCheckForUpdates(); + Q_INVOKABLE void 
sendModelDownloaderDialog(); + Q_INVOKABLE void sendResetContext(int conversationLength); + void sendDownloadStarted(const QString &model); + void sendDownloadCanceled(const QString &model); + void sendDownloadError(const QString &model, int code, const QString &errorString); + void sendDownloadFinished(const QString &model, bool success); + Q_INVOKABLE void sendSettingsDialog(); + Q_INVOKABLE void sendNetworkToggled(bool active); + Q_INVOKABLE void sendSaveChatsToggled(bool active); + Q_INVOKABLE void sendNewChat(int count); + Q_INVOKABLE void sendRemoveChat(); + Q_INVOKABLE void sendRenameChat(); + Q_INVOKABLE void sendNonCompatHardware(); + void sendChatStarted(); + void sendRecalculatingContext(int conversationLength); + +private Q_SLOTS: + void handleIpifyFinished(); + void handleHealthFinished(); + void handleJsonUploadFinished(); + void handleSslErrors(QNetworkReply *reply, const QList &errors); + void handleMixpanelFinished(); + +private: + void sendHealth(); + void sendIpify(); + void sendMixpanelEvent(const QString &event, const QVector &values = QVector()); + void sendMixpanel(const QByteArray &json, bool isOptOut = false); + bool packageAndSendJson(const QString &ingestId, const QString &json); + +private: + bool m_shouldSendStartup; + bool m_isActive; + bool m_usageStatsActive; + QString m_ipify; + QString m_uniqueId; + QNetworkAccessManager m_networkManager; + QVector m_activeUploads; + +private: + explicit Network(); + ~Network() {} + friend class MyNetwork; +}; + +#endif // LLM_H diff --git a/gpt4all-chat/qml/AboutDialog.qml b/gpt4all-chat/qml/AboutDialog.qml new file mode 100644 index 00000000..35d1ee43 --- /dev/null +++ b/gpt4all-chat/qml/AboutDialog.qml @@ -0,0 +1,113 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import download +import network +import llm + +Dialog { + id: abpoutDialog + anchors.centerIn: parent + modal: false + opacity: 0.9 + padding: 20 + width: 1024 + 
height: column.height + 40 + + Theme { + id: theme + } + + Column { + id: column + spacing: 20 + Item { + width: childrenRect.width + height: childrenRect.height + Image { + id: img + anchors.top: parent.top + anchors.left: parent.left + width: 60 + height: 60 + source: "qrc:/gpt4all/icons/logo.svg" + } + Text { + anchors.left: img.right + anchors.leftMargin: 30 + anchors.verticalCenter: img.verticalCenter + text: qsTr("About GPT4All") + color: theme.textColor + } + } + + ScrollView { + clip: true + height: 200 + width: 1024 - 40 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + ScrollBar.horizontal.policy: ScrollBar.AlwaysOff + + TextArea { + id: welcome + wrapMode: Text.Wrap + width: 1024 - 40 + padding: 20 + textFormat: TextEdit.MarkdownText + text: qsTr("### Release notes\n") + + Download.releaseInfo.notes + + qsTr("### Contributors\n") + + Download.releaseInfo.contributors + color: theme.textColor + focus: false + readOnly: true + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Release notes") + Accessible.description: qsTr("Release notes for this version") + background: Rectangle { + color: theme.backgroundLight + radius: 10 + } + } + } + + Label { + id: discordLink + width: parent.width + textFormat: Text.RichText + wrapMode: Text.WordWrap + text: qsTr("Check out our discord channel https://discord.gg/4M2QFmTt2k") + onLinkActivated: { Qt.openUrlExternally("https://discord.gg/4M2QFmTt2k") } + color: theme.textColor + linkColor: theme.linkColor + + Accessible.role: Accessible.Link + Accessible.name: qsTr("Discord link") + } + + Label { + id: nomicProps + width: parent.width + textFormat: Text.RichText + wrapMode: Text.WordWrap + text: qsTr("Thank you to Nomic AI and the community for contributing so much great data, code, ideas, and energy to the growing open source AI ecosystem!") + onLinkActivated: { Qt.openUrlExternally("https://home.nomic.ai") } + color: theme.textColor + linkColor: theme.linkColor + + Accessible.role: Accessible.Paragraph + 
Accessible.name: qsTr("Thank you blurb") + Accessible.description: qsTr("Contains embedded link to https://home.nomic.ai") + } + } + + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } +} diff --git a/gpt4all-chat/qml/ChatDrawer.qml b/gpt4all-chat/qml/ChatDrawer.qml new file mode 100644 index 00000000..d3298f1a --- /dev/null +++ b/gpt4all-chat/qml/ChatDrawer.qml @@ -0,0 +1,353 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import llm +import download +import network + +Drawer { + id: chatDrawer + modal: false + opacity: 0.9 + + Theme { + id: theme + } + + signal downloadClicked + signal aboutClicked + + background: Rectangle { + height: parent.height + color: theme.backgroundDarkest + } + + Item { + anchors.fill: parent + anchors.margins: 10 + + Accessible.role: Accessible.Pane + Accessible.name: qsTr("Drawer on the left of the application") + Accessible.description: qsTr("Drawer that is revealed by pressing the hamburger button") + + Button { + id: newChat + anchors.left: parent.left + anchors.right: parent.right + padding: 15 + font.pixelSize: theme.fontSizeLarger + background: Rectangle { + color: theme.backgroundDarkest + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + } + contentItem: Text { + text: qsTr("New chat") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Use this to launch an external application that will check for updates to the installer") + } + onClicked: { + LLM.chatListModel.addChat(); + Network.sendNewChat(LLM.chatListModel.count) + } + } + + ScrollView { + anchors.left: parent.left + anchors.right: parent.right + anchors.rightMargin: -10 + anchors.topMargin: 10 + anchors.top: newChat.bottom + anchors.bottom: 
checkForUpdatesButton.top + anchors.bottomMargin: 10 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + + ListView { + id: conversationList + anchors.fill: parent + anchors.rightMargin: 10 + + model: LLM.chatListModel + + delegate: Rectangle { + id: chatRectangle + width: conversationList.width + height: chatName.height + opacity: 0.9 + property bool isCurrent: LLM.chatListModel.currentChat === LLM.chatListModel.get(index) + property bool trashQuestionDisplayed: false + z: isCurrent ? 199 : 1 + color: index % 2 === 0 ? theme.backgroundLight : theme.backgroundLighter + border.width: isCurrent + border.color: chatName.readOnly ? theme.assistantColor : theme.userColor + TextField { + id: chatName + anchors.left: parent.left + anchors.right: buttons.left + color: theme.textColor + padding: 15 + focus: false + readOnly: true + wrapMode: Text.NoWrap + hoverEnabled: false // Disable hover events on the TextArea + selectByMouse: false // Disable text selection in the TextArea + font.pixelSize: theme.fontSizeLarger + text: readOnly ? metrics.elidedText : name + horizontalAlignment: TextInput.AlignLeft + opacity: trashQuestionDisplayed ? 
0.5 : 1.0 + TextMetrics { + id: metrics + font: chatName.font + text: name + elide: Text.ElideRight + elideWidth: chatName.width - 25 + } + background: Rectangle { + color: "transparent" + } + onEditingFinished: { + // Work around a bug in qml where we're losing focus when the whole window + // goes out of focus even though this textfield should be marked as not + // having focus + if (chatName.readOnly) + return; + changeName(); + Network.sendRenameChat() + } + function changeName() { + LLM.chatListModel.get(index).name = chatName.text + chatName.focus = false + chatName.readOnly = true + chatName.selectByMouse = false + } + TapHandler { + onTapped: { + if (isCurrent) + return; + LLM.chatListModel.currentChat = LLM.chatListModel.get(index); + } + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Select the current chat") + Accessible.description: qsTr("Provides a button to select the current chat or edit the chat when in edit mode") + } + Row { + id: buttons + anchors.verticalCenter: chatName.verticalCenter + anchors.right: chatRectangle.right + anchors.rightMargin: 10 + spacing: 10 + Button { + id: editButton + width: 30 + height: 30 + visible: isCurrent + opacity: trashQuestionDisplayed ? 
0.5 : 1.0 + background: Image { + width: 30 + height: 30 + source: "qrc:/gpt4all/icons/edit.svg" + } + onClicked: { + chatName.focus = true + chatName.readOnly = false + chatName.selectByMouse = true + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Edit the chat name") + Accessible.description: qsTr("Provides a button to edit the chat name") + } + Button { + id: c + width: 30 + height: 30 + visible: isCurrent + background: Image { + width: 30 + height: 30 + source: "qrc:/gpt4all/icons/trash.svg" + } + onClicked: { + trashQuestionDisplayed = true + timer.start() + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Delete of the chat") + Accessible.description: qsTr("Provides a button to delete the chat") + } + } + Rectangle { + id: trashSureQuestion + anchors.top: buttons.bottom + anchors.topMargin: 10 + anchors.right: buttons.right + width: childrenRect.width + height: childrenRect.height + color: chatRectangle.color + visible: isCurrent && trashQuestionDisplayed + opacity: 1.0 + radius: 10 + z: 200 + Row { + spacing: 10 + Button { + id: checkMark + width: 30 + height: 30 + contentItem: Text { + color: theme.textErrorColor + text: "\u2713" + font.pixelSize: theme.fontSizeLarger + horizontalAlignment: Text.AlignHCenter + verticalAlignment: Text.AlignVCenter + } + background: Rectangle { + width: 30 + height: 30 + color: "transparent" + } + onClicked: { + LLM.chatListModel.removeChat(LLM.chatListModel.get(index)) + Network.sendRemoveChat() + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Confirm delete of the chat") + Accessible.description: qsTr("Provides a button to confirm delete of the chat") + } + Button { + id: cancel + width: 30 + height: 30 + contentItem: Text { + color: theme.textColor + text: "\u2715" + font.pixelSize: theme.fontSizeLarger + horizontalAlignment: Text.AlignHCenter + verticalAlignment: Text.AlignVCenter + } + background: Rectangle { + width: 30 + height: 30 + color: "transparent" + } + onClicked: 
{ + trashQuestionDisplayed = false + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Cancel the delete of the chat") + Accessible.description: qsTr("Provides a button to cancel delete of the chat") + } + } + } + Timer { + id: timer + interval: 3000; running: false; repeat: false + onTriggered: trashQuestionDisplayed = false + } + } + + Accessible.role: Accessible.List + Accessible.name: qsTr("List of chats") + Accessible.description: qsTr("List of chats in the drawer dialog") + } + } + + Button { + id: checkForUpdatesButton + anchors.left: parent.left + anchors.right: parent.right + anchors.bottom: downloadButton.top + anchors.bottomMargin: 10 + padding: 15 + contentItem: Text { + text: qsTr("Updates") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Use this to launch an external application that will check for updates to the installer") + } + + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + + onClicked: { + if (!LLM.checkForUpdates()) + checkForUpdatesError.open() + } + } + + Button { + id: downloadButton + anchors.left: parent.left + anchors.right: parent.right + anchors.bottom: aboutButton.top + anchors.bottomMargin: 10 + padding: 15 + contentItem: Text { + text: qsTr("Downloads") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Use this to launch a dialog to download new models") + } + + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + + onClicked: { + downloadClicked() + } + } + + Button { + id: aboutButton + anchors.left: parent.left + anchors.right: parent.right + anchors.bottom: parent.bottom + padding: 15 + contentItem: Text 
{ + text: qsTr("About") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Use this to launch a dialog to show the about page") + } + + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + + onClicked: { + aboutClicked() + } + } + } +} \ No newline at end of file diff --git a/gpt4all-chat/qml/ModelDownloaderDialog.qml b/gpt4all-chat/qml/ModelDownloaderDialog.qml new file mode 100644 index 00000000..0c2a58a5 --- /dev/null +++ b/gpt4all-chat/qml/ModelDownloaderDialog.qml @@ -0,0 +1,383 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Dialogs +import QtQuick.Layouts +import download +import llm +import network + +Dialog { + id: modelDownloaderDialog + modal: true + opacity: 0.9 + closePolicy: LLM.chatListModel.currentChat.modelList.length === 0 ? 
Popup.NoAutoClose : (Popup.CloseOnEscape | Popup.CloseOnPressOutside) + background: Rectangle { + anchors.fill: parent + anchors.margins: -20 + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + + onOpened: { + Network.sendModelDownloaderDialog(); + } + + property string defaultModelPath: Download.defaultLocalModelsPath() + property alias modelPath: settings.modelPath + Settings { + id: settings + property string modelPath: modelDownloaderDialog.defaultModelPath + } + + Component.onCompleted: { + Download.downloadLocalModelsPath = settings.modelPath + } + + Component.onDestruction: { + settings.sync() + } + + ColumnLayout { + anchors.fill: parent + anchors.margins: 20 + spacing: 30 + + Label { + id: listLabel + text: "Available Models:" + Layout.alignment: Qt.AlignLeft + Layout.fillWidth: true + color: theme.textColor + } + + ScrollView { + id: scrollView + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + Layout.fillWidth: true + Layout.fillHeight: true + clip: true + + ListView { + id: modelList + model: Download.modelList + boundsBehavior: Flickable.StopAtBounds + + delegate: Item { + id: delegateItem + width: modelList.width + height: modelName.height + modelName.padding + + description.height + description.padding + objectName: "delegateItem" + property bool downloading: false + Rectangle { + anchors.fill: parent + color: index % 2 === 0 ? 
theme.backgroundLight : theme.backgroundLighter + } + + Text { + id: modelName + objectName: "modelName" + property string filename: modelData.filename + text: filename.slice(5, filename.length - 4) + padding: 20 + anchors.top: parent.top + anchors.left: parent.left + font.bold: modelData.isDefault || modelData.bestGPTJ || modelData.bestLlama || modelData.bestMPT + color: theme.assistantColor + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Model file") + Accessible.description: qsTr("Model file to be downloaded") + } + + Text { + id: description + text: " - " + modelData.description + leftPadding: 20 + rightPadding: 20 + anchors.top: modelName.bottom + anchors.left: modelName.left + anchors.right: parent.right + wrapMode: Text.WordWrap + color: theme.textColor + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Description") + Accessible.description: qsTr("The description of the file") + } + + Text { + id: isDefault + text: qsTr("(default)") + visible: modelData.isDefault + anchors.top: modelName.top + anchors.left: modelName.right + padding: 20 + color: theme.textColor + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Default file") + Accessible.description: qsTr("Whether the file is the default model") + } + + Text { + text: modelData.filesize + anchors.top: modelName.top + anchors.left: isDefault.visible ? 
isDefault.right : modelName.right + padding: 20 + color: theme.textColor + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("File size") + Accessible.description: qsTr("The size of the file") + } + + Label { + id: speedLabel + anchors.top: modelName.top + anchors.right: itemProgressBar.left + padding: 20 + objectName: "speedLabel" + color: theme.textColor + text: "" + visible: downloading + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Download speed") + Accessible.description: qsTr("Download speed in bytes/kilobytes/megabytes per second") + } + + ProgressBar { + id: itemProgressBar + objectName: "itemProgressBar" + anchors.top: modelName.top + anchors.right: downloadButton.left + anchors.topMargin: 20 + anchors.rightMargin: 20 + width: 100 + visible: downloading + background: Rectangle { + implicitWidth: 200 + implicitHeight: 30 + color: theme.backgroundDarkest + radius: 3 + } + + contentItem: Item { + implicitWidth: 200 + implicitHeight: 25 + + Rectangle { + width: itemProgressBar.visualPosition * parent.width + height: parent.height + radius: 2 + color: theme.assistantColor + } + } + Accessible.role: Accessible.ProgressBar + Accessible.name: qsTr("Download progressBar") + Accessible.description: qsTr("Shows the progress made in the download") + } + + Item { + visible: modelData.calcHash + anchors.top: modelName.top + anchors.right: parent.right + + Label { + id: calcHashLabel + anchors.right: busyCalcHash.left + padding: 20 + objectName: "calcHashLabel" + color: theme.textColor + text: qsTr("Calculating MD5...") + Accessible.role: Accessible.Paragraph + Accessible.name: text + Accessible.description: qsTr("Whether the file hash is being calculated") + } + + BusyIndicator { + id: busyCalcHash + anchors.right: parent.right + padding: 20 + running: modelData.calcHash + Accessible.role: Accessible.Animation + Accessible.name: qsTr("Busy indicator") + Accessible.description: qsTr("Displayed when the file hash is being calculated") + } + 
} + + Label { + id: installedLabel + anchors.top: modelName.top + anchors.right: parent.right + padding: 20 + objectName: "installedLabel" + color: theme.textColor + text: qsTr("Already installed") + visible: modelData.installed + Accessible.role: Accessible.Paragraph + Accessible.name: text + Accessible.description: qsTr("Whether the file is already installed on your system") + } + + Button { + id: downloadButton + contentItem: Text { + color: theme.textColor + text: downloading ? "Cancel" : "Download" + } + anchors.top: modelName.top + anchors.right: parent.right + anchors.topMargin: 15 + anchors.rightMargin: 20 + visible: !modelData.installed && !modelData.calcHash + onClicked: { + if (!downloading) { + downloading = true; + Download.downloadModel(modelData.filename); + } else { + downloading = false; + Download.cancelDownload(modelData.filename); + } + } + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Cancel/Download button to stop/start the download") + + } + } + + Component.onCompleted: { + Download.downloadProgress.connect(updateProgress); + Download.downloadFinished.connect(resetProgress); + } + + property var lastUpdate: ({}) + + function updateProgress(bytesReceived, bytesTotal, modelName) { + let currentTime = new Date().getTime(); + + for (let i = 0; i < modelList.contentItem.children.length; i++) { + let delegateItem = modelList.contentItem.children[i]; + if (delegateItem.objectName === "delegateItem") { + let modelNameText = delegateItem.children.find(child => child.objectName === "modelName").filename; + if (modelNameText === modelName) { + let progressBar = delegateItem.children.find(child => child.objectName === "itemProgressBar"); + progressBar.value = bytesReceived / bytesTotal; + + // Calculate the download speed + if (lastUpdate[modelName] && 
lastUpdate[modelName].timestamp) { + let timeDifference = currentTime - lastUpdate[modelName].timestamp; + let bytesDifference = bytesReceived - lastUpdate[modelName].bytesReceived; + let speed = (bytesDifference / timeDifference) * 1000; // bytes per second + delegateItem.downloading = true + + // Update the speed label + let speedLabel = delegateItem.children.find(child => child.objectName === "speedLabel"); + if (speed < 1024) { + speedLabel.text = speed.toFixed(2) + " B/s"; + } else if (speed < 1024 * 1024) { + speedLabel.text = (speed / 1024).toFixed(2) + " KB/s"; + } else { + speedLabel.text = (speed / (1024 * 1024)).toFixed(2) + " MB/s"; + } + } + + // Update the lastUpdate object for the current model + lastUpdate[modelName] = {"timestamp": currentTime, "bytesReceived": bytesReceived}; + break; + } + } + } + } + + function resetProgress(modelName) { + for (let i = 0; i < modelList.contentItem.children.length; i++) { + let delegateItem = modelList.contentItem.children[i]; + if (delegateItem.objectName === "delegateItem") { + let modelNameText = delegateItem.children.find(child => child.objectName === "modelName").filename; + if (modelNameText === modelName) { + let progressBar = delegateItem.children.find(child => child.objectName === "itemProgressBar"); + progressBar.value = 0; + delegateItem.downloading = false; + + // Remove speed label text + let speedLabel = delegateItem.children.find(child => child.objectName === "speedLabel"); + speedLabel.text = ""; + + // Remove the lastUpdate object for the canceled model + delete lastUpdate[modelName]; + break; + } + } + } + } + } + } + + RowLayout { + Layout.alignment: Qt.AlignCenter + Layout.fillWidth: true + spacing: 20 + FolderDialog { + id: modelPathDialog + title: "Please choose a directory" + currentFolder: Download.downloadLocalModelsPath + onAccepted: { + Download.downloadLocalModelsPath = selectedFolder + settings.modelPath = Download.downloadLocalModelsPath + settings.sync() + } + } + Label { + id: 
modelPathLabel + text: qsTr("Download path:") + color: theme.textColor + Layout.row: 1 + Layout.column: 0 + } + TextField { + id: modelPathDisplayLabel + text: Download.downloadLocalModelsPath + readOnly: true + color: theme.textColor + Layout.fillWidth: true + ToolTip.text: qsTr("Path where model files will be downloaded to") + ToolTip.visible: hovered + Accessible.role: Accessible.ToolTip + Accessible.name: modelPathDisplayLabel.text + Accessible.description: ToolTip.text + background: Rectangle { + color: theme.backgroundLighter + radius: 10 + } + } + Button { + text: qsTr("Browse") + contentItem: Text { + text: qsTr("Browse") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Opens a folder picker dialog to choose where to save model files") + } + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + onClicked: modelPathDialog.open() + } + } + } +} diff --git a/gpt4all-chat/qml/NetworkDialog.qml b/gpt4all-chat/qml/NetworkDialog.qml new file mode 100644 index 00000000..10b97bf9 --- /dev/null +++ b/gpt4all-chat/qml/NetworkDialog.qml @@ -0,0 +1,174 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import download +import network +import llm + +Dialog { + id: networkDialog + anchors.centerIn: parent + modal: true + opacity: 0.9 + padding: 20 + + Theme { + id: theme + } + + Settings { + id: settings + category: "network" + property string attribution: "" + } + + Component.onDestruction: { + settings.sync() + } + + Column { + id: column + spacing: 20 + Item { + width: childrenRect.width + height: childrenRect.height + Image { + id: img + anchors.top: parent.top + anchors.left: parent.left + width: 60 + height: 60 + source: "qrc:/gpt4all/icons/logo.svg" + } + Text { + anchors.left: img.right + 
anchors.leftMargin: 30 + anchors.verticalCenter: img.verticalCenter + text: qsTr("Contribute data to the GPT4All Opensource Datalake.") + color: theme.textColor + } + } + + ScrollView { + clip: true + height: 300 + width: 1024 - 40 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + ScrollBar.horizontal.policy: ScrollBar.AlwaysOff + + TextArea { + id: textOptIn + wrapMode: Text.Wrap + width: 1024 - 40 + padding: 20 + text: qsTr("By enabling this feature, you will be able to participate in the democratic process of training a large language model by contributing data for future model improvements. + +When a GPT4All model responds to you and you have opted-in, your conversation will be sent to the GPT4All Open Source Datalake. Additionally, you can like/dislike its response. If you dislike a response, you can suggest an alternative response. This data will be collected and aggregated in the GPT4All Datalake. + +NOTE: By turning on this feature, you will be sending your data to the GPT4All Open Source Datalake. You should have no expectation of chat privacy when this feature is enabled. You should; however, have an expectation of an optional attribution if you wish. Your chat data will be openly available for anyone to download and will be used by Nomic AI to improve future GPT4All models. 
Nomic AI will retain all attribution information attached to your data and you will be credited as a contributor to any GPT4All model release that uses your data!") + color: theme.textColor + focus: false + readOnly: true + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Terms for opt-in") + Accessible.description: qsTr("Describes what will happen when you opt-in") + background: Rectangle { + color: theme.backgroundLight + radius: 10 + } + } + } + + TextField { + id: attribution + color: theme.textColor + padding: 20 + width: parent.width + text: settings.attribution + font.pixelSize: theme.fontSizeLarge + placeholderText: qsTr("Please provide a name for attribution (optional)") + placeholderTextColor: theme.backgroundLightest + background: Rectangle { + color: theme.backgroundLighter + radius: 10 + } + Accessible.role: Accessible.EditableText + Accessible.name: qsTr("Attribution (optional)") + Accessible.description: qsTr("Textfield for providing attribution") + onEditingFinished: { + settings.attribution = attribution.text; + settings.sync(); + } + } + } + + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + + footer: DialogButtonBox { + id: dialogBox + padding: 20 + alignment: Qt.AlignRight + spacing: 10 + Button { + contentItem: Text { + color: theme.textColor + text: qsTr("Enable") + } + background: Rectangle { + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Enable opt-in button") + + padding: 15 + DialogButtonBox.buttonRole: DialogButtonBox.AcceptRole + } + Button { + contentItem: Text { + color: theme.textColor + text: qsTr("Cancel") + } + background: Rectangle { + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + Accessible.role: 
Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Cancel opt-in button") + + padding: 15 + DialogButtonBox.buttonRole: DialogButtonBox.RejectRole + } + background: Rectangle { + color: "transparent" + } + } + + onAccepted: { + if (Network.isActive) + return + Network.isActive = true; + Network.sendNetworkToggled(true); + } + + onRejected: { + if (!Network.isActive) + return + Network.isActive = false; + Network.sendNetworkToggled(false); + } +} diff --git a/gpt4all-chat/qml/NewVersionDialog.qml b/gpt4all-chat/qml/NewVersionDialog.qml new file mode 100644 index 00000000..8da15f31 --- /dev/null +++ b/gpt4all-chat/qml/NewVersionDialog.qml @@ -0,0 +1,76 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import download +import network +import llm + +Dialog { + id: newVerionDialog + anchors.centerIn: parent + modal: true + opacity: 0.9 + width: contentItem.width + height: contentItem.height + padding: 20 + + Theme { + id: theme + } + + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + + Item { + id: contentItem + width: childrenRect.width + 40 + height: childrenRect.height + 40 + + Label { + id: label + anchors.top: parent.top + anchors.left: parent.left + topPadding: 20 + bottomPadding: 20 + text: qsTr("New version is available:") + color: theme.textColor + } + + Button { + id: button + anchors.left: label.right + anchors.leftMargin: 10 + anchors.verticalCenter: label.verticalCenter + padding: 20 + contentItem: Text { + text: qsTr("Update") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Use this to launch an external application that will check for updates to the installer") + } + + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + 
border.width: 1 + radius: 10 + color: theme.backgroundLight + } + + onClicked: { + if (!LLM.checkForUpdates()) + checkForUpdatesError.open() + } + } + } +} diff --git a/gpt4all-chat/qml/PopupDialog.qml b/gpt4all-chat/qml/PopupDialog.qml new file mode 100644 index 00000000..dfd80d54 --- /dev/null +++ b/gpt4all-chat/qml/PopupDialog.qml @@ -0,0 +1,71 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts + +Dialog { + id: popupDialog + anchors.centerIn: parent + opacity: 0.9 + padding: 20 + property alias text: textField.text + property bool shouldTimeOut: true + property bool shouldShowBusy: false + modal: shouldShowBusy + closePolicy: shouldShowBusy ? Popup.NoAutoClose : (Popup.CloseOnEscape | Popup.CloseOnPressOutside) + + Theme { + id: theme + } + + Row { + anchors.centerIn: parent + width: childrenRect.width + height: childrenRect.height + spacing: 20 + + Text { + id: textField + anchors.verticalCenter: busyIndicator.verticalCenter + horizontalAlignment: Text.AlignJustify + color: theme.textColor + Accessible.role: Accessible.HelpBalloon + Accessible.name: text + Accessible.description: qsTr("Reveals a shortlived help balloon") + } + + BusyIndicator { + id: busyIndicator + visible: shouldShowBusy + running: shouldShowBusy + + Accessible.role: Accessible.Animation + Accessible.name: qsTr("Busy indicator") + Accessible.description: qsTr("Displayed when the popup is showing busy") + } + } + + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + + exit: Transition { + NumberAnimation { duration: 500; property: "opacity"; from: 1.0; to: 0.0 } + } + + onOpened: { + if (shouldTimeOut) + timer.start() + } + + Timer { + id: timer + interval: 500; running: false; repeat: false + onTriggered: popupDialog.close() + } +} \ No newline at end of file diff --git a/gpt4all-chat/qml/SettingsDialog.qml 
b/gpt4all-chat/qml/SettingsDialog.qml new file mode 100644 index 00000000..c9f3557f --- /dev/null +++ b/gpt4all-chat/qml/SettingsDialog.qml @@ -0,0 +1,828 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Dialogs +import QtQuick.Layouts +import download +import network +import llm + +Dialog { + id: settingsDialog + modal: true + opacity: 0.9 + background: Rectangle { + anchors.fill: parent + anchors.margins: -20 + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + + onOpened: { + Network.sendSettingsDialog(); + } + + property var currentChat: LLM.chatListModel.currentChat + + Theme { + id: theme + } + + property real defaultTemperature: 0.28 + property real defaultTopP: 0.95 + property int defaultTopK: 40 + property int defaultMaxLength: 4096 + property int defaultPromptBatchSize: 9 + property real defaultRepeatPenalty: 1.10 + property int defaultRepeatPenaltyTokens: 64 + property int defaultThreadCount: 0 + property bool defaultSaveChats: false + property string defaultPromptTemplate: "### Human: +%1 +### Assistant:\n" + property string defaultModelPath: Download.defaultLocalModelsPath() + property string defaultUserDefaultModel: "Application default" + + property alias temperature: settings.temperature + property alias topP: settings.topP + property alias topK: settings.topK + property alias maxLength: settings.maxLength + property alias promptBatchSize: settings.promptBatchSize + property alias promptTemplate: settings.promptTemplate + property alias repeatPenalty: settings.repeatPenalty + property alias repeatPenaltyTokens: settings.repeatPenaltyTokens + property alias threadCount: settings.threadCount + property alias saveChats: settings.saveChats + property alias modelPath: settings.modelPath + property alias userDefaultModel: settings.userDefaultModel + + Settings { + id: settings + property real temperature: settingsDialog.defaultTemperature + 
property real topP: settingsDialog.defaultTopP + property int topK: settingsDialog.defaultTopK + property int maxLength: settingsDialog.defaultMaxLength + property int promptBatchSize: settingsDialog.defaultPromptBatchSize + property int threadCount: settingsDialog.defaultThreadCount + property bool saveChats: settingsDialog.defaultSaveChats + property real repeatPenalty: settingsDialog.defaultRepeatPenalty + property int repeatPenaltyTokens: settingsDialog.defaultRepeatPenaltyTokens + property string promptTemplate: settingsDialog.defaultPromptTemplate + property string modelPath: settingsDialog.defaultModelPath + property string userDefaultModel: settingsDialog.defaultUserDefaultModel + } + + function restoreGenerationDefaults() { + settings.temperature = defaultTemperature + settings.topP = defaultTopP + settings.topK = defaultTopK + settings.maxLength = defaultMaxLength + settings.promptBatchSize = defaultPromptBatchSize + settings.promptTemplate = defaultPromptTemplate + settings.repeatPenalty = defaultRepeatPenalty + settings.repeatPenaltyTokens = defaultRepeatPenaltyTokens + settings.sync() + } + + function restoreApplicationDefaults() { + settings.modelPath = settingsDialog.defaultModelPath + settings.threadCount = defaultThreadCount + settings.saveChats = defaultSaveChats + settings.userDefaultModel = defaultUserDefaultModel + Download.downloadLocalModelsPath = settings.modelPath + LLM.threadCount = settings.threadCount + LLM.chatListModel.shouldSaveChats = settings.saveChats + settings.sync() + } + + Component.onCompleted: { + LLM.threadCount = settings.threadCount + LLM.chatListModel.shouldSaveChats = settings.saveChats + Download.downloadLocalModelsPath = settings.modelPath + } + + Connections { + target: settingsDialog + function onClosed() { + settings.sync() + } + } + + Item { + Accessible.role: Accessible.Dialog + Accessible.name: qsTr("Settings dialog") + Accessible.description: qsTr("Dialog containing various application settings") + } + TabBar { 
+ id: settingsTabBar + width: parent.width / 1.5 + + TabButton { + id: genSettingsButton + contentItem: IconLabel { + color: theme.textColor + font.bold: genSettingsButton.checked + font.pixelSize: genSettingsButton.checked ? theme.fontSizeLarger : theme.fontSizeLarge + text: qsTr("Generation") + } + background: Rectangle { + color: genSettingsButton.checked ? theme.backgroundDarkest : theme.backgroundLight + border.color: theme.tabBorder + border.width: 1 ? genSettingsButton.checked : 0 + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Generation settings") + Accessible.description: qsTr("Settings related to how the model generates text") + } + + TabButton { + id: appSettingsButton + contentItem: IconLabel { + color: theme.textColor + font.bold: appSettingsButton.checked + font.pixelSize: appSettingsButton.checked ? theme.fontSizeLarger : theme.fontSizeLarge + text: qsTr("Application") + } + background: Rectangle { + color: appSettingsButton.checked ? theme.backgroundDarkest : theme.backgroundLight + border.color: theme.tabBorder + border.width: 1 ? 
appSettingsButton.checked : 0 + } + Accessible.role: Accessible.Button + Accessible.name: qsTr("Application settings") + Accessible.description: qsTr("Settings related to general behavior of the application") + } + } + + StackLayout { + anchors.top: settingsTabBar.bottom + width: parent.width + height: availableHeight + currentIndex: settingsTabBar.currentIndex + + Item { + id: generationSettingsTab + ScrollView { + background: Rectangle { + color: 'transparent' + border.color: theme.tabBorder + border.width: 1 + radius: 2 + } + padding: 10 + width: parent.width + height: parent.height - 30 + contentWidth: availableWidth - 20 + contentHeight: generationSettingsTabInner.implicitHeight + 40 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + + GridLayout { + id: generationSettingsTabInner + anchors.margins: 10 + columns: 2 + rowSpacing: 10 + columnSpacing: 10 + anchors.fill: parent + + Label { + id: tempLabel + text: qsTr("Temperature:") + color: theme.textColor + Layout.row: 0 + Layout.column: 0 + } + TextField { + text: settings.temperature.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Temperature increases the chances of choosing less likely tokens - higher temperature gives more creative but less predictable outputs") + ToolTip.visible: hovered + Layout.row: 0 + Layout.column: 1 + validator: DoubleValidator { + locale: "C" + } + onEditingFinished: { + var val = parseFloat(text) + if (!isNaN(val)) { + settings.temperature = val + settings.sync() + focus = false + } else { + text = settings.temperature.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: tempLabel.text + Accessible.description: ToolTip.text + } + Label { + id: topPLabel + text: qsTr("Top P:") + color: theme.textColor + Layout.row: 1 + Layout.column: 0 + } + TextField { + text: settings.topP.toString() + color: theme.textColor + background: Rectangle { 
+ implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Only the most likely tokens up to a total probability of top_p can be chosen, prevents choosing highly unlikely tokens, aka Nucleus Sampling") + ToolTip.visible: hovered + Layout.row: 1 + Layout.column: 1 + validator: DoubleValidator { + locale: "C" + } + onEditingFinished: { + var val = parseFloat(text) + if (!isNaN(val)) { + settings.topP = val + settings.sync() + focus = false + } else { + text = settings.topP.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: topPLabel.text + Accessible.description: ToolTip.text + } + Label { + id: topKLabel + text: qsTr("Top K:") + color: theme.textColor + Layout.row: 2 + Layout.column: 0 + } + TextField { + text: settings.topK.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Only the top K most likely tokens will be chosen from") + ToolTip.visible: hovered + Layout.row: 2 + Layout.column: 1 + validator: IntValidator { + bottom: 1 + } + onEditingFinished: { + var val = parseInt(text) + if (!isNaN(val)) { + settings.topK = val + settings.sync() + focus = false + } else { + text = settings.topK.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: topKLabel.text + Accessible.description: ToolTip.text + } + Label { + id: maxLengthLabel + text: qsTr("Max Length:") + color: theme.textColor + Layout.row: 3 + Layout.column: 0 + } + TextField { + text: settings.maxLength.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Maximum length of response in tokens") + ToolTip.visible: hovered + Layout.row: 3 + Layout.column: 1 + validator: IntValidator { + bottom: 1 + } + onEditingFinished: { + var val = parseInt(text) + if (!isNaN(val)) { + 
settings.maxLength = val + settings.sync() + focus = false + } else { + text = settings.maxLength.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: maxLengthLabel.text + Accessible.description: ToolTip.text + } + + Label { + id: batchSizeLabel + text: qsTr("Prompt Batch Size:") + color: theme.textColor + Layout.row: 4 + Layout.column: 0 + } + TextField { + text: settings.promptBatchSize.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Amount of prompt tokens to process at once, higher values can speed up reading prompts but will use more RAM") + ToolTip.visible: hovered + Layout.row: 4 + Layout.column: 1 + validator: IntValidator { + bottom: 1 + } + onEditingFinished: { + var val = parseInt(text) + if (!isNaN(val)) { + settings.promptBatchSize = val + settings.sync() + focus = false + } else { + text = settings.promptBatchSize.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: batchSizeLabel.text + Accessible.description: ToolTip.text + } + Label { + id: repeatPenaltyLabel + text: qsTr("Repeat Penalty:") + color: theme.textColor + Layout.row: 5 + Layout.column: 0 + } + TextField { + text: settings.repeatPenalty.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Amount to penalize repetitiveness of the output") + ToolTip.visible: hovered + Layout.row: 5 + Layout.column: 1 + validator: DoubleValidator { + locale: "C" + } + onEditingFinished: { + var val = parseFloat(text) + if (!isNaN(val)) { + settings.repeatPenalty = val + settings.sync() + focus = false + } else { + text = settings.repeatPenalty.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: repeatPenaltyLabel.text + Accessible.description: ToolTip.text + } + Label { + id: 
repeatPenaltyTokensLabel + text: qsTr("Repeat Penalty Tokens:") + color: theme.textColor + Layout.row: 6 + Layout.column: 0 + } + TextField { + text: settings.repeatPenaltyTokens.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("How far back in output to apply repeat penalty") + ToolTip.visible: hovered + Layout.row: 6 + Layout.column: 1 + validator: IntValidator { + bottom: 1 + } + onEditingFinished: { + var val = parseInt(text) + if (!isNaN(val)) { + settings.repeatPenaltyTokens = val + settings.sync() + focus = false + } else { + text = settings.repeatPenaltyTokens.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: repeatPenaltyTokensLabel.text + Accessible.description: ToolTip.text + } + + Label { + id: promptTemplateLabel + text: qsTr("Prompt Template:") + color: theme.textColor + Layout.row: 7 + Layout.column: 0 + } + Rectangle { + Layout.row: 7 + Layout.column: 1 + Layout.fillWidth: true + height: 200 + color: "transparent" + clip: true + Label { + id: promptTemplateLabelHelp + visible: settings.promptTemplate.indexOf( + "%1") === -1 + font.bold: true + color: theme.textErrorColor + text: qsTr("Prompt template must contain %1 to be replaced with the user's input.") + anchors.fill: templateScrollView + z: 200 + padding: 10 + wrapMode: TextArea.Wrap + Accessible.role: Accessible.EditableText + Accessible.name: text + } + ScrollView { + id: templateScrollView + anchors.fill: parent + TextArea { + text: settings.promptTemplate + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + wrapMode: TextArea.Wrap + onTextChanged: { + settings.promptTemplate = text + settings.sync() + } + bottomPadding: 10 + Accessible.role: Accessible.EditableText + Accessible.name: promptTemplateLabel.text + Accessible.description: 
promptTemplateLabelHelp.text + } + } + } + Button { + Layout.row: 8 + Layout.column: 1 + Layout.fillWidth: true + padding: 10 + contentItem: Text { + text: qsTr("Restore Defaults") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Restores the settings dialog to a default state") + } + + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + onClicked: { + settingsDialog.restoreGenerationDefaults() + } + } + } + } + } + Item { + id: applicationSettingsTab + ScrollView { + background: Rectangle { + color: 'transparent' + border.color: theme.tabBorder + border.width: 1 + radius: 2 + } + padding: 10 + width: parent.width + height: parent.height - 30 + contentWidth: availableWidth - 20 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + + GridLayout { + anchors.margins: 10 + columns: 3 + rowSpacing: 10 + columnSpacing: 10 + anchors.fill: parent + Label { + id: defaultModelLabel + text: qsTr("Default model:") + color: theme.textColor + Layout.row: 1 + Layout.column: 0 + } + ComboBox { + id: comboBox + Layout.row: 1 + Layout.column: 1 + Layout.minimumWidth: 350 + font.pixelSize: theme.fontSizeLarge + spacing: 0 + padding: 10 + model: modelList + Accessible.role: Accessible.ComboBox + Accessible.name: qsTr("ComboBox for displaying/picking the default model") + Accessible.description: qsTr("Use this for picking the default model to use; the first item is the current default model") + function updateModel(newModelList) { + var newArray = Array.from(newModelList); + newArray.unshift('Application default'); + comboBox.model = newArray; + settings.sync(); + comboBox.currentIndex = comboBox.indexOfValue(settingsDialog.userDefaultModel); + + } + Component.onCompleted: { + comboBox.updateModel(currentChat.modelList) + } + Connections { + target: settings + function 
onUserDefaultModelChanged() { + comboBox.updateModel(currentChat.modelList) + } + } + Connections { + target: currentChat + function onModelListChanged() { + comboBox.updateModel(currentChat.modelList) + } + } + contentItem: Text { + anchors.horizontalCenter: parent.horizontalCenter + leftPadding: 10 + rightPadding: 10 + text: comboBox.displayText + font: comboBox.font + color: theme.textColor + verticalAlignment: Text.AlignVCenter + horizontalAlignment: Text.AlignHCenter + elide: Text.ElideRight + } + delegate: ItemDelegate { + width: comboBox.width + contentItem: Text { + text: modelData + color: theme.textColor + font: comboBox.font + elide: Text.ElideRight + verticalAlignment: Text.AlignVCenter + } + background: Rectangle { + color: highlighted ? theme.backgroundLight : theme.backgroundDark + } + highlighted: comboBox.highlightedIndex === index + } + popup: Popup { + y: comboBox.height - 1 + width: comboBox.width + implicitHeight: contentItem.implicitHeight + padding: 0 + + contentItem: ListView { + clip: true + implicitHeight: contentHeight + model: comboBox.popup.visible ? 
comboBox.delegateModel : null + currentIndex: comboBox.highlightedIndex + ScrollIndicator.vertical: ScrollIndicator { } + } + + background: Rectangle { + color: theme.backgroundDark + } + } + + background: Rectangle { + color: theme.backgroundDark + border.width: 1 + border.color: theme.backgroundLightest + radius: 10 + } + + onActivated: { + settingsDialog.userDefaultModel = comboBox.currentText + settings.sync() + } + } + FolderDialog { + id: modelPathDialog + title: "Please choose a directory" + currentFolder: Download.downloadLocalModelsPath + onAccepted: { + Download.downloadLocalModelsPath = selectedFolder + settings.modelPath = Download.downloadLocalModelsPath + settings.sync() + } + } + Label { + id: modelPathLabel + text: qsTr("Download path:") + color: theme.textColor + Layout.row: 2 + Layout.column: 0 + } + TextField { + id: modelPathDisplayLabel + text: Download.downloadLocalModelsPath + readOnly: true + color: theme.textColor + implicitWidth: 300 + padding: 10 + Layout.row: 2 + Layout.column: 1 + Layout.fillWidth: true + ToolTip.text: qsTr("Path where model files will be downloaded to") + ToolTip.visible: hovered + Accessible.role: Accessible.ToolTip + Accessible.name: modelPathDisplayLabel.text + Accessible.description: ToolTip.text + background: Rectangle { + color: theme.backgroundLighter + radius: 10 + } + } + Button { + Layout.row: 2 + Layout.column: 2 + text: qsTr("Browse") + contentItem: Text { + text: qsTr("Browse") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Opens a folder picker dialog to choose where to save model files") + } + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + onClicked: modelPathDialog.open() + } + Label { + id: nThreadsLabel + text: qsTr("CPU Threads:") + color: theme.textColor + Layout.row: 3 + Layout.column: 0 + 
} + TextField { + text: settingsDialog.threadCount.toString() + color: theme.textColor + background: Rectangle { + implicitWidth: 150 + color: theme.backgroundLighter + radius: 10 + } + padding: 10 + ToolTip.text: qsTr("Amount of processing threads to use, a setting of 0 will use the lesser of 4 or your number of CPU threads") + ToolTip.visible: hovered + Layout.row: 3 + Layout.column: 1 + validator: IntValidator { + bottom: 1 + } + onEditingFinished: { + var val = parseInt(text) + if (!isNaN(val)) { + settingsDialog.threadCount = val + LLM.threadCount = val + settings.sync() + focus = false + } else { + text = settingsDialog.threadCount.toString() + } + } + Accessible.role: Accessible.EditableText + Accessible.name: nThreadsLabel.text + Accessible.description: ToolTip.text + } + Label { + id: saveChatsLabel + text: qsTr("Save chats to disk:") + color: theme.textColor + Layout.row: 4 + Layout.column: 0 + } + CheckBox { + id: saveChatsBox + Layout.row: 4 + Layout.column: 1 + checked: settingsDialog.saveChats + onClicked: { + Network.sendSaveChatsToggled(saveChatsBox.checked); + settingsDialog.saveChats = saveChatsBox.checked + LLM.chatListModel.shouldSaveChats = saveChatsBox.checked + settings.sync() + } + + ToolTip.text: qsTr("WARNING: Saving chats to disk can be ~2GB per chat") + ToolTip.visible: hovered + + background: Rectangle { + color: "transparent" + } + + indicator: Rectangle { + implicitWidth: 26 + implicitHeight: 26 + x: saveChatsBox.leftPadding + y: parent.height / 2 - height / 2 + border.color: theme.dialogBorder + color: "transparent" + + Rectangle { + width: 14 + height: 14 + x: 6 + y: 6 + color: theme.textColor + visible: saveChatsBox.checked + } + } + + contentItem: Text { + text: saveChatsBox.text + font: saveChatsBox.font + opacity: enabled ? 
1.0 : 0.3 + color: theme.textColor + verticalAlignment: Text.AlignVCenter + leftPadding: saveChatsBox.indicator.width + saveChatsBox.spacing + } + } + Button { + Layout.row: 5 + Layout.column: 1 + Layout.fillWidth: true + padding: 10 + contentItem: Text { + text: qsTr("Restore Defaults") + horizontalAlignment: Text.AlignHCenter + color: theme.textColor + Accessible.role: Accessible.Button + Accessible.name: text + Accessible.description: qsTr("Restores the settings dialog to a default state") + } + + background: Rectangle { + opacity: .5 + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + onClicked: { + settingsDialog.restoreApplicationDefaults() + } + } + } + } + } + } +} diff --git a/gpt4all-chat/qml/StartupDialog.qml b/gpt4all-chat/qml/StartupDialog.qml new file mode 100644 index 00000000..fabc02ef --- /dev/null +++ b/gpt4all-chat/qml/StartupDialog.qml @@ -0,0 +1,357 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import download +import network +import llm + +Dialog { + id: startupDialog + anchors.centerIn: parent + modal: true + opacity: 0.9 + padding: 20 + width: 1024 + height: column.height + 40 + closePolicy: !optInStatisticsRadio.choiceMade || !optInNetworkRadio.choiceMade ? 
Popup.NoAutoClose : (Popup.CloseOnEscape | Popup.CloseOnPressOutside) + + Theme { + id: theme + } + + Column { + id: column + spacing: 20 + Item { + width: childrenRect.width + height: childrenRect.height + Image { + id: img + anchors.top: parent.top + anchors.left: parent.left + width: 60 + height: 60 + source: "qrc:/gpt4all/icons/logo.svg" + } + Text { + anchors.left: img.right + anchors.leftMargin: 30 + anchors.verticalCenter: img.verticalCenter + text: qsTr("Welcome!") + color: theme.textColor + } + } + + ScrollView { + clip: true + height: 200 + width: 1024 - 40 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + ScrollBar.horizontal.policy: ScrollBar.AlwaysOff + + TextArea { + id: welcome + wrapMode: Text.Wrap + width: 1024 - 40 + padding: 20 + textFormat: TextEdit.MarkdownText + text: qsTr("### Release notes\n") + + Download.releaseInfo.notes + + qsTr("### Contributors\n") + + Download.releaseInfo.contributors + color: theme.textColor + focus: false + readOnly: true + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Release notes") + Accessible.description: qsTr("Release notes for this version") + background: Rectangle { + color: theme.backgroundLight + radius: 10 + } + } + } + + ScrollView { + clip: true + height: 150 + width: 1024 - 40 + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + ScrollBar.horizontal.policy: ScrollBar.AlwaysOff + + TextArea { + id: optInTerms + wrapMode: Text.Wrap + width: 1024 - 40 + padding: 20 + textFormat: TextEdit.MarkdownText + text: qsTr( +"### Opt-ins for anonymous usage analytics and datalake +By enabling these features, you will be able to participate in the democratic process of training a +large language model by contributing data for future model improvements. + +When a GPT4All model responds to you and you have opted-in, your conversation will be sent to the GPT4All +Open Source Datalake. Additionally, you can like/dislike its response. If you dislike a response, you +can suggest an alternative response. 
This data will be collected and aggregated in the GPT4All Datalake. + +NOTE: By turning on this feature, you will be sending your data to the GPT4All Open Source Datalake. +You should have no expectation of chat privacy when this feature is enabled. You should; however, have +an expectation of an optional attribution if you wish. Your chat data will be openly available for anyone +to download and will be used by Nomic AI to improve future GPT4All models. Nomic AI will retain all +attribution information attached to your data and you will be credited as a contributor to any GPT4All +model release that uses your data!") + + color: theme.textColor + focus: false + readOnly: true + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Terms for opt-in") + Accessible.description: qsTr("Describes what will happen when you opt-in") + background: Rectangle { + color: theme.backgroundLight + radius: 10 + } + } + } + + GridLayout { + columns: 2 + rowSpacing: 10 + columnSpacing: 10 + anchors.right: parent.right + Label { + id: optInStatistics + text: "Opt-in to anonymous usage analytics used to improve GPT4All" + Layout.row: 0 + Layout.column: 0 + color: theme.textColor + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Opt-in for anonymous usage statistics") + Accessible.description: qsTr("Label for opt-in") + } + + ButtonGroup { + buttons: optInStatisticsRadio.children + onClicked: { + Network.usageStatsActive = optInStatisticsRadio.checked + if (optInNetworkRadio.choiceMade && optInStatisticsRadio.choiceMade) + startupDialog.close(); + } + } + + RowLayout { + id: optInStatisticsRadio + Layout.alignment: Qt.AlignVCenter + Layout.row: 0 + Layout.column: 1 + property bool defaultChecked: Network.usageStatsActive + property alias checked: optInStatisticsRadioYes.checked + property bool choiceMade: optInStatisticsRadioYes.checked || optInStatisticsRadioNo.checked + + RadioButton { + id: optInStatisticsRadioYes + checked: 
optInStatisticsRadio.defaultChecked + text: qsTr("Yes") + Accessible.role: Accessible.RadioButton + Accessible.name: qsTr("Opt-in for anonymous usage statistics") + Accessible.description: qsTr("Radio button to allow opt-in for anonymous usage statistics") + + background: Rectangle { + color: "transparent" + } + + indicator: Rectangle { + implicitWidth: 26 + implicitHeight: 26 + x: optInStatisticsRadioYes.leftPadding + y: parent.height / 2 - height / 2 + radius: 13 + border.color: theme.dialogBorder + color: "transparent" + + Rectangle { + width: 14 + height: 14 + x: 6 + y: 6 + radius: 7 + color: theme.textColor + visible: optInStatisticsRadioYes.checked + } + } + + contentItem: Text { + text: optInStatisticsRadioYes.text + font: optInStatisticsRadioYes.font + opacity: enabled ? 1.0 : 0.3 + color: theme.textColor + verticalAlignment: Text.AlignVCenter + leftPadding: optInStatisticsRadioYes.indicator.width + optInStatisticsRadioYes.spacing + } + } + RadioButton { + id: optInStatisticsRadioNo + text: qsTr("No") + Accessible.role: Accessible.RadioButton + Accessible.name: qsTr("Opt-out for anonymous usage statistics") + Accessible.description: qsTr("Radio button to allow opt-out for anonymous usage statistics") + + background: Rectangle { + color: "transparent" + } + + indicator: Rectangle { + implicitWidth: 26 + implicitHeight: 26 + x: optInStatisticsRadioNo.leftPadding + y: parent.height / 2 - height / 2 + radius: 13 + border.color: theme.dialogBorder + color: "transparent" + + Rectangle { + width: 14 + height: 14 + x: 6 + y: 6 + radius: 7 + color: theme.textColor + visible: optInStatisticsRadioNo.checked + } + } + + contentItem: Text { + text: optInStatisticsRadioNo.text + font: optInStatisticsRadioNo.font + opacity: enabled ? 
1.0 : 0.3 + color: theme.textColor + verticalAlignment: Text.AlignVCenter + leftPadding: optInStatisticsRadioNo.indicator.width + optInStatisticsRadioNo.spacing + } + } + } + + Label { + id: optInNetwork + text: "Opt-in to anonymous sharing of chats to the GPT4All Datalake" + Layout.row: 1 + Layout.column: 0 + color: theme.textColor + Accessible.role: Accessible.Paragraph + Accessible.name: qsTr("Opt-in for network") + Accessible.description: qsTr("Checkbox to allow opt-in for network") + } + + ButtonGroup { + buttons: optInNetworkRadio.children + onClicked: { + Network.isActive = optInNetworkRadio.checked + if (optInNetworkRadio.choiceMade && optInStatisticsRadio.choiceMade) + startupDialog.close(); + } + } + + RowLayout { + id: optInNetworkRadio + Layout.alignment: Qt.AlignVCenter + Layout.row: 1 + Layout.column: 1 + property bool defaultChecked: Network.isActive + property alias checked: optInNetworkRadioYes.checked + property bool choiceMade: optInNetworkRadioYes.checked || optInNetworkRadioNo.checked + + RadioButton { + id: optInNetworkRadioYes + checked: optInNetworkRadio.defaultChecked + text: qsTr("Yes") + Accessible.role: Accessible.RadioButton + Accessible.name: qsTr("Opt-in for network") + Accessible.description: qsTr("Radio button to allow opt-in anonymous sharing of chats to the GPT4All Datalake") + + background: Rectangle { + color: "transparent" + } + + indicator: Rectangle { + implicitWidth: 26 + implicitHeight: 26 + x: optInNetworkRadioYes.leftPadding + y: parent.height / 2 - height / 2 + radius: 13 + border.color: theme.dialogBorder + color: "transparent" + + Rectangle { + width: 14 + height: 14 + x: 6 + y: 6 + radius: 7 + color: theme.textColor + visible: optInNetworkRadioYes.checked + } + } + + contentItem: Text { + text: optInNetworkRadioYes.text + font: optInNetworkRadioYes.font + opacity: enabled ? 
1.0 : 0.3 + color: theme.textColor + verticalAlignment: Text.AlignVCenter + leftPadding: optInNetworkRadioYes.indicator.width + optInNetworkRadioYes.spacing + } + } + RadioButton { + id: optInNetworkRadioNo + text: qsTr("No") + Accessible.role: Accessible.RadioButton + Accessible.name: qsTr("Opt-out for network") + Accessible.description: qsTr("Radio button to allow opt-out anonymous sharing of chats to the GPT4All Datalake") + + background: Rectangle { + color: "transparent" + } + + indicator: Rectangle { + implicitWidth: 26 + implicitHeight: 26 + x: optInNetworkRadioNo.leftPadding + y: parent.height / 2 - height / 2 + radius: 13 + border.color: theme.dialogBorder + color: "transparent" + + Rectangle { + width: 14 + height: 14 + x: 6 + y: 6 + radius: 7 + color: theme.textColor + visible: optInNetworkRadioNo.checked + } + } + + contentItem: Text { + text: optInNetworkRadioNo.text + font: optInNetworkRadioNo.font + opacity: enabled ? 1.0 : 0.3 + color: theme.textColor + verticalAlignment: Text.AlignVCenter + leftPadding: optInNetworkRadioNo.indicator.width + optInNetworkRadioNo.spacing + } + } + } + } + } + + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } +} diff --git a/gpt4all-chat/qml/Theme.qml b/gpt4all-chat/qml/Theme.qml new file mode 100644 index 00000000..6417550d --- /dev/null +++ b/gpt4all-chat/qml/Theme.qml @@ -0,0 +1,20 @@ +import QtCore +import QtQuick +import QtQuick.Controls.Basic + +QtObject { + property color textColor: "#d1d5db" + property color textErrorColor: "red" + property color backgroundDarkest: "#202123" + property color backgroundDark: "#242528" + property color backgroundLight: "#343541" + property color backgroundLighter: "#444654" + property color backgroundLightest: "#7d7d8e" + property color dialogBorder: "#d1d5db" + property color userColor: "#ec86bf" + property color assistantColor: "#10a37f" + property color linkColor: "white" + 
property color tabBorder: "#aaa" + property real fontSizeLarge: Qt.application.font.pixelSize + property real fontSizeLarger: Qt.application.font.pixelSize + 2 +} diff --git a/gpt4all-chat/qml/ThumbsDownDialog.qml b/gpt4all-chat/qml/ThumbsDownDialog.qml new file mode 100644 index 00000000..8cb1d115 --- /dev/null +++ b/gpt4all-chat/qml/ThumbsDownDialog.qml @@ -0,0 +1,112 @@ +import QtCore +import QtQuick +import QtQuick.Controls +import QtQuick.Controls.Basic +import QtQuick.Layouts +import download +import network +import llm + +Dialog { + id: thumbsDownDialog + modal: true + opacity: 0.9 + padding: 20 + + Theme { + id: theme + } + + property alias response: thumbsDownNewResponse.text + + Column { + anchors.fill: parent + spacing: 20 + Item { + width: childrenRect.width + height: childrenRect.height + Image { + id: img + anchors.top: parent.top + anchors.left: parent.left + width: 60 + height: 60 + source: "qrc:/gpt4all/icons/thumbs_down.svg" + } + Text { + anchors.left: img.right + anchors.leftMargin: 30 + anchors.verticalCenter: img.verticalCenter + text: qsTr("Please edit the text below to provide a better response. 
(optional)") + color: theme.textColor + } + } + + ScrollView { + clip: true + height: 300 + width: parent.width + ScrollBar.vertical.policy: ScrollBar.AlwaysOn + ScrollBar.horizontal.policy: ScrollBar.AlwaysOff + + TextArea { + id: thumbsDownNewResponse + color: theme.textColor + padding: 20 + wrapMode: Text.Wrap + font.pixelSize: theme.fontSizeLarge + placeholderText: qsTr("Please provide a better response...") + placeholderTextColor: theme.backgroundLightest + background: Rectangle { + color: theme.backgroundLighter + radius: 10 + } + } + } + } + + background: Rectangle { + anchors.fill: parent + color: theme.backgroundDarkest + border.width: 1 + border.color: theme.dialogBorder + radius: 10 + } + + footer: DialogButtonBox { + padding: 20 + alignment: Qt.AlignRight + spacing: 10 + Button { + contentItem: Text { + color: theme.textColor + text: qsTr("Submit") + } + background: Rectangle { + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + padding: 15 + DialogButtonBox.buttonRole: DialogButtonBox.AcceptRole + } + Button { + contentItem: Text { + color: theme.textColor + text: qsTr("Cancel") + } + background: Rectangle { + border.color: theme.backgroundLightest + border.width: 1 + radius: 10 + color: theme.backgroundLight + } + padding: 15 + DialogButtonBox.buttonRole: DialogButtonBox.RejectRole + } + background: Rectangle { + color: "transparent" + } + } +} \ No newline at end of file diff --git a/gpt4all-chat/sysinfo.h b/gpt4all-chat/sysinfo.h new file mode 100644 index 00000000..4a02826f --- /dev/null +++ b/gpt4all-chat/sysinfo.h @@ -0,0 +1,48 @@ +#include +#include +#include +#include +#include + +#if defined(Q_OS_MAC) +#include +#include +#endif + +#if defined(Q_OS_WIN) +#include +#endif + +QString getSystemTotalRAM() +{ + qint64 totalRAM = 0; + +#if defined(Q_OS_LINUX) + QFile file("/proc/meminfo"); + if (file.open(QIODevice::ReadOnly | QIODevice::Text)) { + QTextStream in(&file); + QString line = 
in.readLine();
+        while (!line.isNull()) {
+            if (line.startsWith("MemTotal")) {
+                QStringList parts = line.split(QRegularExpression("\\s+"));
+                totalRAM = parts[1].toLongLong() * 1024; // Convert from KB to bytes
+                break;
+            }
+            line = in.readLine();
+        }
+        file.close();
+    }
+#elif defined(Q_OS_MAC)
+    int mib[2] = {CTL_HW, HW_MEMSIZE};
+    size_t length = sizeof(totalRAM);
+    sysctl(mib, 2, &totalRAM, &length, NULL, 0);
+#elif defined(Q_OS_WIN)
+    MEMORYSTATUSEX memoryStatus;
+    memoryStatus.dwLength = sizeof(memoryStatus);
+    GlobalMemoryStatusEx(&memoryStatus);
+    totalRAM = memoryStatus.ullTotalPhys;
+#endif
+
+    double totalRAM_GB = static_cast<double>(totalRAM) / (1024 * 1024 * 1024);
+    return QString::number(totalRAM_GB, 'f', 2) + " GB";
+}
diff --git a/gpt4all-chat/test_hw.cpp b/gpt4all-chat/test_hw.cpp
new file mode 100644
index 00000000..eef10129
--- /dev/null
+++ b/gpt4all-chat/test_hw.cpp
@@ -0,0 +1,29 @@
+#include <string>
+#include <cstdio>
+
+int main(int argc, char *argv[])
+{
+    static bool avx = __builtin_cpu_supports("avx");
+    static bool avx2 = __builtin_cpu_supports("avx2");
+    static bool fma = __builtin_cpu_supports("fma");
+    static bool sse3 = __builtin_cpu_supports("sse3");
+    static std::string s;
+    s = "gpt4all hardware test results:\n";
+    s += " AVX = " + std::to_string(avx) + "\n";
+    s += " AVX2 = " + std::to_string(avx2) + "\n";
+    s += " FMA = " + std::to_string(fma) + "\n";
+    s += " SSE3 = " + std::to_string(sse3) + "\n";
+    fprintf(stderr, "%s", s.c_str());
+    fprintf(stderr, "your hardware supports the \"");
+    fflush(stderr);
+    if (avx2)
+        printf("full");
+    else if (avx && fma)
+        printf("avx_only");
+    else
+        printf("bare_minimum");
+    fflush(stdout);
+    fprintf(stderr, "\" version of gpt4all.\n");
+    fflush(stderr);
+    return 0;
+}