From 67507105d01e5b971696d2ce7c124ecd5013282c Mon Sep 17 00:00:00 2001 From: DocShotgun <126566557+DocShotgun@users.noreply.github.com> Date: Mon, 4 Dec 2023 22:20:46 -0800 Subject: [PATCH] Update colab, expose additional args * Exposed draft model args for speculative decoding * Exposed int8 cache, dummy models, and no flash attention * Resolved CUDA 11.8 dependency issue --- TabbyAPI_Colab_Example.ipynb | 68 ++++++++++++++++++++++-------------- requirements-colab.txt | 10 ++++++ 2 files changed, 52 insertions(+), 26 deletions(-) create mode 100644 requirements-colab.txt diff --git a/TabbyAPI_Colab_Example.ipynb b/TabbyAPI_Colab_Example.ipynb index c584b84..9ad687b 100644 --- a/TabbyAPI_Colab_Example.ipynb +++ b/TabbyAPI_Colab_Example.ipynb @@ -16,11 +16,19 @@ "accelerator": "GPU" }, "cells": [ + { + "cell_type": "markdown", + "source": [ + "# **TabbyAPI Colab**" + ], + "metadata": { + "id": "NcgQp3r7BS-q" + } + }, { "cell_type": "code", "source": [ - "#CELL 1\n", - "#@title Keep this widget playing to prevent Colab from disconnecting you { display-mode: \"form\" }\n", + "#@title # Keep this widget playing to prevent Colab from disconnecting you { display-mode: \"form\" }\n", "#@markdown Press play on the audio player that will appear below:\n", "%%html\n", "