From 93659f3eb417388d5e6cb946f4fbf46be7d85056 Mon Sep 17 00:00:00 2001
From: Victor Hall <victor.charles.hall@gmail.com>
Date: Sun, 24 Mar 2024 09:30:23 -0400
Subject: [PATCH] caption cog notebook

---
 CaptionCog.ipynb | 47 +++++++++++++++++++++++++++++++++++++----------
 1 file changed, 37 insertions(+), 10 deletions(-)

diff --git a/CaptionCog.ipynb b/CaptionCog.ipynb
index ef36d48..29c9e01 100644
--- a/CaptionCog.ipynb
+++ b/CaptionCog.ipynb
@@ -23,10 +23,14 @@
    "outputs": [],
    "source": [
     "# install dependencies\n",
-    "!pip install huggingface-hub\n",
-    "!pip install transformers\n",
-    "!pip install pynvml\n",
-    "!pip install colorama"
+    "!pip install huggingface-hub -q\n",
+    "!pip install transformers -q\n",
+    "!pip install pynvml -q\n",
+    "!pip install colorama -q\n",
+    "!pip install peft -q\n",
+    "!pip install bitsandbytes -q\n",
+    "!pip install einops -q\n",
+    "!pip install xformers -q"
    ]
   },
   {
@@ -38,7 +42,8 @@
     "# Colab only setup (do NOT run for docker/runpod/vast)\n",
     "!git clone https://github.com/victorchall/EveryDream2trainer\n",
     "%cd EveryDream2trainer\n",
-    "%mkdir -p /content/EveryDream2trainer/input"
+    "%mkdir -p /content/EveryDream2trainer/input\n",
+    "%cd /content/EveryDream2trainer"
    ]
   },
   {
@@ -71,6 +76,17 @@
     "            tar_ref.extractall(input_folder)"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "## Connect Google Drive (optional; will pop up a warning)\n",
+    "from google.colab import drive\n",
+    "drive.mount('/content/drive')"
+   ]
+  },
   {
    "attachments": {},
    "cell_type": "markdown",
@@ -78,9 +94,8 @@
    "source": [
     "## Run captions.\n",
     "\n",
-    "Place your images in \"input\" folder, or you can change the data_root to point to a Gdrive folder.\n",
-    "\n",
-    "Run either the 24GB or 16GB model or adjust settings on your own."
+    "Place your images in the \"input\" folder, or change the `--image_dir` argument to point to a Google Drive folder.\n",
+    "\n"
    ]
   },
   {
@@ -92,7 +107,7 @@
     "# 16GB GPU, must not use more than 1 beam\n",
     "# 24GB GPU, can use 3 beams\n",
     "%cd /content/EveryDream2trainer\n",
-    "%run caption_cog.py --image_dir \"input\" --num_beams 1 --prompt \"Write a description.\""
+    "%run caption_cog.py --image_dir \"input\" --num_beams 1 --prompt \"Write a description.\" --no_overwrite"
    ]
   },
   {
@@ -103,8 +118,20 @@
    "source": [
     "# This is a fancier version of above with more options set\n",
     "%cd /content/EveryDream2trainer\n",
-    "%run caption_cog.py --image_dir \"input\" --num_beams 1 --prompt \"Write a description.\" --starts_with \"An image of\" --remove_starts_with --temp 0.9 --top_p 0.9 --top_k 40 --bad_words \"depicts,showcases,appears,suggests\""
+    "%run caption_cog.py --image_dir \"input\" --num_beams 1 \\\n",
+    "    --prompt \"Write a description.\" \\\n",
+    "    --starts_with \"An image of\" --remove_starts_with \\\n",
+    "    --temp 0.9 --top_p 0.9 --top_k 40 \\\n",
+    "    --bad_words \"depicts,showcases,appears,suggests\" \\\n",
+    "    --no_overwrite "
    ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
   }
  ],
  "metadata": {