From 9251043aec56167901b7ac4a9b3ecb0e7235c135 Mon Sep 17 00:00:00 2001
From: Dominik Polakovics
Date: Mon, 30 Dec 2024 00:42:51 +0100
Subject: [PATCH] feat: replace chunking with a multi-step process when the
 token count is too high

---
 lua/chatgpt_nvim/config.lua |  3 ++
 lua/chatgpt_nvim/init.lua   | 85 ++++++++++++++-----------------
 lua/chatgpt_nvim/ui.lua     | 31 +++-----------
 3 files changed, 40 insertions(+), 79 deletions(-)

diff --git a/lua/chatgpt_nvim/config.lua b/lua/chatgpt_nvim/config.lua
index 114665f..33d6365 100644
--- a/lua/chatgpt_nvim/config.lua
+++ b/lua/chatgpt_nvim/config.lua
@@ -37,6 +37,9 @@ local prompt_blocks = {
     and a top-level key named 'files', which is a list of file changes. Each element in 'files' must be a mapping with:
     - 'path' for the file path relative to the project’s root directory.
     - either 'content' with a multiline string for new content, or 'delete: true' if the file should be deleted.
+    Important: don't use comments in the code to explain which steps you have taken.
+    Comments should explain the code itself, not your thought process.
+    You may explain your thought process outside of the YAML.
     If more context is needed at any point before providing the final YAML, request it outside of the YAML.
     Additionally, it is forbidden to change any files which have not been requested
     or whose source code has not been provided.
diff --git a/lua/chatgpt_nvim/init.lua b/lua/chatgpt_nvim/init.lua
index 7a84faa..da59d25 100644
--- a/lua/chatgpt_nvim/init.lua
+++ b/lua/chatgpt_nvim/init.lua
@@ -77,18 +77,25 @@ local function get_estimate_fn()
     end
 end
 
------------------------------------------------------------------------------
--- CHUNKING
------------------------------------------------------------------------------
-local function handle_chunking_if_needed(prompt, estimate_fn)
+---------------------------------------------------------------------------------
+-- Step-by-Step Handling (replaces chunking)
+---------------------------------------------------------------------------------
+local function handle_step_by_step_if_needed(prompt, estimate_fn)
     local conf = config.load()
     local token_count = estimate_fn(prompt)
 
-    if not conf.enable_chunking or token_count <= (conf.token_limit or 8000) then
+    -- If step-by-step is disabled or the token count is within the limit, return the prompt unchanged
+    if not conf.enable_step_by_step or token_count <= (conf.token_limit or 8000) then
         return { prompt }
     end
 
-    local chunks = ui.chunkify(prompt, estimate_fn, conf.token_limit or 8000)
-    return chunks
+    -- Over the limit: return a single notice asking the user to split the work into steps
+    local step_prompt = [[
+        It appears this request might exceed the model's token limit if done all at once.
+        Please break the tasks down into smaller steps and handle them one by one.
+        At each step, we'll provide the relevant files or context as needed.
+        Thank you!
+    ]]
+    return { step_prompt }
 end
 
 -- Close an existing buffer by name (if it exists)
@@ -339,33 +346,16 @@ function M.run_chatgpt_command()
     store_prompt_for_reference(prompt)
 
     local estimate_fn = get_estimate_fn()
-    local chunks = handle_chunking_if_needed(prompt, estimate_fn)
+    local chunks = handle_step_by_step_if_needed(prompt, estimate_fn)
+    -- We get back either the original prompt or a single step-by-step notice
+    copy_to_clipboard(chunks[1])
 
-    if #chunks == 1 then
-        copy_to_clipboard(chunks[1])
+    if chunks[1] == prompt then
         vim.api.nvim_out_write("Prompt copied to clipboard! Paste into ChatGPT.\n")
     else
-        -- Multiple chunks. We'll create separate scratch buffers
-        for i, chunk in ipairs(chunks) do
-            close_existing_buffer_by_name("ChatGPT_Generated_Chunk_" .. i .. "$")
-
-            local cbuf = vim.api.nvim_create_buf(false, true)
-            vim.api.nvim_buf_set_name(cbuf, "ChatGPT_Generated_Chunk_" .. i)
-            vim.api.nvim_buf_set_option(cbuf, "filetype", "markdown")
-
-            local lines = {
-                "# Chunk " .. i .. " of " .. #chunks .. ":",
-                "# Copy/paste this chunk into ChatGPT, then come back and copy the next chunk as needed.",
-                ""
-            }
-            vim.list_extend(lines, vim.split(chunk, "\n"))
-            vim.api.nvim_buf_set_lines(cbuf, 0, -1, false, lines)
-
-            if i == 1 then
-                copy_to_clipboard(chunk)
-                vim.api.nvim_out_write("Copied chunk #1 of " .. #chunks .. " to clipboard!\n")
-            end
-        end
+        -- The helper returned the step-by-step notice instead of the prompt;
+        -- no extra scratch buffers are created in this revised approach.
+        vim.api.nvim_out_write("Step-by-step prompt copied to clipboard!\n")
     end
 
     vim.api.nvim_buf_set_option(bufnr, "modified", false)
@@ -498,28 +488,17 @@ function M.run_chatgpt_paste_command()
         local token_count = estimate_fn(prompt)
         ui.debug_log("Returning requested files. Token count: " .. token_count)
 
-        if token_count > (conf.token_limit or 8000) then
-            if conf.enable_chunking then
-                local chunks = ui.chunkify(prompt, estimate_fn, conf.token_limit or 8000)
-                for i, chunk in ipairs(chunks) do
-                    local cbuf = vim.api.nvim_create_buf(false, true)
-                    vim.api.nvim_buf_set_name(cbuf, "ChatGPT_Requested_Files_Chunk_" .. i)
-                    local lines = {
-                        "# Chunk " .. i .. " of " .. #chunks .. ":",
-                        "# Copy/paste this chunk into ChatGPT, then come back and copy next chunk as needed.",
-                        ""
-                    }
-                    vim.list_extend(lines, vim.split(chunk, "\n"))
-                    vim.api.nvim_buf_set_lines(cbuf, 0, -1, false, lines)
-
-                    if i == 1 then
-                        copy_to_clipboard(chunk)
-                        print("Copied chunk #1 of " .. #chunks .. " to clipboard!")
-                    end
-                end
-            else
-                vim.api.nvim_err_writeln("Too many requested files. Exceeds token limit.")
-            end
+        -- Over the limit: either hand back a step-by-step note or report the overflow
+        if token_count > (conf.token_limit or 8000) and conf.enable_step_by_step then
+            local step_message = [[
+                It appears the requested data is quite large. Please consider handling these files step by step.
+                Let me know how you would like to proceed.
+            ]]
+            copy_to_clipboard(step_message)
+            print("Step-by-step guidance copied to clipboard!")
+            return
+        elseif token_count > (conf.token_limit or 8000) then
+            vim.api.nvim_err_writeln("Requested files exceed the token limit, and step-by-step handling is disabled.")
             return
         end
 
@@ -531,4 +510,4 @@
     end
 end
 
-return M
\ No newline at end of file
+return M
diff --git a/lua/chatgpt_nvim/ui.lua b/lua/chatgpt_nvim/ui.lua
index 959aada..cca92d1 100644
--- a/lua/chatgpt_nvim/ui.lua
+++ b/lua/chatgpt_nvim/ui.lua
@@ -19,8 +19,7 @@ end
 
 function M.debug_log(msg)
     if conf.improved_debug and debug_bufnr then
-        local lines = vim.split(msg, "\n")
-        vim.api.nvim_buf_set_lines(debug_bufnr, -1, -1, false, lines)
+        vim.api.nvim_buf_set_lines(debug_bufnr, -1, -1, false, vim.split(msg, "\n"))
     else
         if conf.debug then
            vim.api.nvim_out_write("[chatgpt_nvim:debug] " .. msg .. "\n")
"\n") @@ -89,28 +88,8 @@ function M.pick_directories(dirs) return selected_dirs end -function M.chunkify(text, estimate_tokens_fn, token_limit) - local lines = vim.split(text, "\n") - local chunks = {} - local current_chunk = {} - local current_text = "" +-------------------------------------------------------------------------------- +-- The old chunkify method has been removed, since we now rely on step-by-step +-------------------------------------------------------------------------------- - for _, line in ipairs(lines) do - local test_text = (current_text == "") and line or (current_text .. "\n" .. line) - local est_tokens = estimate_tokens_fn(test_text) - if est_tokens > token_limit then - table.insert(chunks, current_text) - current_text = line - else - current_text = test_text - end - end - - if current_text ~= "" then - table.insert(chunks, current_text) - end - - return chunks -end - -return M +return M \ No newline at end of file