codebuff/backend/src/tools.ts at bfd29c08ccc6168c12fc6404f0810d95c6c5bc6b · CodebuffAI/codebuff · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
import { spawn } from 'child_process'
import fs from 'fs'
import path from 'path'

import { FileChange } from 'common/actions'
import { models, TEST_USER_ID } from 'common/constants'
import {
  getToolCallString,
  ToolName as GlobalToolNameImport,
} from 'common/src/constants/tools'
import { z } from 'zod'

import { buildArray } from 'common/util/array'
import { promptFlashWithFallbacks } from './llm-apis/gemini-with-fallbacks'
import { gitCommitGuidePrompt } from './system-prompt/prompts'

// Define Zod schemas for parameter validation
const toolConfigsList = [
  // Tool config: add_subgoal.
  // Parameters: required non-empty `id` and `objective`, a required `status`
  // enum, and optional free-text `plan` / `log`.
  // NOTE(review): the status enum here ends in 'ABORTED', while the
  // update_subgoal config in this same list ends in 'FAILED' — confirm which
  // terminal status is intended and whether the two should agree.
  {
    name: 'add_subgoal',
    schema: z
      .object({
        id: z
          .string()
          .min(1, 'Id cannot be empty')
          .describe(
            `A unique identifier for the subgoal. Try to choose the next sequential integer that is not already in use.`
          ),
        objective: z
          .string()
          .min(1, 'Objective cannot be empty')
          .describe(
            `The objective of the subgoal, concisely and clearly stated.`
          ),
        status: z
          .enum(['NOT_STARTED', 'IN_PROGRESS', 'COMPLETE', 'ABORTED'])
          .describe(
            `The status of the subgoal. One of ["NOT_STARTED", "IN_PROGRESS", "COMPLETE", "ABORTED"]`
          ),
        plan: z.string().optional().describe('A plan for the subgoal.'),
        log: z
          .string()
          .optional()
          .describe('A log message for the subgoal progress.'),
      })
      .describe(
        `Add a new subgoal for tracking progress. To be used for complex requests that can't be solved in a single step, as you may forget what happened!`
      ),

    // Extra prompt text appended after the generated parameter list.
    additionalInfo: `
Example:
${getToolCallString('add_subgoal', {
  id: '1',
  objective: 'Add a new "deploy api" subgoal',
  status: 'IN_PROGRESS',
})}
`.trim(),
  },
  // Tool config: update_subgoal.
  // Parameters: required non-empty `id`; `status`, `plan` and `log` are all
  // optional so any combination can be sent in one call.
  // NOTE(review): the status enum here ends in 'FAILED', while the add_subgoal
  // config in this same list ends in 'ABORTED' — confirm which terminal status
  // is intended and whether the two should agree.
  {
    name: 'update_subgoal',
    schema: z
      .object({
        id: z
          .string()
          .min(1, 'Id cannot be empty')
          .describe(`The id of the subgoal to update.`),
        status: z
          .enum(['NOT_STARTED', 'IN_PROGRESS', 'COMPLETE', 'FAILED'])
          .optional()
          .describe(
            `Change the status of the subgoal. One of ["NOT_STARTED", "IN_PROGRESS", "COMPLETE", "FAILED"]`
          ),
        plan: z
          .string()
          .optional()
          .describe(`Change the plan for the subgoal.`),
        log: z
          .string()
          .optional()
          .describe(
            `Add a log message to the subgoal. This will create a new log entry and append it to the existing logs. Use this to record your progress and any new information you learned as you go.`
          ),
      })
      .describe(
        `Update a subgoal in the context given the id, and optionally the status or plan, or a new log to append. Feel free to update any combination of the status, plan, or log in one invocation.`
      ),
    // Extra prompt text: one worked example per kind of update.
    additionalInfo: `
Examples:

Usage 1 (update status):
${getToolCallString('update_subgoal', {
  id: '1',
  status: 'COMPLETE',
})}

Usage 2 (update plan):
${getToolCallString('update_subgoal', {
  id: '3',
  plan: 'Create file for endpoint in the api. Register it in the router.',
})}

Usage 3 (add log):
${getToolCallString('update_subgoal', {
  id: '1',
  log: 'Found the error in the tests. Culprit: foo function.',
})}

Usage 4 (update status and add log):
${getToolCallString('update_subgoal', {
  id: '1',
  status: 'COMPLETE',
  log: 'Reran the tests (passed)',
})}
    `.trim(),
  },
  // Tool config: write_file.
  // Parameters: required non-empty `path` and a required `content` string
  // (may be empty) holding the edit snippet. The long `additionalInfo` text is
  // prompt material describing the edit-snippet format expected from the model.
  {
    name: 'write_file',
    schema: z
      .object({
        path: z
          .string()
          .min(1, 'Path cannot be empty')
          .describe(`Path to the file relative to the **project root**`),
        content: z.string().describe(`Edit snippet to apply to the file.`),
      })
      .describe(`Create or edit a file with the given content.`),
    additionalInfo: `
#### **IMPORTANT** Edit Snippet

Format the \`content\` parameter as an edit snippet that describes how you would like to modify the provided existing code.

Edit snippets will be parsed by a less intelligent "fast-apply" model, so you MUST follow this format, otherwise the finetuned smaller model will not understand what to change. For example, do not include detailed instructions on how to apply code changes for the fast-apply model.

Abbreviate any sections of the code in your response that will remain the same with placeholder comments: "// ... existing code ...". Be descriptive in the comment. You MUST use these in order to **MINIMIZE** the number of characters in the \`content\` parameter.

Make sure that you are abbreviating exactly where you believe the existing code will remain the same.
Indicate the location and nature of the modifications (additions and deletions) with comments and ellipses.

Make sure that you preserve the indentation and code structure of exactly how you believe the final code will look like (do not output lines that will not be in the final code after they are merged).

**CRITICAL FOR DELETIONS** If you plan on deleting a section, you MUST provide a comment giving the relevant context such that the code is understood to be removed. This is REQUIRED for the fast-apply model to understand what to delete.

Examples:

If the initial code is:
\`\`\`Some code
Block 1
Block 2
Block 3
More code
\`\`\`
And if you want to delete code block 2, you MUST include a comment like:
\`\`\`// existing code
Block 1
// Delete Block 2
Block 3
// rest of code
\`\`\`

**YOU MUST ALWAYS INCLUDE DELETION COMMENTS** when removing code blocks, functions, variables, or any other code elements. The fast-apply model cannot understand deletions without these explicit comments. This applies to every type of file: source files, config files, markdown files, css files, json files, etc, etc.

#### Additional Info

Prefer using this tool to str_replace.

Do not use this tool to delete or rename a file. Instead run a terminal command for that.

Notes for editing a file:
- If you don't use any placeholder comments, the entire file will be replaced. E.g. don't write out a single function without using placeholder comments unless you want to replace the entire file with that function.
- When editing a file, try not to change any user code that doesn't need to be changed. In particular, you must preserve pre-existing user comments exactly as they are.
- You can also use this tool to create new files.
- After you have written out a write_file block, the changes will be applied immediately. You can assume that the changes went through as intended. However, note that there are sometimes mistakes in the process of applying the edits you described in the write_file block, e.g. sometimes large portions of the file are deleted. If you notice that the changes did not go through as intended, based on further updates to the file, you can write out a new write_file block to fix the mistake.

Examples:
${getToolCallString('write_file', {
  path: 'path/to/file',
  content: 'Your file content here',
})}

Example 1 - Simple file creation:
${getToolCallString('write_file', {
  path: 'new-file.ts',
  content: 'console.log("Hello, world!");',
})}

Example 2 - Editing with placeholder comments:
${getToolCallString('write_file', {
  path: 'foo.ts',
  content: `// no change to imports

function foo() {
  console.log('foo');
  for (let i = 0; i < 10; i++) {
    console.log(i);
  }
  doSomething();
}

// rest of code`,
})}

    `.trim(),
  },
  // Tool config: str_replace.
  // Parameters: required non-empty `path` plus two string arrays, `old_vals`
  // and `new_vals`; the `.refine()` rejects calls where the arrays differ in
  // length. The prompt text and example address the array items as
  // old_0/new_0, old_1/new_1, ... rather than by the array names.
  {
    name: 'str_replace',
    schema: z
      .object({
        path: z
          .string()
          .min(1, 'Path cannot be empty')
          .describe(`The path to the file to edit.`),
        old_vals: z
          .array(z.string())
          .describe(
            `The strings to replace. This must be an *exact match* of the string you want to replace, including whitespace and punctuation.`
          ),
        new_vals: z
          .array(z.string())
          .describe(
            `The strings to replace the corresponding old string with. Can be empty to delete.`
          ),
      })
      .refine((data) => data.old_vals.length === data.new_vals.length, {
        message: 'old_vals and new_vals must have the same number of elements.',
      })
      .describe(`Replace strings in a file with new strings.`),
    additionalInfo: `
This should only be used as a backup to the write_file tool, if the write_file tool fails to apply the changes you intended. You should also use this tool to make precise edits for very large files (>2000 lines).

If you are making multiple edits in a row to a single file with this tool, use only one <str_replace> call (without closing the tool) with old_0, new_0, old_1, new_1, old_2, new_2, etc. instead of calling str_replace multiple times on the same file.

Example:
${getToolCallString('str_replace', {
  path: 'path/to/file',
  old_0: 'old',
  new_0: 'new',
  old_1: 'to_delete',
  new_1: '',
})}
    `.trim(),
  },
  // Tool config: read_files.
  // Parameters: a single required non-empty `paths` string; per its
  // description it carries newline-separated, project-root-relative paths.
  {
    name: 'read_files',
    schema: z
      .object({
        paths: z
          .string()
          .min(1, 'Paths cannot be empty')
          .describe(
            `List of file paths to read relative to the **project root**, separated by newlines. Absolute file paths will not work.`
          ),
      })
      .describe(
        `Read multiple files from disk and return their contents. Use this tool to read as many files as would be helpful to answer the user's request.`
      ),
    additionalInfo: `
Note: DO NOT call this tool for files you've already read! There's no need to read them again — any changes to the files will be surfaced to you as a file update tool result.

Example:
${getToolCallString('read_files', {
  paths: 'path/to/file1.ts\npath/to/file2.ts',
})}
    `.trim(),
  },
  // Tool config: find_files.
  // Parameters: a single required non-empty natural-language `description`.
  // The prompt text below steers the model toward read_files whenever the
  // path is already known.
  {
    name: 'find_files',
    schema: z
      .object({
        description: z
          .string()
          .min(1, 'Description cannot be empty')
          .describe(
            `A brief natural language description of the files or the name of a function or class you are looking for. It's also helpful to mention a directory or two to look within.`
          ),
      })
      .describe(
        `Find several files related to a brief natural language description of the files or the name of a function or class you are looking for.`
      ),
    additionalInfo: `
Example:
${getToolCallString('find_files', {
  description: 'The implementation of function foo',
})}

Purpose: Better fulfill the user request by reading files which could contain information relevant to the user's request.
Use cases:
- If you are calling a function or creating a class and want to know how it works, use this tool to get the implementation.
- If you need to understand a section of the codebase, read more files in that directory or subdirectories.
- Some requests require a broad understanding of multiple parts of the codebase. Consider using find_files to gain more context before making changes.

Don't use this tool if:
- You already know the exact path of the file(s) you are looking for — in this case, use read_files.
- You already read the files you need in context.
- You know the name of the file you need. Instead use run_terminal_command with \`find -name\` (or \`dir /s /b\` or \`Get-ChildItem -Recurse -Filter\`)

This tool is not guaranteed to find the correct file. In general, prefer using read_files instead of find_files.
      `.trim(),
  },
  // Tool config: code_search.
  // Parameters: a single required non-empty `pattern` string. The prompt text
  // describes the search as ripgrep-backed and regex-capable.
  {
    name: 'code_search',
    schema: z
      .object({
        pattern: z
          .string()
          .min(1, 'Pattern cannot be empty')
          .describe(`The pattern to search for.`),
      })
      .describe(
        `Search for string patterns in the project's files. This tool uses ripgrep (rg), a fast line-oriented search tool. Use this tool only when read_files is not sufficient to find the files you need.`
      ),

    // `\\b` below is double-escaped so the rendered prompt shows a literal `\b`.
    additionalInfo: `
Purpose: Search through code files to find files with specific text patterns, function names, variable names, and more.

Prefer to use read_files instead of code_search unless you need to search for a specific pattern in multiple files.

Use cases:
1. Finding all references to a function, class, or variable name across the codebase
2. Searching for specific code patterns or implementations
3. Looking up where certain strings or text appear
4. Finding files that contain specific imports or dependencies
5. Locating configuration settings or environment variables

The pattern supports regular expressions and will search recursively through all files in the project by default. Some tips:
- Be as constraining in the pattern as possible to limit the number of files returned, e.g. if searching for the definition of a function, use "(function foo|const foo)" or "def foo" instead of merely "foo".
- Use word boundaries (\\b) to match whole words only
- Searches file content and filenames
- Automatically ignores binary files, hidden files, and files in .gitignore
- Case-sensitive by default. Use -i to make it case insensitive.
- Constrain the search to specific file types using -t <file-type>, e.g. -t ts or -t py.

Note: Do not use the end_turn tool after this tool! You will want to see the output of this tool before ending your turn.

Examples:
${getToolCallString('code_search', { pattern: 'foo' })}
${getToolCallString('code_search', { pattern: 'import.*foo' })}
    `.trim(),
  },
  // Tool config: run_terminal_command.
  // Parameters: required `command` string (deliberately allowed to be empty),
  // `process_type` enum defaulting to 'SYNC', optional `cwd`, and
  // `timeout_seconds` kept as a string defaulting to '30'.
  // The prompt text embeds `gitCommitGuidePrompt` imported from
  // ./system-prompt/prompts.
  {
    name: 'run_terminal_command',
    schema: z
      .object({
        // Can be empty to use it for a timeout.
        command: z.string().describe(`CLI command valid for user's OS.`),
        process_type: z
          .enum(['SYNC', 'BACKGROUND'])
          .default('SYNC')
          .describe(
            `Either SYNC (waits, returns output) or BACKGROUND (runs in background). Default SYNC`
          ),
        cwd: z
          .string()
          .optional()
          .describe(
            `The working directory to run the command in. Default is the project root.`
          ),
        timeout_seconds: z
          .string()
          .default('30')
          .describe(
            `Set to -1 for no timeout. Does not apply for BACKGROUND commands. Default 30`
          ),
      })
      .describe(
        `Execute a CLI command from the **project root** (different from the user's cwd).`
      ),
    additionalInfo: `
Stick to these use cases:
1. Compiling the project or running build (e.g., "npm run build"). Reading the output can help you edit code to fix build errors. If possible, use an option that performs checks but doesn't emit files, e.g. \`tsc --noEmit\`.
2. Running tests (e.g., "npm test"). Reading the output can help you edit code to fix failing tests. Or, you could write new unit tests and then run them.
3. Moving, renaming, or deleting files and directories. These actions can be vital for refactoring requests. Use commands like \`mv\`/\`move\` or \`rm\`/\`del\`.

Most likely, you should ask for permission for any other type of command you want to run. If asking for permission, show the user the command you want to run using \`\`\` tags and *do not* use the tool call format, e.g.:
\`\`\`bash
git branch -D foo
\`\`\`

When using this tool, please adhere to the following rules:

1. Do not run commands that can modify files outside of the project directory, install packages globally, install virtual environments, or have significant side effects outside of the project directory, unless you have explicit permission from the user. Treat anything outside of the project directory as read-only.
2. Do not run \`git push\` because it can break production (!) if the user was not expecting it. Don't run \`git commit\`, \`git rebase\`, or related commands unless you get explicit permission. If a user asks to commit changes, you can do so, but you should not invoke any further git commands beyond the git commit command.
3. Do not run scripts without asking. Especially don't run scripts that could run against the production environment or have permanent effects without explicit permission from the user. Don't run scripts with side effects without permission from the user unless they don't have much effect or are simple.
4. Be careful with any command that has big or irreversible effects. Anything that touches a production environment, servers, the database, or other systems that could be affected by a command should be run with explicit permission from the user.
5. Do not run too many commands in a row without pausing to check in with what the user wants to do next.
6. Do not use the run_terminal_command tool to create or edit files. Do not use \`cat\` or \`echo\` to create or edit files. You should instead write out <write_file> blocks for editing or creating files as detailed above in the <editing_instructions> block.
7. Do not install packages without asking, unless it is within a small, new-ish project. Users working on a larger project will want to manage packages themselves, so ask first.
8. Do not use the wrong package manager for the project. For example, if the project uses \`pnpm\` or \`bun\` or \`yarn\`, you should not use \`npm\`. Similarly not everyone uses \`pip\` for python, etc.
9. Do not use more than one run_terminal_command tool call in a single response. Wait for the tool results of each command before invoking the next one.
10. The user will not be able to interact with these processes, e.g. confirming the command. So if there's an opportunity to use "-y" or "--yes" flags, use them. Any command that prompts for confirmation will hang if you don't use the flags.

Notes:
- If the user references a specific file, it could be either from their cwd or from the project root. You **must** determine which they are referring to (either infer or ask). Then, you must specify the path relative to the project root (or use the cwd parameter)
- Commands can succeed without giving any output, e.g. if no type errors were found. So you may not always see output for successful executions.

${gitCommitGuidePrompt}

Example:
${getToolCallString('run_terminal_command', {
  command: 'echo "hello world"',
  process_type: 'SYNC',
})}
    `.trim(),
  },
  // Tool config: think_deeply.
  // Parameters: a single required non-empty `thought` string. The example
  // builds a multi-line thought by joining numbered steps with '\n'.
  {
    name: 'think_deeply',
    schema: z
      .object({
        thought: z
          .string()
          .min(1, 'Thought cannot be empty')
          .describe(
            `Detailed step-by-step analysis. Initially keep each step concise (max ~5-7 words per step).`
          ),
      })
      .describe(
        `Deeply consider complex tasks by brainstorming approaches and tradeoffs step-by-step.`
      ),
    additionalInfo: `
Use when user request:
- Explicitly asks for deep planning.
- Requires multi-file changes or complex logic.
- Involves significant architecture or potential edge cases.

Avoid for simple changes (e.g., single functions, minor edits).

This tool does not generate a tool result.

Example:
${getToolCallString('think_deeply', {
  thought: [
    '1. Check current user authentication',
    '2. Refactor auth logic into module',
    '3. Update imports across project',
    '4. Add tests for new module',
  ].join('\n'),
})}
    `.trim(),
  },
  // Tool config: create_plan.
  // Parameters: required non-empty `path` (a markdown file that will be
  // overwritten, per its description) and required non-empty `plan` text.
  {
    name: 'create_plan',
    schema: z
      .object({
        path: z
          .string()
          .min(1, 'Path cannot be empty')
          .describe(
            `The path including the filename of a markdown file that will be overwritten with the plan.`
          ),
        plan: z
          .string()
          .min(1, 'Plan cannot be empty')
          .describe(`A detailed plan to solve the user's request.`),
      })
      .describe(`Generate a detailed markdown plan for complex tasks.`),
    additionalInfo: `
Use when:
- User explicitly requests a detailed plan.
- Task involves significant architectural or multi-file changes.
- Only use this tool to create new plans. Do not modify existing plans using this tool—use the \`write_file\` tool instead for modifications.

Don't include:
- Goals, timelines, benefits, next steps.
- Background context or extensive explanations.

For a technical plan, act as an expert architect engineer and provide direction to your editor engineer.
- Study the change request and the current code.
- Describe how to modify the code to complete the request. The editor engineer will rely solely on your instructions, so make them unambiguous and complete.
- Explain all needed code changes clearly and completely, but concisely.
- Just show the changes needed.

What to include in the plan:
- Include code, but not full files of it. Write out key snippets of code and use lots of pseudo code. For example, interfaces between modules, function signatures, and other code that is not immediately obvious should be written out explicitly. Function and method bodies could be written out in pseudo code.
- Do not waste time on much background information, focus on the exact steps of the implementation.
- Do not wrap the path content in markdown code blocks, e.g. \`\`\`.

Do not include any of the following sections in the plan:
- goals
- a timeline or schedule
- benefits/key improvements
- next steps

After creating the plan, you should end turn to let the user review the plan.

Important: Use this tool sparingly. Do not use this tool more than once in a conversation, if a plan was already created, or for similar user requests.

Examples:
${getToolCallString('create_plan', {
  path: 'feature-x-plan.md',
  plan: [
    '1. Create module `auth.ts` in `/src/auth/`.',
    '```ts',
    'export function authenticate(user: User): boolean { /* pseudo-code logic */ }',
    '```',
    '2. Refactor existing auth logic into this module.',
    '3. Update imports across codebase.',
    '4. Write integration tests covering new module logic.',
  ].join('\n'),
})}
    `.trim(),
  },
  // Tool config: browser_logs.
  // Parameters: required non-empty `type` and `url`, plus an OPTIONAL
  // `waitUntil` enum. The prompt text below must describe `waitUntil` as
  // optional to stay in sync with the schema.
  {
    name: 'browser_logs',
    schema: z
      .object({
        type: z
          .string()
          .min(1, 'Type cannot be empty')
          .describe(
            'The type of browser action to perform (e.g., "navigate").'
          ),
        url: z
          .string()
          .min(1, 'URL cannot be empty')
          .describe('The URL to navigate to.'),
        waitUntil: z
          .enum(['load', 'domcontentloaded', 'networkidle0'])
          .optional()
          .describe(
            "When to consider navigation successful. Defaults to 'load'."
          ),
      })
      .describe(
        `In a headless browser, navigate to a web page and get the console logs after page load.`
      ),
    additionalInfo: `
Purpose: Use this tool to check the output of console.log or errors in order to debug issues, test functionality, or verify expected behavior.

IMPORTANT: Assume the user's development server is ALREADY running and active, unless you see logs indicating otherwise. Never start the user's development server for them, unless they ask you to do so.
Never offer to interact with the website aside from reading them (see available actions below). The user will manipulate the website themselves and bring you to the UI they want you to interact with.

### Response Analysis

After each action, you'll receive:
1. Success/failure status
2. New console logs since last action
3. Network requests and responses
4. JavaScript errors with stack traces

Use this data to:
- Verify expected behavior
- Debug issues
- Guide next actions
- Make informed decisions about fixes

### Best Practices

**Workflow**
- Navigate to the user's website, probably on localhost, but you can compare with the production site if you want.
- Scroll to the relevant section
- Take screenshots and analyze them to confirm changes
- Check network requests for anomalies

**Debugging Flow**
- Start with minimal reproduction steps
- Collect data at each step
- Analyze results before next action
- Take screenshots to track your changes after each UI change you make

There is currently only one type of browser action available:
Navigate:
   - Load a new URL in the current browser window and get the logs after page load.
   Params:
   - \`type\`: (required) Must be equal to 'navigate'
   - \`url\`: (required) The URL to navigate to.
   - \`waitUntil\`: (optional) One of 'load', 'domcontentloaded', 'networkidle0'. Defaults to 'load'.

Example:
${getToolCallString('browser_logs', {
  type: 'navigate',
  url: 'localhost:3000',
  waitUntil: 'domcontentloaded',
})}
    `.trim(),
  },
  // Tool config: kill_terminal.
  // Takes no parameters: the schema is an empty object whose transform always
  // yields a fresh `{}` as the parsed value.
  {
    name: 'kill_terminal',
    schema: z
      .object({})
      .transform(() => ({}))
      .describe(
        `Kill the current terminal process and restart it. Only available in agent mode.`
      ),
    additionalInfo: `
Purpose: Use this tool to forcefully terminate the current terminal session and start fresh. This is useful when a command is stuck or the terminal is in an unresponsive state.

This tool is only available in agent mode and will not work in regular Codebuff.

Example:
${getToolCallString('kill_terminal', {})}
    `.trim(),
  },
  // Tool config: sleep.
  // Parameters: a single required non-empty `seconds` value, carried as a
  // string (not a number) as its description states.
  {
    name: 'sleep',
    schema: z
      .object({
        seconds: z
          .string()
          .min(1, 'Seconds cannot be empty')
          .describe(`Number of seconds to sleep (as string)`),
      })
      .describe(
        `Sleep for a specified number of seconds. Only available in agent mode.`
      ),
    additionalInfo: `
Purpose: Use this tool to pause execution for a specified amount of time. This can be useful when waiting for processes to complete, giving time for services to start up, or adding delays between operations.

This tool is only available in agent mode and will not work in regular Codebuff.

Example:
${getToolCallString('sleep', { seconds: '5' })}
    `.trim(),
  },
  // Tool config: end_turn.
  // Takes no parameters: the schema is an empty object whose transform always
  // yields a fresh `{}` as the parsed value.
  {
    name: 'end_turn',
    schema: z
      .object({})
      .transform(() => ({}))
      .describe(
        `End your turn, regardless of any new tool results that might be coming. This will allow the user to type another prompt.`
      ),
    // The second paragraph embeds a rendered end_turn call inline, right after
    // a sample closing sentence.
    additionalInfo: `
Purpose: Use this tool if you have fully responded to the user and want to get their feedback. This ignores any tool results (from write_file, run_terminal_command, etc.), so be sure you are done before using it.

Make sure to use this tool if you want a response from the user and not the system. Otherwise, you may receive tool results from the previous tools. e.g. "Let me know if you need xyz!${getToolCallString('end_turn', {})}"

Example:
${getToolCallString('end_turn', {})}
    `.trim(),
  },
] as const

/**
 * Builds the markdown bullet list describing a tool's parameters.
 *
 * The schema is unwrapped through every `ZodEffects` layer (`.refine()`,
 * `.transform()`, ...) until the underlying schema is reached, mirroring the
 * unwrapping loop in `parseRawToolCall`. If that schema is a `ZodObject`, each
 * key of its shape becomes one line of the form
 * `- \`key\`: (required|optional) description`.
 *
 * @param toolName Name of the tool. For `str_replace`, the `old_vals` and
 *   `new_vals` keys are rendered as `old_{i}` and `new_{i}`.
 * @param schema Zod schema describing the tool's parameters.
 * @returns One markdown line per parameter, or `['None']` when the schema has
 *   no parameters or does not resolve to an object schema.
 */
function generateParamsList(
  toolName: string,
  schema: z.ZodType<any, any, any>
): string[] {
  // Peel off all effect wrappers, not just the outermost one, so schemas that
  // chain e.g. `.refine().transform()` still expose their parameters.
  let unwrapped: z.ZodTypeAny = schema
  while (unwrapped instanceof z.ZodEffects) {
    unwrapped = unwrapped.innerType()
  }

  if (!(unwrapped instanceof z.ZodObject)) {
    return ['None']
  }

  const shape: Record<string, z.ZodTypeAny> = unwrapped.shape
  const params = Object.entries(shape).map(([key, paramSchema]) => {
    // str_replace exposes its array parameters to the model as indexed keys.
    const isIndexedKey =
      toolName === 'str_replace' && (key === 'old_vals' || key === 'new_vals')
    const paramMarkdownName = isIndexedKey
      ? `\`${key.replace('_vals', '')}_{i}\``
      : `\`${key}\``

    // A parameter with a default may be omitted by the caller, so it is
    // documented as optional just like an explicit `.optional()`.
    const isOptional =
      paramSchema instanceof z.ZodOptional ||
      paramSchema instanceof z.ZodDefault
    const requiredOptionalMarker = isOptional ? '(optional)' : '(required)'

    // Fall back to the Zod type name when no description was attached.
    const descriptionText =
      paramSchema.description ||
      `(${paramSchema._def.typeName || 'parameter'})`

    return `- ${paramMarkdownName}: ${requiredOptionalMarker} ${descriptionText}`
  })

  return params.length > 0 ? params : ['None']
}

/**
 * Assembles the full markdown description for one tool.
 *
 * The sections, in order, are: a `### <toolName>` heading, the schema's own
 * description, the parameter list produced by `generateParamsList`, and the
 * tool's additional info. They are passed through `buildArray` and joined
 * with blank lines.
 *
 * @param toolName Name of the tool, used for the heading.
 * @param schema Zod schema whose description and parameters are rendered.
 * @param additionalInfo Free-form text appended as the last section.
 * @returns The markdown description.
 */
function buildToolDescription(
  toolName: string,
  schema: z.ZodType<any, any, any>,
  additionalInfo: string
): string {
  const paramLines = generateParamsList(toolName, schema)
  // `['None']` is the sentinel for "this tool takes no parameters".
  const hasNoParams = paramLines.length === 1 && paramLines[0] === 'None'

  const paramsSection = hasNoParams
    ? 'Params: None'
    : paramLines.length > 0
      ? `Params:\n${paramLines.join('\n')}`
      : ''

  return buildArray([
    `### ${toolName}`,
    schema.description || '',
    paramsSection,
    additionalInfo,
  ]).join('\n\n')
}

// Name plus rendered markdown description for every entry in toolConfigsList.
const tools = toolConfigsList.map(({ name, schema, additionalInfo }) => {
  const description = buildToolDescription(name, schema, additionalInfo)
  return { name, description }
}) as { name: GlobalToolNameImport; description: string }[]

// Subset of `tools` limited to the terminal/flow-control tool names below.
const managerTools = tools.filter(({ name }) => {
  const allowedNames = [
    'run_terminal_command',
    'kill_terminal',
    'sleep',
    'end_turn',
  ]
  return allowedNames.includes(name)
})

// Lookup table from tool name to that tool's zod schema, built from
// toolConfigsList. The cast restores the per-name schema type that
// Object.fromEntries loses, so toolSchemas['some_tool'] is typed as the schema
// of the config whose `name` is 'some_tool'.
const toolSchemas = Object.fromEntries(
  toolConfigsList.map((tool) => [tool.name, tool.schema])
) as {
  [K in (typeof toolConfigsList)[number]['name']]: Extract<
    (typeof toolConfigsList)[number],
    { name: K }
  >['schema']
}

/** Union of the element types of `toolConfigsList` (one member per tool config). */
type ToolConfig = (typeof toolConfigsList)[number]

/**
 * A validated tool call: a union with one member per tool, pairing the tool's
 * `name` with `parameters` typed as the inferred output of that tool's schema.
 */
export type ToolCall = {
  [K in ToolConfig as K['name']]: {
    name: K['name']
    parameters: z.infer<K['schema']>
  }
}[ToolConfig['name']]

/**
 * Result returned by `parseRawToolCall` when a raw tool call cannot be turned
 * into a `ToolCall`.
 */
export type ToolCallError = {
  /** Tool name as received, if any. */
  name?: string
  /** The raw, unvalidated string parameters of the call. */
  parameters: Record<string, string>
  /** Human-readable explanation of why the call was rejected. */
  error: string
}

/**
 * Validates a raw tool call (name plus string parameters) against the schema
 * registered for that tool.
 *
 * Parameters named `<base>_<index>` are folded, in ascending index order, into
 * an array parameter `<base>_vals` when the tool's schema declares
 * `<base>_vals` as a `ZodArray`; other parameters are passed through as-is.
 *
 * @param rawToolCall Tool name and raw string parameters as received.
 * @returns The parsed `ToolCall` on success, otherwise a `ToolCallError`
 *   describing an unknown tool name or the schema validation issues.
 */
export function parseRawToolCall(rawToolCall: {
  name: string
  parameters: Record<string, string>
}): ToolCall | ToolCallError {
  const name = rawToolCall.name

  // Own-property check on purpose: `name in toolSchemas` would also accept
  // inherited keys such as "constructor" or "toString", and the code below
  // would then throw on a non-schema value instead of returning an error.
  if (!Object.prototype.hasOwnProperty.call(toolSchemas, name)) {
    return {
      name,
      parameters: rawToolCall.parameters,
      error: `Tool ${name} not found`,
    }
  }
  const validName = name as GlobalToolNameImport

  // Unwrap ZodEffects layers to reach the underlying object schema.
  // NOTE(review): validation below runs against the unwrapped schema, so any
  // refinements/transforms on the wrappers are not applied — confirm intended.
  let schema: z.ZodObject<any> | z.ZodEffects<any> = toolSchemas[validName]
  while (schema instanceof z.ZodEffects) {
    schema = schema.innerType()
  }
  const schemaShape = schema.shape

  const processedParameters: Record<string, string | string[]> = {
    ...rawToolCall.parameters,
  }

  const arrayParamPattern = /^(.+)_(\d+)$/
  // Indexed values are collected per array key in a Map rather than a sparse
  // array, so an arbitrarily large index supplied in the call cannot create a
  // huge array length or be silently dropped.
  const arrayParamsCollector: Record<string, Map<number, string>> = {}

  for (const [key, value] of Object.entries(rawToolCall.parameters)) {
    const match = key.match(arrayParamPattern)
    if (!match) {
      continue
    }
    const [, paramNameBase, indexStr] = match
    const index = parseInt(indexStr, 10)
    const arraySchemaKey = `${paramNameBase}_vals`

    if (
      schemaShape &&
      schemaShape[arraySchemaKey] &&
      schemaShape[arraySchemaKey] instanceof z.ZodArray
    ) {
      let valuesByIndex = arrayParamsCollector[arraySchemaKey]
      if (!valuesByIndex) {
        valuesByIndex = new Map<number, string>()
        arrayParamsCollector[arraySchemaKey] = valuesByIndex
      }
      valuesByIndex.set(index, value)
      delete processedParameters[key]
    }
  }

  for (const [arrayKey, valuesByIndex] of Object.entries(
    arrayParamsCollector
  )) {
    // Gaps in the index sequence are skipped; order follows the index.
    processedParameters[arrayKey] = Array.from(valuesByIndex.entries())
      .sort(([a], [b]) => a - b)
      .map(([, value]) => value)
  }

  const result = schema.safeParse(processedParameters)
  if (!result.success) {
    return {
      name: validName,
      parameters: rawToolCall.parameters,
      error: `Invalid parameters for ${validName}: ${JSON.stringify(result.error.issues, null, 2)}`,
    }
  }

  return { name: validName, parameters: result.data } as ToolCall
}

/** Names of all tools, in the order they appear in `tools`. */
export const TOOL_LIST = tools.map(({ name }) => name)
/** Any one of the names in `TOOL_LIST`. */
export type ToolName = (typeof TOOL_LIST)[number]

// Tool names treated as ending the response.
// NOTE(review): presumably the response is cut off after one of these tools so
// that its result can be supplied before continuing — confirm against callers.
export const TOOLS_WHICH_END_THE_RESPONSE = [
  'read_files',
  'find_files',
  'run_terminal_command',
  'code_search',
]

/**
 * Builds the "# Tools" instruction text: the tool-call formatting rules, XML
 * entity requirements, an example call rendered with `getToolCallString`,
 * working-directory and optimization guidance, notes on tool results, and
 * finally the supplied tool descriptions joined by blank lines.
 *
 * @param toolDescriptions Markdown descriptions of the tools to list.
 * @returns The complete instructions string.
 */
export const getToolsInstructions = (toolDescriptions: string[]) => `
# Tools

You (Buffy) have access to the following tools. Call them when needed.

## [CRITICAL] Formatting Requirements

Tool calls use a specific XML-like format. Adhere *precisely* to this nested element structure:

<tool_name>
<parameter1_name>value1</parameter1_name>
<parameter2_name>value2</parameter2_name>
...
</tool_name>

### XML Entities

**ALL** XML (inside or outside tool calls) will be interpreted as tool calls or tool parameters. You **MUST** use XML entities, e.g. \`&lt;some_tag>\` or \`</some_tag&gt;\` to:
- Display XML to the user without executing a tool call
- Have XML within a tool parameter's value such as writing to a file

This also means that if you wish to write the literal string \`&lt;\` to a file or display that to a user, you MUST write \`&amp;lt;\`.

### Commentary

Provide commentary *around* your tool calls (explaining your actions).

However, **DO NOT** narrate the tool or parameter names themselves.

### Array Params

Arrays with name "param_name_vals" should be formatted as individual parameters, each called "param_name_{i}". They must start with i=0 and increment by 1.

### Example

User: can you update the console logs in example/file.ts?
Assistant: Sure thing! Let's update that file!

${getToolCallString('write_file', {
  path: 'path/to/example/file.ts',
  content: "console.log('Hello from Buffy!');",
  // old_0: '// Replace this line with a fun greeting',
  // new_0: "console.log('Hello from Buffy!');",
  // old_1: "console.log('Old console line to delete');\n",
  // new_1: '',
})}

All done with the update!
User: thanks it worked! :)

## Working Directory

All tools will be run from the **project root**.

However, most of the time, the user will refer to files from their own cwd. You must be cognizant of the user's cwd at all times, including but not limited to:
- Writing to files (write out the entire relative path)
- Running terminal commands (use the \`cwd\` parameter)

## Optimizations

All tools are very slow, with runtime scaling with the amount of text in the parameters. Prefer to write AS LITTLE TEXT AS POSSIBLE to accomplish the task.

When using write_file, make sure to only include a few lines of context and not the entire file.

## Tool Results

Tool results will be provided by the user's *system* (and **NEVER** by the assistant).

The user does not know about any system messages or system instructions, including tool results.

The user does not need to know about the exact results of these tools, especially if they are warnings or info logs. Just correct yourself in the next response without mentioning anything to the user. e.g., do not mention any XML **warnings** (but be sure to correct the next response), but XML **errors** should be noted to the user.

## List of Tools

These are the tools that you (Buffy) can use. The user cannot see these descriptions, so you should not reference any tool names, parameters, or descriptions.

${toolDescriptions.join('\n\n')}
`

/**
 * Asks the model to rewrite a subgoal context according to update
 * instructions and returns the rewritten context.
 *
 * The assistant turn is pre-filled with `<new_context>`, so the reply is
 * expected to continue inside that tag; everything from the first
 * `</new_context>` onward is discarded and the remainder is trimmed.
 *
 * @param context The current context text.
 * @param updateInstructions Instructions describing how to change the context.
 * @returns The rewritten context, trimmed.
 */
export async function updateContext(
  context: string,
  updateInstructions: string
) {
  const rewriteRequest = `
We're working on a project. We can have multiple subgoals. Each subgoal can have an objective, status, plan, and multiple updates that describe the progress of the subgoal.

The following is an example of a schema of a subgoal. It is for illistrative purposes and is not relevant otherwise. Use it as a reference to understand how to update the context.
Example schema:
<subgoal>
<id>1</id>
<objective>Fix the tests</objective>
<status>COMPLETE</status>
<plan>Run them, find the error, fix it</plan>
<log>Ran the tests and traced the error to component foo.</log>
<log>Modified the foo component to fix the error</log>
<log>Reran the tests and they passed.</log>
</subgoal>

Here is the initial context:
<initial_context>
${context}
</initial_context>

Here are the update instructions:
<update_instructions>
${updateInstructions}
</update_instructions>

Please rewrite the entire context using the update instructions in a <new_context> tag. Try to perserve the original context as much as possible, subject to the update instructions. Return the new context only — do not include any other text or wrapper xml/markdown formatting e.g. please omit <initial_context> tags.`

  const reply = await promptFlashWithFallbacks(
    [
      { role: 'user' as const, content: rewriteRequest },
      // Pre-filled assistant turn: the reply continues inside <new_context>.
      { role: 'assistant' as const, content: '<new_context>' },
    ],
    {
      model: models.gemini2flash,
      clientSessionId: 'strange-loop',
      fingerprintId: 'strange-loop',
      userInputId: 'strange-loop',
      userId: TEST_USER_ID,
    }
  )

  // Keep only the text before the first closing tag, if there is one.
  const closingTagAt = reply.indexOf('</new_context>')
  const rewritten = closingTagAt === -1 ? reply : reply.slice(0, closingTagAt)
  return rewritten.trim()
}

/**
 * Turns `add_subgoal` / `update_subgoal` tool calls into update instructions
 * and applies them to the agent context through `updateContext`.
 *
 * @param agentContext The current context text.
 * @param toolCalls Subgoal tool calls to apply, in order.
 * @returns The context returned by `updateContext`.
 */
export async function updateContextFromToolCalls(
  agentContext: string,
  toolCalls: Extract<ToolCall, { name: 'update_subgoal' | 'add_subgoal' }>[]
) {
  const instructions: string[] = []

  for (const call of toolCalls) {
    switch (call.name) {
      case 'add_subgoal':
        instructions.push(
          `Please add the following subgoal:\n${renderSubgoalUpdate(
            call.parameters as any
          )}`
        )
        break
      case 'update_subgoal':
        instructions.push(
          `Please update the subgoal with the matching id. For <status> and <plan>, if there are already tags, update them to the new values, keeping only one. For <log>, please keep all the existing logs and append a new <log> entry at the end of the subgoal. Finally, for any unmentioned parameters, do not change them in the existing subgoal:\n${renderSubgoalUpdate(
            call.parameters as any
          )}`
        )
        break
    }
  }

  // One instruction per tool call, separated by blank lines.
  const combinedInstructions = instructions.join('\n\n')
  return await updateContext(agentContext, combinedInstructions)
}

/**
 * Reads several project files as UTF-8 text.
 *
 * Each path is joined onto `projectPath`. A path that resolves outside the
 * project directory is rejected; a path that cannot be read (missing file,
 * directory, permission error, ...) yields `null` instead of failing.
 *
 * Containment is checked lexically with `path.relative`; symbolic links are
 * not resolved.
 *
 * @param paths File paths relative to the project directory.
 * @param projectPath Root directory of the project.
 * @returns Map from each requested path to its contents, or `null` if the
 *   file could not be read.
 * @throws Error if any path resolves outside `projectPath`.
 */
export async function readFiles(
  paths: string[],
  projectPath: string
): Promise<Record<string, string | null>> {
  const results: Record<string, string | null> = {}
  for (const filePath of paths) {
    const fullPath = path.join(projectPath, filePath)

    // A plain string-prefix test would accept sibling directories that share
    // a prefix (e.g. "/proj-secret" for root "/proj") and would reject valid
    // paths when projectPath is not normalised (e.g. "./proj"). Compare the
    // relative path from the root instead.
    const relativeToRoot = path.relative(projectPath, fullPath)
    const escapesRoot =
      relativeToRoot === '..' ||
      relativeToRoot.startsWith(`..${path.sep}`) ||
      path.isAbsolute(relativeToRoot)
    if (escapesRoot) {
      throw new Error('Cannot access files outside project directory')
    }

    try {
      results[filePath] = await fs.promises.readFile(fullPath, 'utf-8')
    } catch {
      // Unreadable files are reported as null rather than aborting the batch.
      results[filePath] = null
    }
  }
  return results
}

export async function writeFile(
  filePath: string,
  content: string,
  projectPath: string
) {
  const fullPath = path.join(projectPath, filePath)